{"current_steps": 1, "total_steps": 1730, "loss": 1.5901, "learning_rate": 0.0, "epoch": 0.0011552346570397113, "percentage": 0.06, "elapsed_time": "0:00:48", "remaining_time": "23:25:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2, "total_steps": 1730, "loss": 1.583, "learning_rate": 5.017166594399687e-07, "epoch": 0.0023104693140794225, "percentage": 0.12, "elapsed_time": "0:01:22", "remaining_time": "19:48:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3, "total_steps": 1730, "loss": 1.6153, "learning_rate": 7.952020911994375e-07, "epoch": 0.0034657039711191336, "percentage": 0.17, "elapsed_time": "0:01:56", "remaining_time": "18:35:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4, "total_steps": 1730, "loss": 1.5939, "learning_rate": 1.0034333188799374e-06, "epoch": 0.004620938628158845, "percentage": 0.23, "elapsed_time": "0:02:29", "remaining_time": "17:57:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5, "total_steps": 1730, "loss": 1.6126, "learning_rate": 1.164950007226698e-06, "epoch": 0.005776173285198556, "percentage": 0.29, "elapsed_time": "0:03:03", "remaining_time": "17:35:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6, "total_steps": 1730, "loss": 1.597, "learning_rate": 1.2969187506394062e-06, "epoch": 0.006931407942238267, "percentage": 0.35, "elapsed_time": "0:03:36", "remaining_time": "17:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7, "total_steps": 1730, "loss": 1.584, "learning_rate": 1.4084967333570947e-06, "epoch": 0.008086642599277978, "percentage": 0.4, "elapsed_time": "0:04:10", "remaining_time": "17:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8, "total_steps": 1730, "loss": 1.5333, "learning_rate": 1.5051499783199062e-06, "epoch": 0.00924187725631769, "percentage": 0.46, "elapsed_time": "0:04:44", "remaining_time": "16:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9, "total_steps": 1730, "loss": 1.5173, "learning_rate": 1.590404182398875e-06, "epoch": 0.0103971119133574, "percentage": 0.52, "elapsed_time": "0:05:17", "remaining_time": "16:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 1730, "loss": 1.4693, "learning_rate": 1.666666666666667e-06, "epoch": 0.011552346570397111, "percentage": 0.58, "elapsed_time": "0:05:53", "remaining_time": "16:52:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11, "total_steps": 1730, "loss": 1.3613, "learning_rate": 1.7356544752637086e-06, "epoch": 0.012707581227436824, "percentage": 0.64, "elapsed_time": "0:06:26", "remaining_time": "16:47:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12, "total_steps": 1730, "loss": 1.3096, "learning_rate": 1.798635410079375e-06, "epoch": 0.013862815884476534, "percentage": 0.69, "elapsed_time": "0:07:00", "remaining_time": "16:43:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13, "total_steps": 1730, "loss": 1.3096, "learning_rate": 1.8565722538447281e-06, "epoch": 0.015018050541516245, "percentage": 0.75, "elapsed_time": "0:07:34", "remaining_time": "16:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14, "total_steps": 1730, "loss": 1.3067, "learning_rate": 1.9102133927970633e-06, "epoch": 0.016173285198555955, "percentage": 0.81, "elapsed_time": "0:08:08", "remaining_time": "16:38:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15, "total_steps": 1730, "loss": 1.2191, "learning_rate": 1.960152098426136e-06, "epoch": 0.017328519855595668, "percentage": 0.87, "elapsed_time": "0:08:43", "remaining_time": "16:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16, "total_steps": 1730, "loss": 1.2029, "learning_rate": 2.0068666377598747e-06, "epoch": 0.01848375451263538, "percentage": 0.92, "elapsed_time": "0:09:17", "remaining_time": "16:34:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17, "total_steps": 1730, "loss": 1.2076, "learning_rate": 2.0507482022971233e-06, "epoch": 0.01963898916967509, "percentage": 0.98, "elapsed_time": "0:09:51", "remaining_time": "16:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18, "total_steps": 1730, "loss": 1.1862, "learning_rate": 2.0921208418388438e-06, "epoch": 0.0207942238267148, "percentage": 1.04, "elapsed_time": "0:10:24", "remaining_time": "16:30:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19, "total_steps": 1730, "loss": 1.1844, "learning_rate": 2.1312560015880486e-06, "epoch": 0.021949458483754514, "percentage": 1.1, "elapsed_time": "0:10:58", "remaining_time": "16:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 1730, "loss": 1.1763, "learning_rate": 2.1683833261066357e-06, "epoch": 0.023104693140794223, "percentage": 1.16, "elapsed_time": "0:11:32", "remaining_time": "16:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21, "total_steps": 1730, "loss": 1.1683, "learning_rate": 2.2036988245565326e-06, "epoch": 0.024259927797833935, "percentage": 1.21, "elapsed_time": "0:12:06", "remaining_time": "16:25:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22, "total_steps": 1730, "loss": 1.1119, "learning_rate": 2.2373711347036773e-06, "epoch": 0.025415162454873647, "percentage": 1.27, "elapsed_time": "0:12:40", "remaining_time": "16:24:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23, "total_steps": 1730, "loss": 1.1001, "learning_rate": 2.269546393362655e-06, "epoch": 0.026570397111913356, "percentage": 1.33, "elapsed_time": "0:13:14", "remaining_time": "16:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24, "total_steps": 1730, "loss": 1.1154, "learning_rate": 2.3003520695193436e-06, "epoch": 0.02772563176895307, "percentage": 1.39, "elapsed_time": "0:13:48", "remaining_time": "16:22:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25, "total_steps": 1730, "loss": 1.0793, "learning_rate": 2.329900014453396e-06, "epoch": 0.02888086642599278, "percentage": 1.45, "elapsed_time": "0:14:22", "remaining_time": "16:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26, "total_steps": 1730, "loss": 1.0672, "learning_rate": 2.358288913284697e-06, "epoch": 0.03003610108303249, "percentage": 1.5, "elapsed_time": "0:14:56", "remaining_time": "16:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27, "total_steps": 1730, "loss": 1.0833, "learning_rate": 2.385606273598312e-06, "epoch": 0.031191335740072202, "percentage": 1.56, "elapsed_time": "0:15:30", "remaining_time": "16:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28, "total_steps": 1730, "loss": 1.0795, "learning_rate": 2.4119300522370323e-06, "epoch": 0.03234657039711191, "percentage": 1.62, "elapsed_time": "0:16:04", "remaining_time": "16:17:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29, "total_steps": 1730, "loss": 1.0599, "learning_rate": 2.4373299964982607e-06, "epoch": 0.03350180505415162, "percentage": 1.68, "elapsed_time": "0:16:38", "remaining_time": "16:16:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 1730, "loss": 1.066, "learning_rate": 2.4618687578661045e-06, "epoch": 0.034657039711191336, "percentage": 1.73, "elapsed_time": "0:17:12", "remaining_time": "16:14:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 31, "total_steps": 1730, "loss": 1.0332, "learning_rate": 2.4856028230571215e-06, "epoch": 0.03581227436823105, "percentage": 1.79, "elapsed_time": "0:17:45", "remaining_time": "16:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 32, "total_steps": 1730, "loss": 1.0566, "learning_rate": 2.5085832971998437e-06, "epoch": 0.03696750902527076, "percentage": 1.85, "elapsed_time": "0:18:19", "remaining_time": "16:12:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 33, "total_steps": 1730, "loss": 1.0351, "learning_rate": 2.530856566463146e-06, "epoch": 0.03812274368231047, "percentage": 1.91, "elapsed_time": "0:18:53", "remaining_time": "16:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 34, "total_steps": 1730, "loss": 1.0164, "learning_rate": 2.5524648617370923e-06, "epoch": 0.03927797833935018, "percentage": 1.97, "elapsed_time": "0:19:26", "remaining_time": "16:10:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 1730, "loss": 1.0125, "learning_rate": 2.5734467405837933e-06, "epoch": 0.04043321299638989, "percentage": 2.02, "elapsed_time": "0:20:01", "remaining_time": "16:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 36, "total_steps": 1730, "loss": 1.0392, "learning_rate": 2.5938375012788124e-06, "epoch": 0.0415884476534296, "percentage": 2.08, "elapsed_time": "0:20:34", "remaining_time": "16:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 37, "total_steps": 1730, "loss": 1.0244, "learning_rate": 2.6136695401116585e-06, "epoch": 0.042743682310469315, "percentage": 2.14, "elapsed_time": "0:21:08", "remaining_time": "16:07:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 38, "total_steps": 1730, "loss": 0.9972, "learning_rate": 2.632972661028017e-06, "epoch": 0.04389891696750903, "percentage": 2.2, "elapsed_time": "0:21:42", "remaining_time": "16:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 39, "total_steps": 1730, "loss": 1.0142, "learning_rate": 2.6517743450441657e-06, "epoch": 0.04505415162454874, "percentage": 2.25, "elapsed_time": "0:22:16", "remaining_time": "16:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 1730, "loss": 0.9995, "learning_rate": 2.6700999855466042e-06, "epoch": 0.046209386281588445, "percentage": 2.31, "elapsed_time": "0:22:50", "remaining_time": "16:04:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 41, "total_steps": 1730, "loss": 0.998, "learning_rate": 2.687973094532893e-06, "epoch": 0.04736462093862816, "percentage": 2.37, "elapsed_time": "0:23:24", "remaining_time": "16:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 42, "total_steps": 1730, "loss": 0.9798, "learning_rate": 2.705415483996501e-06, "epoch": 0.04851985559566787, "percentage": 2.43, "elapsed_time": "0:23:58", "remaining_time": "16:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 43, "total_steps": 1730, "loss": 0.9879, "learning_rate": 2.722447425965978e-06, "epoch": 0.04967509025270758, "percentage": 2.49, "elapsed_time": "0:24:32", "remaining_time": "16:03:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 44, "total_steps": 1730, "loss": 0.9722, "learning_rate": 2.739087794143646e-06, "epoch": 0.050830324909747295, "percentage": 2.54, "elapsed_time": "0:25:07", "remaining_time": "16:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 45, "total_steps": 1730, "loss": 0.9491, "learning_rate": 2.7553541896255733e-06, "epoch": 0.05198555956678701, "percentage": 2.6, "elapsed_time": "0:25:41", "remaining_time": "16:02:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 46, "total_steps": 1730, "loss": 1.0037, "learning_rate": 2.771263052802624e-06, "epoch": 0.05314079422382671, "percentage": 2.66, "elapsed_time": "0:26:15", "remaining_time": "16:01:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 47, "total_steps": 1730, "loss": 0.971, "learning_rate": 2.7868297632261957e-06, "epoch": 0.054296028880866425, "percentage": 2.72, "elapsed_time": "0:26:49", "remaining_time": "16:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 48, "total_steps": 1730, "loss": 1.0084, "learning_rate": 2.8020687289593126e-06, "epoch": 0.05545126353790614, "percentage": 2.77, "elapsed_time": "0:27:23", "remaining_time": "15:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 49, "total_steps": 1730, "loss": 0.9507, "learning_rate": 2.8169934667141895e-06, "epoch": 0.05660649819494585, "percentage": 2.83, "elapsed_time": "0:27:57", "remaining_time": "15:59:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 1730, "loss": 0.973, "learning_rate": 2.8316166738933647e-06, "epoch": 0.05776173285198556, "percentage": 2.89, "elapsed_time": "0:28:31", "remaining_time": "15:58:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 51, "total_steps": 1730, "loss": 0.9758, "learning_rate": 2.845950293496561e-06, "epoch": 0.058916967509025274, "percentage": 2.95, "elapsed_time": "0:29:05", "remaining_time": "15:57:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 52, "total_steps": 1730, "loss": 0.9991, "learning_rate": 2.8600055727246655e-06, "epoch": 0.06007220216606498, "percentage": 3.01, "elapsed_time": "0:29:38", "remaining_time": "15:56:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 53, "total_steps": 1730, "loss": 0.9661, "learning_rate": 2.8737931160013154e-06, "epoch": 0.06122743682310469, "percentage": 3.06, "elapsed_time": "0:30:12", "remaining_time": "15:55:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 54, "total_steps": 1730, "loss": 0.9773, "learning_rate": 2.887322933038281e-06, "epoch": 0.062382671480144404, "percentage": 3.12, "elapsed_time": "0:30:46", "remaining_time": "15:55:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 55, "total_steps": 1730, "loss": 0.9644, "learning_rate": 2.900604482490407e-06, "epoch": 0.06353790613718412, "percentage": 3.18, "elapsed_time": "0:31:20", "remaining_time": "15:54:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 56, "total_steps": 1730, "loss": 0.9701, "learning_rate": 2.9136467116770013e-06, "epoch": 0.06469314079422382, "percentage": 3.24, "elapsed_time": "0:31:54", "remaining_time": "15:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 57, "total_steps": 1730, "loss": 0.9314, "learning_rate": 2.926458092787486e-06, "epoch": 0.06584837545126354, "percentage": 3.29, "elapsed_time": "0:32:28", "remaining_time": "15:53:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 58, "total_steps": 1730, "loss": 0.9489, "learning_rate": 2.9390466559382293e-06, "epoch": 0.06700361010830325, "percentage": 3.35, "elapsed_time": "0:33:01", "remaining_time": "15:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 59, "total_steps": 1730, "loss": 0.9697, "learning_rate": 2.951420019403574e-06, "epoch": 0.06815884476534297, "percentage": 3.41, "elapsed_time": "0:33:35", "remaining_time": "15:51:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 1730, "loss": 0.923, "learning_rate": 2.963585417306073e-06, "epoch": 0.06931407942238267, "percentage": 3.47, "elapsed_time": "0:34:09", "remaining_time": "15:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 61, "total_steps": 1730, "loss": 0.9448, "learning_rate": 2.9755497250179457e-06, "epoch": 0.07046931407942238, "percentage": 3.53, "elapsed_time": "0:34:43", "remaining_time": "15:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 62, "total_steps": 1730, "loss": 0.9521, "learning_rate": 2.98731948249709e-06, "epoch": 0.0716245487364621, "percentage": 3.58, "elapsed_time": "0:35:16", "remaining_time": "15:49:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 63, "total_steps": 1730, "loss": 0.9429, "learning_rate": 2.9989009157559695e-06, "epoch": 0.0727797833935018, "percentage": 3.64, "elapsed_time": "0:35:50", "remaining_time": "15:48:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 64, "total_steps": 1730, "loss": 0.9641, "learning_rate": 3.0102999566398123e-06, "epoch": 0.07393501805054152, "percentage": 3.7, "elapsed_time": "0:36:23", "remaining_time": "15:47:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 65, "total_steps": 1730, "loss": 0.9555, "learning_rate": 3.021522261071426e-06, "epoch": 0.07509025270758123, "percentage": 3.76, "elapsed_time": "0:36:57", "remaining_time": "15:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 66, "total_steps": 1730, "loss": 0.9531, "learning_rate": 3.0325732259031143e-06, "epoch": 0.07624548736462095, "percentage": 3.82, "elapsed_time": "0:37:31", "remaining_time": "15:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 67, "total_steps": 1730, "loss": 0.9358, "learning_rate": 3.0434580045013773e-06, "epoch": 0.07740072202166065, "percentage": 3.87, "elapsed_time": "0:38:06", "remaining_time": "15:45:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 68, "total_steps": 1730, "loss": 0.9496, "learning_rate": 3.054181521177061e-06, "epoch": 0.07855595667870036, "percentage": 3.93, "elapsed_time": "0:38:39", "remaining_time": "15:44:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 69, "total_steps": 1730, "loss": 0.931, "learning_rate": 3.064748484562093e-06, "epoch": 0.07971119133574008, "percentage": 3.99, "elapsed_time": "0:39:13", "remaining_time": "15:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 1730, "loss": 0.9674, "learning_rate": 3.075163400023762e-06, "epoch": 0.08086642599277978, "percentage": 4.05, "elapsed_time": "0:39:47", "remaining_time": "15:43:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 71, "total_steps": 1730, "loss": 0.9504, "learning_rate": 3.085430581198459e-06, "epoch": 0.0820216606498195, "percentage": 4.1, "elapsed_time": "0:40:21", "remaining_time": "15:43:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 72, "total_steps": 1730, "loss": 0.9513, "learning_rate": 3.095554160718781e-06, "epoch": 0.0831768953068592, "percentage": 4.16, "elapsed_time": "0:40:55", "remaining_time": "15:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 73, "total_steps": 1730, "loss": 0.9152, "learning_rate": 3.1055381002007602e-06, "epoch": 0.08433212996389891, "percentage": 4.22, "elapsed_time": "0:41:29", "remaining_time": "15:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 74, "total_steps": 1730, "loss": 0.9247, "learning_rate": 3.1153861995516275e-06, "epoch": 0.08548736462093863, "percentage": 4.28, "elapsed_time": "0:42:02", "remaining_time": "15:40:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 75, "total_steps": 1730, "loss": 0.9285, "learning_rate": 3.1251021056528336e-06, "epoch": 0.08664259927797834, "percentage": 4.34, "elapsed_time": "0:42:37", "remaining_time": "15:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 76, "total_steps": 1730, "loss": 0.928, "learning_rate": 3.1346893204679857e-06, "epoch": 0.08779783393501805, "percentage": 4.39, "elapsed_time": "0:43:11", "remaining_time": "15:39:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 77, "total_steps": 1730, "loss": 0.9135, "learning_rate": 3.1441512086208035e-06, "epoch": 0.08895306859205776, "percentage": 4.45, "elapsed_time": "0:43:45", "remaining_time": "15:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 78, "total_steps": 1730, "loss": 0.9306, "learning_rate": 3.1534910044841343e-06, "epoch": 0.09010830324909748, "percentage": 4.51, "elapsed_time": "0:44:19", "remaining_time": "15:38:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 79, "total_steps": 1730, "loss": 0.9475, "learning_rate": 3.1627118188174026e-06, "epoch": 0.09126353790613718, "percentage": 4.57, "elapsed_time": "0:44:52", "remaining_time": "15:37:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 1730, "loss": 0.9445, "learning_rate": 3.171816644986573e-06, "epoch": 0.09241877256317689, "percentage": 4.62, "elapsed_time": "0:45:26", "remaining_time": "15:37:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 81, "total_steps": 1730, "loss": 0.9388, "learning_rate": 3.18080836479775e-06, "epoch": 0.09357400722021661, "percentage": 4.68, "elapsed_time": "0:46:00", "remaining_time": "15:36:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 82, "total_steps": 1730, "loss": 0.9097, "learning_rate": 3.1896897539728615e-06, "epoch": 0.09472924187725631, "percentage": 4.74, "elapsed_time": "0:46:34", "remaining_time": "15:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 83, "total_steps": 1730, "loss": 0.9216, "learning_rate": 3.1984634872934573e-06, "epoch": 0.09588447653429603, "percentage": 4.8, "elapsed_time": "0:47:08", "remaining_time": "15:35:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 84, "total_steps": 1730, "loss": 0.9397, "learning_rate": 3.2071321434364693e-06, "epoch": 0.09703971119133574, "percentage": 4.86, "elapsed_time": "0:47:42", "remaining_time": "15:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 85, "total_steps": 1730, "loss": 0.9166, "learning_rate": 3.2156982095238214e-06, "epoch": 0.09819494584837545, "percentage": 4.91, "elapsed_time": "0:48:16", "remaining_time": "15:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 86, "total_steps": 1730, "loss": 0.9213, "learning_rate": 3.2241640854059465e-06, "epoch": 0.09935018050541516, "percentage": 4.97, "elapsed_time": "0:48:50", "remaining_time": "15:33:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 87, "total_steps": 1730, "loss": 0.9292, "learning_rate": 3.232532087697698e-06, "epoch": 0.10050541516245487, "percentage": 5.03, "elapsed_time": "0:49:24", "remaining_time": "15:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 88, "total_steps": 1730, "loss": 0.923, "learning_rate": 3.2408044535836154e-06, "epoch": 0.10166064981949459, "percentage": 5.09, "elapsed_time": "0:49:58", "remaining_time": "15:32:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 89, "total_steps": 1730, "loss": 0.9252, "learning_rate": 3.248983344408188e-06, "epoch": 0.1028158844765343, "percentage": 5.14, "elapsed_time": "0:50:32", "remaining_time": "15:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 1730, "loss": 0.9423, "learning_rate": 3.257070849065542e-06, "epoch": 0.10397111913357401, "percentage": 5.2, "elapsed_time": "0:51:06", "remaining_time": "15:31:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 91, "total_steps": 1730, "loss": 0.9337, "learning_rate": 3.2650689872018227e-06, "epoch": 0.10512635379061372, "percentage": 5.26, "elapsed_time": "0:51:39", "remaining_time": "15:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 92, "total_steps": 1730, "loss": 0.9134, "learning_rate": 3.2729797122425927e-06, "epoch": 0.10628158844765342, "percentage": 5.32, "elapsed_time": "0:52:13", "remaining_time": "15:29:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 93, "total_steps": 1730, "loss": 0.9182, "learning_rate": 3.280804914256559e-06, "epoch": 0.10743682310469314, "percentage": 5.38, "elapsed_time": "0:52:46", "remaining_time": "15:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 94, "total_steps": 1730, "loss": 0.883, "learning_rate": 3.2885464226661647e-06, "epoch": 0.10859205776173285, "percentage": 5.43, "elapsed_time": "0:53:20", "remaining_time": "15:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 95, "total_steps": 1730, "loss": 0.9009, "learning_rate": 3.2962060088147467e-06, "epoch": 0.10974729241877257, "percentage": 5.49, "elapsed_time": "0:53:54", "remaining_time": "15:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 96, "total_steps": 1730, "loss": 0.9264, "learning_rate": 3.303785388399281e-06, "epoch": 0.11090252707581227, "percentage": 5.55, "elapsed_time": "0:54:28", "remaining_time": "15:27:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 97, "total_steps": 1730, "loss": 0.9072, "learning_rate": 3.3112862237770753e-06, "epoch": 0.11205776173285198, "percentage": 5.61, "elapsed_time": "0:55:02", "remaining_time": "15:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 98, "total_steps": 1730, "loss": 0.9226, "learning_rate": 3.318710126154159e-06, "epoch": 0.1132129963898917, "percentage": 5.66, "elapsed_time": "0:55:35", "remaining_time": "15:25:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 99, "total_steps": 1730, "loss": 0.9002, "learning_rate": 3.3260586576625835e-06, "epoch": 0.1143682310469314, "percentage": 5.72, "elapsed_time": "0:56:09", "remaining_time": "15:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 1730, "loss": 0.9335, "learning_rate": 3.333333333333334e-06, "epoch": 0.11552346570397112, "percentage": 5.78, "elapsed_time": "0:56:42", "remaining_time": "15:24:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 101, "total_steps": 1730, "loss": 0.9079, "learning_rate": 3.340535622971072e-06, "epoch": 0.11667870036101083, "percentage": 5.84, "elapsed_time": "0:57:16", "remaining_time": "15:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 102, "total_steps": 1730, "loss": 0.9188, "learning_rate": 3.3476669529365297e-06, "epoch": 0.11783393501805055, "percentage": 5.9, "elapsed_time": "0:57:50", "remaining_time": "15:23:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 103, "total_steps": 1730, "loss": 0.9207, "learning_rate": 3.3547287078419544e-06, "epoch": 0.11898916967509025, "percentage": 5.95, "elapsed_time": "0:58:24", "remaining_time": "15:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 104, "total_steps": 1730, "loss": 0.8937, "learning_rate": 3.361722232164634e-06, "epoch": 0.12014440433212996, "percentage": 6.01, "elapsed_time": "0:58:58", "remaining_time": "15:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 1730, "loss": 0.9189, "learning_rate": 3.3686488317832306e-06, "epoch": 0.12129963898916968, "percentage": 6.07, "elapsed_time": "0:59:31", "remaining_time": "15:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 106, "total_steps": 1730, "loss": 0.9034, "learning_rate": 3.375509775441284e-06, "epoch": 0.12245487364620938, "percentage": 6.13, "elapsed_time": "1:00:05", "remaining_time": "15:20:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 107, "total_steps": 1730, "loss": 0.9008, "learning_rate": 3.3823062961420163e-06, "epoch": 0.1236101083032491, "percentage": 6.18, "elapsed_time": "1:00:39", "remaining_time": "15:20:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 108, "total_steps": 1730, "loss": 0.8788, "learning_rate": 3.3890395924782498e-06, "epoch": 0.12476534296028881, "percentage": 6.24, "elapsed_time": "1:01:14", "remaining_time": "15:19:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 109, "total_steps": 1730, "loss": 0.9252, "learning_rate": 3.3957108299010395e-06, "epoch": 0.12592057761732853, "percentage": 6.3, "elapsed_time": "1:01:47", "remaining_time": "15:19:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 1730, "loss": 0.9221, "learning_rate": 3.402321141930376e-06, "epoch": 0.12707581227436823, "percentage": 6.36, "elapsed_time": "1:02:21", "remaining_time": "15:18:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 111, "total_steps": 1730, "loss": 0.8957, "learning_rate": 3.408871631311096e-06, "epoch": 0.12823104693140794, "percentage": 6.42, "elapsed_time": "1:02:55", "remaining_time": "15:17:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 112, "total_steps": 1730, "loss": 0.8895, "learning_rate": 3.415363371116969e-06, "epoch": 0.12938628158844764, "percentage": 6.47, "elapsed_time": "1:03:29", "remaining_time": "15:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 113, "total_steps": 1730, "loss": 0.9094, "learning_rate": 3.4217974058057e-06, "epoch": 0.13054151624548738, "percentage": 6.53, "elapsed_time": "1:04:02", "remaining_time": "15:16:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 114, "total_steps": 1730, "loss": 0.9063, "learning_rate": 3.428174752227455e-06, "epoch": 0.13169675090252708, "percentage": 6.59, "elapsed_time": "1:04:36", "remaining_time": "15:15:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 115, "total_steps": 1730, "loss": 0.9164, "learning_rate": 3.434496400589353e-06, "epoch": 0.1328519855595668, "percentage": 6.65, "elapsed_time": "1:05:10", "remaining_time": "15:15:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 116, "total_steps": 1730, "loss": 0.9125, "learning_rate": 3.440763315378198e-06, "epoch": 0.1340072202166065, "percentage": 6.71, "elapsed_time": "1:05:44", "remaining_time": "15:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 117, "total_steps": 1730, "loss": 0.892, "learning_rate": 3.446976436243603e-06, "epoch": 0.1351624548736462, "percentage": 6.76, "elapsed_time": "1:06:17", "remaining_time": "15:13:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 118, "total_steps": 1730, "loss": 0.896, "learning_rate": 3.4531366788435426e-06, "epoch": 0.13631768953068593, "percentage": 6.82, "elapsed_time": "1:06:51", "remaining_time": "15:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 119, "total_steps": 1730, "loss": 0.8718, "learning_rate": 3.4592449356542185e-06, "epoch": 0.13747292418772564, "percentage": 6.88, "elapsed_time": "1:07:25", "remaining_time": "15:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 1730, "loss": 0.9059, "learning_rate": 3.4653020767460416e-06, "epoch": 0.13862815884476534, "percentage": 6.94, "elapsed_time": "1:07:59", "remaining_time": "15:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 121, "total_steps": 1730, "loss": 0.9188, "learning_rate": 3.471308950527417e-06, "epoch": 0.13978339350180505, "percentage": 6.99, "elapsed_time": "1:08:33", "remaining_time": "15:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 122, "total_steps": 1730, "loss": 0.9289, "learning_rate": 3.4772663844579142e-06, "epoch": 0.14093862815884475, "percentage": 7.05, "elapsed_time": "1:09:09", "remaining_time": "15:11:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 123, "total_steps": 1730, "loss": 0.9007, "learning_rate": 3.48317518573233e-06, "epoch": 0.1420938628158845, "percentage": 7.11, "elapsed_time": "1:09:43", "remaining_time": "15:10:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 124, "total_steps": 1730, "loss": 0.8807, "learning_rate": 3.4890361419370587e-06, "epoch": 0.1432490974729242, "percentage": 7.17, "elapsed_time": "1:10:16", "remaining_time": "15:10:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 125, "total_steps": 1730, "loss": 0.8969, "learning_rate": 3.4948500216800947e-06, "epoch": 0.1444043321299639, "percentage": 7.23, "elapsed_time": "1:10:50", "remaining_time": "15:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 126, "total_steps": 1730, "loss": 0.9001, "learning_rate": 3.5006175751959385e-06, "epoch": 0.1455595667870036, "percentage": 7.28, "elapsed_time": "1:11:25", "remaining_time": "15:09:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 127, "total_steps": 1730, "loss": 0.9093, "learning_rate": 3.506339534926595e-06, "epoch": 0.1467148014440433, "percentage": 7.34, "elapsed_time": "1:11:59", "remaining_time": "15:08:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 128, "total_steps": 1730, "loss": 0.8793, "learning_rate": 3.512016616079781e-06, "epoch": 0.14787003610108304, "percentage": 7.4, "elapsed_time": "1:12:32", "remaining_time": "15:07:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 129, "total_steps": 1730, "loss": 0.8855, "learning_rate": 3.5176495171654153e-06, "epoch": 0.14902527075812275, "percentage": 7.46, "elapsed_time": "1:13:06", "remaining_time": "15:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 1730, "loss": 0.8642, "learning_rate": 3.523238920511395e-06, "epoch": 0.15018050541516245, "percentage": 7.51, "elapsed_time": "1:13:39", "remaining_time": "15:06:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 131, "total_steps": 1730, "loss": 0.8966, "learning_rate": 3.528785492759607e-06, "epoch": 0.15133574007220216, "percentage": 7.57, "elapsed_time": "1:14:13", "remaining_time": "15:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 132, "total_steps": 1730, "loss": 0.9036, "learning_rate": 3.5342898853430833e-06, "epoch": 0.1524909747292419, "percentage": 7.63, "elapsed_time": "1:14:46", "remaining_time": "15:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 133, "total_steps": 1730, "loss": 0.8796, "learning_rate": 3.5397527349451433e-06, "epoch": 0.1536462093862816, "percentage": 7.69, "elapsed_time": "1:15:20", "remaining_time": "15:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 134, "total_steps": 1730, "loss": 0.8993, "learning_rate": 3.5451746639413463e-06, "epoch": 0.1548014440433213, "percentage": 7.75, "elapsed_time": "1:15:54", "remaining_time": "15:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 135, "total_steps": 1730, "loss": 0.8887, "learning_rate": 3.550556280825011e-06, "epoch": 0.155956678700361, "percentage": 7.8, "elapsed_time": "1:16:27", "remaining_time": "15:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 136, "total_steps": 1730, "loss": 0.8799, "learning_rate": 3.55589818061703e-06, "epoch": 0.1571119133574007, "percentage": 7.86, "elapsed_time": "1:17:01", "remaining_time": "15:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 137, "total_steps": 1730, "loss": 0.9006, "learning_rate": 3.5612009452606784e-06, "epoch": 0.15826714801444045, "percentage": 7.92, "elapsed_time": "1:17:35", "remaining_time": "15:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 138, "total_steps": 1730, "loss": 0.9254, "learning_rate": 3.5664651440020615e-06, "epoch": 0.15942238267148015, "percentage": 7.98, "elapsed_time": "1:18:09", "remaining_time": "15:01:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 139, "total_steps": 1730, "loss": 0.8843, "learning_rate": 3.5716913337568255e-06, "epoch": 0.16057761732851986, "percentage": 8.03, "elapsed_time": "1:18:42", "remaining_time": "15:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 1730, "loss": 0.8904, "learning_rate": 3.5768800594637304e-06, "epoch": 0.16173285198555956, "percentage": 8.09, "elapsed_time": "1:19:16", "remaining_time": "15:00:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 141, "total_steps": 1730, "loss": 0.9226, "learning_rate": 3.582031854425634e-06, "epoch": 0.16288808664259927, "percentage": 8.15, "elapsed_time": "1:19:49", "remaining_time": "14:59:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 142, "total_steps": 1730, "loss": 0.9165, "learning_rate": 3.587147240638428e-06, "epoch": 0.164043321299639, "percentage": 8.21, "elapsed_time": "1:20:23", "remaining_time": "14:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 143, "total_steps": 1730, "loss": 0.8984, "learning_rate": 3.5922267291084367e-06, "epoch": 0.1651985559566787, "percentage": 8.27, "elapsed_time": "1:20:57", "remaining_time": "14:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 144, "total_steps": 1730, "loss": 0.9018, "learning_rate": 3.59727082015875e-06, "epoch": 0.1663537906137184, "percentage": 8.32, "elapsed_time": "1:21:30", "remaining_time": "14:57:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 145, "total_steps": 1730, "loss": 0.8928, "learning_rate": 3.6022800037249583e-06, "epoch": 0.16750902527075812, "percentage": 8.38, "elapsed_time": "1:22:04", "remaining_time": "14:57:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 146, "total_steps": 1730, "loss": 0.887, "learning_rate": 3.607254759640729e-06, "epoch": 0.16866425992779782, "percentage": 8.44, "elapsed_time": "1:22:37", "remaining_time": "14:56:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 147, "total_steps": 1730, "loss": 0.8906, "learning_rate": 3.612195557913627e-06, "epoch": 0.16981949458483755, "percentage": 8.5, "elapsed_time": "1:23:11", "remaining_time": "14:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 148, "total_steps": 1730, "loss": 0.8866, "learning_rate": 3.6171028589915957e-06, "epoch": 0.17097472924187726, "percentage": 8.55, "elapsed_time": "1:23:45", "remaining_time": "14:55:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 149, "total_steps": 1730, "loss": 0.875, "learning_rate": 3.6219771140204575e-06, "epoch": 0.17212996389891697, "percentage": 8.61, "elapsed_time": "1:24:19", "remaining_time": "14:54:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 1730, "loss": 0.9158, "learning_rate": 3.626818765092802e-06, "epoch": 0.17328519855595667, "percentage": 8.67, "elapsed_time": "1:24:53", "remaining_time": "14:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 151, "total_steps": 1730, "loss": 0.8595, "learning_rate": 3.631628245488616e-06, "epoch": 0.17444043321299638, "percentage": 8.73, "elapsed_time": "1:25:26", "remaining_time": "14:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 152, "total_steps": 1730, "loss": 0.8762, "learning_rate": 3.6364059799079547e-06, "epoch": 0.1755956678700361, "percentage": 8.79, "elapsed_time": "1:26:00", "remaining_time": "14:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 153, "total_steps": 1730, "loss": 0.8769, "learning_rate": 3.6411523846959985e-06, "epoch": 0.17675090252707581, "percentage": 8.84, "elapsed_time": "1:26:33", "remaining_time": "14:52:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 154, "total_steps": 1730, "loss": 0.9109, "learning_rate": 3.6458678680607725e-06, "epoch": 0.17790613718411552, "percentage": 8.9, "elapsed_time": "1:27:07", "remaining_time": "14:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 155, "total_steps": 1730, "loss": 0.8624, "learning_rate": 3.6505528302838196e-06, "epoch": 0.17906137184115523, "percentage": 8.96, "elapsed_time": "1:27:41", "remaining_time": "14:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 156, "total_steps": 1730, "loss": 0.8581, "learning_rate": 3.655207663924103e-06, "epoch": 0.18021660649819496, "percentage": 9.02, "elapsed_time": "1:28:15", "remaining_time": "14:50:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 157, "total_steps": 1730, "loss": 0.8699, "learning_rate": 3.65983275401539e-06, "epoch": 0.18137184115523466, "percentage": 9.08, "elapsed_time": "1:28:49", "remaining_time": "14:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 158, "total_steps": 1730, "loss": 0.8896, "learning_rate": 3.664428478257371e-06, "epoch": 0.18252707581227437, "percentage": 9.13, "elapsed_time": "1:29:22", "remaining_time": "14:49:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 159, "total_steps": 1730, "loss": 0.8954, "learning_rate": 3.6689952072007528e-06, "epoch": 0.18368231046931408, "percentage": 9.19, "elapsed_time": "1:29:57", "remaining_time": "14:48:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 1730, "loss": 0.8794, "learning_rate": 3.6735333044265414e-06, "epoch": 0.18483754512635378, "percentage": 9.25, "elapsed_time": "1:30:30", "remaining_time": "14:48:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 161, "total_steps": 1730, "loss": 0.9103, "learning_rate": 3.6780431267197503e-06, "epoch": 0.1859927797833935, "percentage": 9.31, "elapsed_time": "1:31:03", "remaining_time": "14:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 162, "total_steps": 1730, "loss": 0.8945, "learning_rate": 3.6825250242377186e-06, "epoch": 0.18714801444043322, "percentage": 9.36, "elapsed_time": "1:31:37", "remaining_time": "14:46:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 163, "total_steps": 1730, "loss": 0.8884, "learning_rate": 3.6869793406732633e-06, "epoch": 0.18830324909747292, "percentage": 9.42, "elapsed_time": "1:32:11", "remaining_time": "14:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 164, "total_steps": 1730, "loss": 0.893, "learning_rate": 3.69140641341283e-06, "epoch": 0.18945848375451263, "percentage": 9.48, "elapsed_time": "1:32:45", "remaining_time": "14:45:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 165, "total_steps": 1730, "loss": 0.8739, "learning_rate": 3.6958065736898442e-06, "epoch": 0.19061371841155234, "percentage": 9.54, "elapsed_time": "1:33:19", "remaining_time": "14:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 166, "total_steps": 1730, "loss": 0.8832, "learning_rate": 3.700180146733426e-06, "epoch": 0.19176895306859207, "percentage": 9.6, "elapsed_time": "1:33:53", "remaining_time": "14:44:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 167, "total_steps": 1730, "loss": 0.8785, "learning_rate": 3.7045274519126395e-06, "epoch": 0.19292418772563177, "percentage": 9.65, "elapsed_time": "1:34:27", "remaining_time": "14:44:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 168, "total_steps": 1730, "loss": 0.8722, "learning_rate": 3.7088488028764387e-06, "epoch": 0.19407942238267148, "percentage": 9.71, "elapsed_time": "1:35:01", "remaining_time": "14:43:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 169, "total_steps": 1730, "loss": 0.8833, "learning_rate": 3.7131445076894563e-06, "epoch": 0.19523465703971118, "percentage": 9.77, "elapsed_time": "1:35:34", "remaining_time": "14:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 1730, "loss": 0.8795, "learning_rate": 3.717414868963791e-06, "epoch": 0.1963898916967509, "percentage": 9.83, "elapsed_time": "1:36:08", "remaining_time": "14:42:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 171, "total_steps": 1730, "loss": 0.9025, "learning_rate": 3.721660183986924e-06, "epoch": 0.19754512635379062, "percentage": 9.88, "elapsed_time": "1:36:42", "remaining_time": "14:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 172, "total_steps": 1730, "loss": 0.9047, "learning_rate": 3.725880744845915e-06, "epoch": 0.19870036101083033, "percentage": 9.94, "elapsed_time": "1:37:17", "remaining_time": "14:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 173, "total_steps": 1730, "loss": 0.8571, "learning_rate": 3.7300768385479928e-06, "epoch": 0.19985559566787003, "percentage": 10.0, "elapsed_time": "1:37:50", "remaining_time": "14:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 174, "total_steps": 1730, "loss": 0.8776, "learning_rate": 3.7342487471376667e-06, "epoch": 0.20101083032490974, "percentage": 10.06, "elapsed_time": "1:38:24", "remaining_time": "14:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 1730, "loss": 0.9018, "learning_rate": 3.7383967478104918e-06, "epoch": 0.20216606498194944, "percentage": 10.12, "elapsed_time": "1:38:58", "remaining_time": "14:39:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 176, "total_steps": 1730, "loss": 0.8861, "learning_rate": 3.7425211130235835e-06, "epoch": 0.20332129963898918, "percentage": 10.17, "elapsed_time": "1:39:32", "remaining_time": "14:38:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 177, "total_steps": 1730, "loss": 0.8974, "learning_rate": 3.7466221106030114e-06, "epoch": 0.20447653429602888, "percentage": 10.23, "elapsed_time": "1:40:05", "remaining_time": "14:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 178, "total_steps": 1730, "loss": 0.8904, "learning_rate": 3.7507000038481574e-06, "epoch": 0.2056317689530686, "percentage": 10.29, "elapsed_time": "1:40:39", "remaining_time": "14:37:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 179, "total_steps": 1730, "loss": 0.8637, "learning_rate": 3.7547550516331556e-06, "epoch": 0.2067870036101083, "percentage": 10.35, "elapsed_time": "1:41:13", "remaining_time": "14:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 1730, "loss": 0.8718, "learning_rate": 3.7587875085055104e-06, "epoch": 0.20794223826714803, "percentage": 10.4, "elapsed_time": "1:41:47", "remaining_time": "14:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 181, "total_steps": 1730, "loss": 0.8697, "learning_rate": 3.762797624781975e-06, "epoch": 0.20909747292418773, "percentage": 10.46, "elapsed_time": "1:42:21", "remaining_time": "14:35:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 182, "total_steps": 1730, "loss": 0.8838, "learning_rate": 3.7667856466417917e-06, "epoch": 0.21025270758122744, "percentage": 10.52, "elapsed_time": "1:42:55", "remaining_time": "14:35:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 183, "total_steps": 1730, "loss": 0.8704, "learning_rate": 3.7707518162173835e-06, "epoch": 0.21140794223826714, "percentage": 10.58, "elapsed_time": "1:43:29", "remaining_time": "14:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 184, "total_steps": 1730, "loss": 0.855, "learning_rate": 3.7746963716825613e-06, "epoch": 0.21256317689530685, "percentage": 10.64, "elapsed_time": "1:44:02", "remaining_time": "14:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 185, "total_steps": 1730, "loss": 0.8712, "learning_rate": 3.778619547338356e-06, "epoch": 0.21371841155234658, "percentage": 10.69, "elapsed_time": "1:44:36", "remaining_time": "14:33:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 186, "total_steps": 1730, "loss": 0.8729, "learning_rate": 3.7825215736965283e-06, "epoch": 0.2148736462093863, "percentage": 10.75, "elapsed_time": "1:45:10", "remaining_time": "14:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 187, "total_steps": 1730, "loss": 0.8845, "learning_rate": 3.786402677560832e-06, "epoch": 0.216028880866426, "percentage": 10.81, "elapsed_time": "1:45:45", "remaining_time": "14:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 188, "total_steps": 1730, "loss": 0.8669, "learning_rate": 3.7902630821061337e-06, "epoch": 0.2171841155234657, "percentage": 10.87, "elapsed_time": "1:46:18", "remaining_time": "14:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 189, "total_steps": 1730, "loss": 0.8897, "learning_rate": 3.7941030069554073e-06, "epoch": 0.2183393501805054, "percentage": 10.92, "elapsed_time": "1:46:53", "remaining_time": "14:31:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 1730, "loss": 0.8731, "learning_rate": 3.7979226682547152e-06, "epoch": 0.21949458483754514, "percentage": 10.98, "elapsed_time": "1:47:26", "remaining_time": "14:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 191, "total_steps": 1730, "loss": 0.8946, "learning_rate": 3.8017222787462132e-06, "epoch": 0.22064981949458484, "percentage": 11.04, "elapsed_time": "1:48:01", "remaining_time": "14:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 192, "total_steps": 1730, "loss": 0.8567, "learning_rate": 3.8055020478392497e-06, "epoch": 0.22180505415162455, "percentage": 11.1, "elapsed_time": "1:48:35", "remaining_time": "14:29:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 193, "total_steps": 1730, "loss": 0.8819, "learning_rate": 3.8092621816796233e-06, "epoch": 0.22296028880866425, "percentage": 11.16, "elapsed_time": "1:49:09", "remaining_time": "14:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 194, "total_steps": 1730, "loss": 0.8733, "learning_rate": 3.813002883217044e-06, "epoch": 0.22411552346570396, "percentage": 11.21, "elapsed_time": "1:49:42", "remaining_time": "14:28:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 195, "total_steps": 1730, "loss": 0.8764, "learning_rate": 3.816724352270864e-06, "epoch": 0.2252707581227437, "percentage": 11.27, "elapsed_time": "1:50:16", "remaining_time": "14:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 196, "total_steps": 1730, "loss": 0.8607, "learning_rate": 3.820426785594127e-06, "epoch": 0.2264259927797834, "percentage": 11.33, "elapsed_time": "1:50:49", "remaining_time": "14:27:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 197, "total_steps": 1730, "loss": 0.8726, "learning_rate": 3.824110376935989e-06, "epoch": 0.2275812274368231, "percentage": 11.39, "elapsed_time": "1:51:23", "remaining_time": "14:26:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 198, "total_steps": 1730, "loss": 0.858, "learning_rate": 3.827775317102552e-06, "epoch": 0.2287364620938628, "percentage": 11.45, "elapsed_time": "1:51:57", "remaining_time": "14:26:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 199, "total_steps": 1730, "loss": 0.8606, "learning_rate": 3.831421794016178e-06, "epoch": 0.2298916967509025, "percentage": 11.5, "elapsed_time": "1:52:30", "remaining_time": "14:25:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 1730, "loss": 0.8613, "learning_rate": 3.835049992773302e-06, "epoch": 0.23104693140794225, "percentage": 11.56, "elapsed_time": "1:53:04", "remaining_time": "14:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 201, "total_steps": 1730, "loss": 0.866, "learning_rate": 3.8386600957008155e-06, "epoch": 0.23220216606498195, "percentage": 11.62, "elapsed_time": "1:53:38", "remaining_time": "14:24:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 202, "total_steps": 1730, "loss": 0.8814, "learning_rate": 3.8422522824110405e-06, "epoch": 0.23335740072202166, "percentage": 11.68, "elapsed_time": "1:54:12", "remaining_time": "14:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 203, "total_steps": 1730, "loss": 0.8791, "learning_rate": 3.8458267298553554e-06, "epoch": 0.23451263537906136, "percentage": 11.73, "elapsed_time": "1:54:46", "remaining_time": "14:23:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 204, "total_steps": 1730, "loss": 0.8797, "learning_rate": 3.849383612376498e-06, "epoch": 0.2356678700361011, "percentage": 11.79, "elapsed_time": "1:55:20", "remaining_time": "14:22:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 205, "total_steps": 1730, "loss": 0.8866, "learning_rate": 3.852923101759591e-06, "epoch": 0.2368231046931408, "percentage": 11.85, "elapsed_time": "1:55:53", "remaining_time": "14:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 206, "total_steps": 1730, "loss": 0.8666, "learning_rate": 3.856445367281923e-06, "epoch": 0.2379783393501805, "percentage": 11.91, "elapsed_time": "1:56:28", "remaining_time": "14:21:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 207, "total_steps": 1730, "loss": 0.8727, "learning_rate": 3.8599505757615295e-06, "epoch": 0.2391335740072202, "percentage": 11.97, "elapsed_time": "1:57:02", "remaining_time": "14:21:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 208, "total_steps": 1730, "loss": 0.8801, "learning_rate": 3.863438891604603e-06, "epoch": 0.24028880866425992, "percentage": 12.02, "elapsed_time": "1:57:35", "remaining_time": "14:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 209, "total_steps": 1730, "loss": 0.8203, "learning_rate": 3.866910476851757e-06, "epoch": 0.24144404332129965, "percentage": 12.08, "elapsed_time": "1:58:09", "remaining_time": "14:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 1730, "loss": 0.8384, "learning_rate": 3.870365491223199e-06, "epoch": 0.24259927797833936, "percentage": 12.14, "elapsed_time": "1:58:43", "remaining_time": "14:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 211, "total_steps": 1730, "loss": 0.8423, "learning_rate": 3.873804092162822e-06, "epoch": 0.24375451263537906, "percentage": 12.2, "elapsed_time": "1:59:17", "remaining_time": "14:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 212, "total_steps": 1730, "loss": 0.8521, "learning_rate": 3.877226434881253e-06, "epoch": 0.24490974729241877, "percentage": 12.25, "elapsed_time": "1:59:51", "remaining_time": "14:18:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 213, "total_steps": 1730, "loss": 0.8847, "learning_rate": 3.880632672397897e-06, "epoch": 0.24606498194945847, "percentage": 12.31, "elapsed_time": "2:00:24", "remaining_time": "14:17:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 214, "total_steps": 1730, "loss": 0.86, "learning_rate": 3.884022955581984e-06, "epoch": 0.2472202166064982, "percentage": 12.37, "elapsed_time": "2:00:58", "remaining_time": "14:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 215, "total_steps": 1730, "loss": 0.8489, "learning_rate": 3.887397433192676e-06, "epoch": 0.2483754512635379, "percentage": 12.43, "elapsed_time": "2:01:32", "remaining_time": "14:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 216, "total_steps": 1730, "loss": 0.845, "learning_rate": 3.890756251918219e-06, "epoch": 0.24953068592057762, "percentage": 12.49, "elapsed_time": "2:02:06", "remaining_time": "14:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 217, "total_steps": 1730, "loss": 0.8584, "learning_rate": 3.894099556414216e-06, "epoch": 0.25068592057761735, "percentage": 12.54, "elapsed_time": "2:02:39", "remaining_time": "14:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 218, "total_steps": 1730, "loss": 0.8608, "learning_rate": 3.897427489341009e-06, "epoch": 0.25184115523465705, "percentage": 12.6, "elapsed_time": "2:03:13", "remaining_time": "14:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 219, "total_steps": 1730, "loss": 0.8509, "learning_rate": 3.900740191400198e-06, "epoch": 0.25299638989169676, "percentage": 12.66, "elapsed_time": "2:03:46", "remaining_time": "14:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 1730, "loss": 0.8556, "learning_rate": 3.9040378013703444e-06, "epoch": 0.25415162454873647, "percentage": 12.72, "elapsed_time": "2:04:21", "remaining_time": "14:13:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 221, "total_steps": 1730, "loss": 0.8495, "learning_rate": 3.907320456141851e-06, "epoch": 0.25530685920577617, "percentage": 12.77, "elapsed_time": "2:04:54", "remaining_time": "14:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 222, "total_steps": 1730, "loss": 0.8527, "learning_rate": 3.910588290751064e-06, "epoch": 0.2564620938628159, "percentage": 12.83, "elapsed_time": "2:05:28", "remaining_time": "14:12:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 223, "total_steps": 1730, "loss": 0.8398, "learning_rate": 3.913841438413601e-06, "epoch": 0.2576173285198556, "percentage": 12.89, "elapsed_time": "2:06:02", "remaining_time": "14:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 224, "total_steps": 1730, "loss": 0.8575, "learning_rate": 3.9170800305569385e-06, "epoch": 0.2587725631768953, "percentage": 12.95, "elapsed_time": "2:06:36", "remaining_time": "14:11:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 225, "total_steps": 1730, "loss": 0.8804, "learning_rate": 3.920304196852272e-06, "epoch": 0.259927797833935, "percentage": 13.01, "elapsed_time": "2:07:10", "remaining_time": "14:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 226, "total_steps": 1730, "loss": 0.8532, "learning_rate": 3.923514065245669e-06, "epoch": 0.26108303249097475, "percentage": 13.06, "elapsed_time": "2:07:44", "remaining_time": "14:10:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 227, "total_steps": 1730, "loss": 0.8597, "learning_rate": 3.9267097619885385e-06, "epoch": 0.26223826714801446, "percentage": 13.12, "elapsed_time": "2:08:18", "remaining_time": "14:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 228, "total_steps": 1730, "loss": 0.8605, "learning_rate": 3.9298914116674236e-06, "epoch": 0.26339350180505416, "percentage": 13.18, "elapsed_time": "2:08:52", "remaining_time": "14:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 229, "total_steps": 1730, "loss": 0.8463, "learning_rate": 3.9330591372331475e-06, "epoch": 0.26454873646209387, "percentage": 13.24, "elapsed_time": "2:09:26", "remaining_time": "14:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 1730, "loss": 0.8655, "learning_rate": 3.936213060029322e-06, "epoch": 0.2657039711191336, "percentage": 13.29, "elapsed_time": "2:10:00", "remaining_time": "14:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 231, "total_steps": 1730, "loss": 0.8729, "learning_rate": 3.9393532998202405e-06, "epoch": 0.2668592057761733, "percentage": 13.35, "elapsed_time": "2:10:34", "remaining_time": "14:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 232, "total_steps": 1730, "loss": 0.8626, "learning_rate": 3.942479974818166e-06, "epoch": 0.268014440433213, "percentage": 13.41, "elapsed_time": "2:11:08", "remaining_time": "14:06:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 233, "total_steps": 1730, "loss": 0.8665, "learning_rate": 3.9455932017100315e-06, "epoch": 0.2691696750902527, "percentage": 13.47, "elapsed_time": "2:11:42", "remaining_time": "14:06:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 234, "total_steps": 1730, "loss": 0.841, "learning_rate": 3.9486930956835726e-06, "epoch": 0.2703249097472924, "percentage": 13.53, "elapsed_time": "2:12:15", "remaining_time": "14:05:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 235, "total_steps": 1730, "loss": 0.8528, "learning_rate": 3.951779770452894e-06, "epoch": 0.27148014440433216, "percentage": 13.58, "elapsed_time": "2:12:50", "remaining_time": "14:05:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 236, "total_steps": 1730, "loss": 0.8636, "learning_rate": 3.954853338283512e-06, "epoch": 0.27263537906137186, "percentage": 13.64, "elapsed_time": "2:13:24", "remaining_time": "14:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 237, "total_steps": 1730, "loss": 0.884, "learning_rate": 3.95791391001684e-06, "epoch": 0.27379061371841157, "percentage": 13.7, "elapsed_time": "2:13:58", "remaining_time": "14:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 238, "total_steps": 1730, "loss": 0.8532, "learning_rate": 3.960961595094187e-06, "epoch": 0.2749458483754513, "percentage": 13.76, "elapsed_time": "2:14:32", "remaining_time": "14:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 239, "total_steps": 1730, "loss": 0.8555, "learning_rate": 3.96399650158023e-06, "epoch": 0.276101083032491, "percentage": 13.82, "elapsed_time": "2:15:05", "remaining_time": "14:02:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 1730, "loss": 0.8634, "learning_rate": 3.96701873618601e-06, "epoch": 0.2772563176895307, "percentage": 13.87, "elapsed_time": "2:15:39", "remaining_time": "14:02:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 241, "total_steps": 1730, "loss": 0.8574, "learning_rate": 3.970028404291448e-06, "epoch": 0.2784115523465704, "percentage": 13.93, "elapsed_time": "2:16:13", "remaining_time": "14:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 242, "total_steps": 1730, "loss": 0.8741, "learning_rate": 3.973025609967386e-06, "epoch": 0.2795667870036101, "percentage": 13.99, "elapsed_time": "2:16:46", "remaining_time": "14:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 243, "total_steps": 1730, "loss": 0.8705, "learning_rate": 3.976010455997187e-06, "epoch": 0.2807220216606498, "percentage": 14.05, "elapsed_time": "2:17:20", "remaining_time": "14:00:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 244, "total_steps": 1730, "loss": 0.853, "learning_rate": 3.978983043897884e-06, "epoch": 0.2818772563176895, "percentage": 14.1, "elapsed_time": "2:17:54", "remaining_time": "13:59:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 1730, "loss": 0.8776, "learning_rate": 3.981943473940888e-06, "epoch": 0.28303249097472927, "percentage": 14.16, "elapsed_time": "2:18:28", "remaining_time": "13:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 246, "total_steps": 1730, "loss": 0.86, "learning_rate": 3.984891845172299e-06, "epoch": 0.284187725631769, "percentage": 14.22, "elapsed_time": "2:19:01", "remaining_time": "13:58:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 247, "total_steps": 1730, "loss": 0.8758, "learning_rate": 3.987828255432777e-06, "epoch": 0.2853429602888087, "percentage": 14.28, "elapsed_time": "2:19:35", "remaining_time": "13:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 248, "total_steps": 1730, "loss": 0.8626, "learning_rate": 3.990752801377028e-06, "epoch": 0.2864981949458484, "percentage": 14.34, "elapsed_time": "2:20:08", "remaining_time": "13:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 249, "total_steps": 1730, "loss": 0.858, "learning_rate": 3.993665578492894e-06, "epoch": 0.2876534296028881, "percentage": 14.39, "elapsed_time": "2:20:43", "remaining_time": "13:56:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 1730, "loss": 0.8429, "learning_rate": 3.996566681120062e-06, "epoch": 0.2888086642599278, "percentage": 14.45, "elapsed_time": "2:21:17", "remaining_time": "13:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 251, "total_steps": 1730, "loss": 0.8686, "learning_rate": 3.999456202468397e-06, "epoch": 0.2899638989169675, "percentage": 14.51, "elapsed_time": "2:36:05", "remaining_time": "15:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 252, "total_steps": 1730, "loss": 0.8422, "learning_rate": 4.0023342346359075e-06, "epoch": 0.2911191335740072, "percentage": 14.57, "elapsed_time": "2:36:39", "remaining_time": "15:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 253, "total_steps": 1730, "loss": 0.8868, "learning_rate": 4.0052008686263635e-06, "epoch": 0.2922743682310469, "percentage": 14.62, "elapsed_time": "2:37:12", "remaining_time": "15:17:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 254, "total_steps": 1730, "loss": 0.8639, "learning_rate": 4.0080561943665644e-06, "epoch": 0.2934296028880866, "percentage": 14.68, "elapsed_time": "2:37:46", "remaining_time": "15:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 255, "total_steps": 1730, "loss": 0.8453, "learning_rate": 4.010900300723259e-06, "epoch": 0.2945848375451264, "percentage": 14.74, "elapsed_time": "2:38:20", "remaining_time": "15:15:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 256, "total_steps": 1730, "loss": 0.8771, "learning_rate": 4.0137332755197495e-06, "epoch": 0.2957400722021661, "percentage": 14.8, "elapsed_time": "2:38:53", "remaining_time": "15:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 257, "total_steps": 1730, "loss": 0.8524, "learning_rate": 4.016555205552159e-06, "epoch": 0.2968953068592058, "percentage": 14.86, "elapsed_time": "2:39:28", "remaining_time": "15:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 258, "total_steps": 1730, "loss": 0.8345, "learning_rate": 4.019366176605384e-06, "epoch": 0.2980505415162455, "percentage": 14.91, "elapsed_time": "2:40:03", "remaining_time": "15:13:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 259, "total_steps": 1730, "loss": 0.8441, "learning_rate": 4.022166273468753e-06, "epoch": 0.2992057761732852, "percentage": 14.97, "elapsed_time": "2:40:37", "remaining_time": "15:12:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 1730, "loss": 0.8639, "learning_rate": 4.024955579951363e-06, "epoch": 0.3003610108303249, "percentage": 15.03, "elapsed_time": "2:41:11", "remaining_time": "15:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 261, "total_steps": 1730, "loss": 0.8465, "learning_rate": 4.0277341788971355e-06, "epoch": 0.3015162454873646, "percentage": 15.09, "elapsed_time": "2:41:45", "remaining_time": "15:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 262, "total_steps": 1730, "loss": 0.8752, "learning_rate": 4.030502152199576e-06, "epoch": 0.3026714801444043, "percentage": 15.14, "elapsed_time": "2:42:19", "remaining_time": "15:09:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 263, "total_steps": 1730, "loss": 0.8433, "learning_rate": 4.033259580816264e-06, "epoch": 0.303826714801444, "percentage": 15.2, "elapsed_time": "2:42:53", "remaining_time": "15:08:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 264, "total_steps": 1730, "loss": 0.8769, "learning_rate": 4.036006544783052e-06, "epoch": 0.3049819494584838, "percentage": 15.26, "elapsed_time": "2:43:27", "remaining_time": "15:07:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 265, "total_steps": 1730, "loss": 0.8705, "learning_rate": 4.0387431232280135e-06, "epoch": 0.3061371841155235, "percentage": 15.32, "elapsed_time": "2:44:01", "remaining_time": "15:06:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 266, "total_steps": 1730, "loss": 0.8497, "learning_rate": 4.041469394385113e-06, "epoch": 0.3072924187725632, "percentage": 15.38, "elapsed_time": "2:44:35", "remaining_time": "15:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 267, "total_steps": 1730, "loss": 0.8503, "learning_rate": 4.044185435607626e-06, "epoch": 0.3084476534296029, "percentage": 15.43, "elapsed_time": "2:45:09", "remaining_time": "15:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 268, "total_steps": 1730, "loss": 0.8594, "learning_rate": 4.046891323381315e-06, "epoch": 0.3096028880866426, "percentage": 15.49, "elapsed_time": "2:45:43", "remaining_time": "15:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 269, "total_steps": 1730, "loss": 0.8513, "learning_rate": 4.049587133337347e-06, "epoch": 0.3107581227436823, "percentage": 15.55, "elapsed_time": "2:46:17", "remaining_time": "15:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 1730, "loss": 0.8302, "learning_rate": 4.05227294026498e-06, "epoch": 0.311913357400722, "percentage": 15.61, "elapsed_time": "2:46:51", "remaining_time": "15:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 271, "total_steps": 1730, "loss": 0.8787, "learning_rate": 4.05494881812401e-06, "epoch": 0.3130685920577617, "percentage": 15.66, "elapsed_time": "2:47:25", "remaining_time": "15:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 272, "total_steps": 1730, "loss": 0.8572, "learning_rate": 4.057614840056999e-06, "epoch": 0.3142238267148014, "percentage": 15.72, "elapsed_time": "2:48:01", "remaining_time": "15:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 273, "total_steps": 1730, "loss": 0.8656, "learning_rate": 4.060271078401261e-06, "epoch": 0.31537906137184113, "percentage": 15.78, "elapsed_time": "2:48:36", "remaining_time": "14:59:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 274, "total_steps": 1730, "loss": 0.8574, "learning_rate": 4.0629176047006474e-06, "epoch": 0.3165342960288809, "percentage": 15.84, "elapsed_time": "2:49:10", "remaining_time": "14:58:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 275, "total_steps": 1730, "loss": 0.864, "learning_rate": 4.065554489717105e-06, "epoch": 0.3176895306859206, "percentage": 15.9, "elapsed_time": "2:49:44", "remaining_time": "14:58:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 276, "total_steps": 1730, "loss": 0.8492, "learning_rate": 4.06818180344203e-06, "epoch": 0.3188447653429603, "percentage": 15.95, "elapsed_time": "2:50:18", "remaining_time": "14:57:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 277, "total_steps": 1730, "loss": 0.8255, "learning_rate": 4.070799615107415e-06, "epoch": 0.32, "percentage": 16.01, "elapsed_time": "2:50:54", "remaining_time": "14:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 278, "total_steps": 1730, "loss": 0.8557, "learning_rate": 4.073407993196794e-06, "epoch": 0.3211552346570397, "percentage": 16.07, "elapsed_time": "2:51:27", "remaining_time": "14:55:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 279, "total_steps": 1730, "loss": 0.8433, "learning_rate": 4.076007005455996e-06, "epoch": 0.3223104693140794, "percentage": 16.13, "elapsed_time": "2:52:01", "remaining_time": "14:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 1730, "loss": 0.8639, "learning_rate": 4.078596718903699e-06, "epoch": 0.3234657039711191, "percentage": 16.18, "elapsed_time": "2:52:35", "remaining_time": "14:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 281, "total_steps": 1730, "loss": 0.8617, "learning_rate": 4.0811771998418e-06, "epoch": 0.32462093862815883, "percentage": 16.24, "elapsed_time": "2:53:10", "remaining_time": "14:53:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 282, "total_steps": 1730, "loss": 0.8472, "learning_rate": 4.083748513865602e-06, "epoch": 0.32577617328519853, "percentage": 16.3, "elapsed_time": "2:53:44", "remaining_time": "14:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 283, "total_steps": 1730, "loss": 0.8518, "learning_rate": 4.086310725873818e-06, "epoch": 0.3269314079422383, "percentage": 16.36, "elapsed_time": "2:54:18", "remaining_time": "14:51:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 284, "total_steps": 1730, "loss": 0.856, "learning_rate": 4.088863900078397e-06, "epoch": 0.328086642599278, "percentage": 16.42, "elapsed_time": "2:54:52", "remaining_time": "14:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 285, "total_steps": 1730, "loss": 0.849, "learning_rate": 4.091408100014184e-06, "epoch": 0.3292418772563177, "percentage": 16.47, "elapsed_time": "2:55:26", "remaining_time": "14:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 286, "total_steps": 1730, "loss": 0.8363, "learning_rate": 4.093943388548406e-06, "epoch": 0.3303971119133574, "percentage": 16.53, "elapsed_time": "2:56:00", "remaining_time": "14:48:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 287, "total_steps": 1730, "loss": 0.859, "learning_rate": 4.096469827889988e-06, "epoch": 0.3315523465703971, "percentage": 16.59, "elapsed_time": "2:56:33", "remaining_time": "14:47:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 288, "total_steps": 1730, "loss": 0.873, "learning_rate": 4.0989874795987185e-06, "epoch": 0.3327075812274368, "percentage": 16.65, "elapsed_time": "2:57:07", "remaining_time": "14:46:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 289, "total_steps": 1730, "loss": 0.848, "learning_rate": 4.101496404594247e-06, "epoch": 0.3338628158844765, "percentage": 16.71, "elapsed_time": "2:57:41", "remaining_time": "14:46:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 1730, "loss": 0.834, "learning_rate": 4.103996663164927e-06, "epoch": 0.33501805054151623, "percentage": 16.76, "elapsed_time": "2:58:14", "remaining_time": "14:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 291, "total_steps": 1730, "loss": 0.8667, "learning_rate": 4.106488314976513e-06, "epoch": 0.33617328519855594, "percentage": 16.82, "elapsed_time": "2:58:49", "remaining_time": "14:44:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 292, "total_steps": 1730, "loss": 0.8548, "learning_rate": 4.108971419080698e-06, "epoch": 0.33732851985559564, "percentage": 16.88, "elapsed_time": "2:59:23", "remaining_time": "14:43:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 293, "total_steps": 1730, "loss": 0.8418, "learning_rate": 4.111446033923516e-06, "epoch": 0.3384837545126354, "percentage": 16.94, "elapsed_time": "2:59:57", "remaining_time": "14:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 294, "total_steps": 1730, "loss": 0.8419, "learning_rate": 4.113912217353596e-06, "epoch": 0.3396389891696751, "percentage": 16.99, "elapsed_time": "3:00:31", "remaining_time": "14:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 295, "total_steps": 1730, "loss": 0.8708, "learning_rate": 4.1163700266302726e-06, "epoch": 0.3407942238267148, "percentage": 17.05, "elapsed_time": "3:01:05", "remaining_time": "14:40:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 296, "total_steps": 1730, "loss": 0.8492, "learning_rate": 4.118819518431564e-06, "epoch": 0.3419494584837545, "percentage": 17.11, "elapsed_time": "3:01:39", "remaining_time": "14:40:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 297, "total_steps": 1730, "loss": 0.8607, "learning_rate": 4.121260748862021e-06, "epoch": 0.3431046931407942, "percentage": 17.17, "elapsed_time": "3:02:13", "remaining_time": "14:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 298, "total_steps": 1730, "loss": 0.8543, "learning_rate": 4.123693773460426e-06, "epoch": 0.34425992779783393, "percentage": 17.23, "elapsed_time": "3:02:47", "remaining_time": "14:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 299, "total_steps": 1730, "loss": 0.852, "learning_rate": 4.126118647207383e-06, "epoch": 0.34541516245487364, "percentage": 17.28, "elapsed_time": "3:03:20", "remaining_time": "14:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 1730, "loss": 0.8335, "learning_rate": 4.128535424532771e-06, "epoch": 0.34657039711191334, "percentage": 17.34, "elapsed_time": "3:03:54", "remaining_time": "14:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 301, "total_steps": 1730, "loss": 0.8373, "learning_rate": 4.130944159323072e-06, "epoch": 0.34772563176895305, "percentage": 17.4, "elapsed_time": "3:04:28", "remaining_time": "14:35:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 302, "total_steps": 1730, "loss": 0.839, "learning_rate": 4.133344904928585e-06, "epoch": 0.34888086642599275, "percentage": 17.46, "elapsed_time": "3:05:01", "remaining_time": "14:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 303, "total_steps": 1730, "loss": 0.8691, "learning_rate": 4.135737714170509e-06, "epoch": 0.3500361010830325, "percentage": 17.51, "elapsed_time": "3:05:35", "remaining_time": "14:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 304, "total_steps": 1730, "loss": 0.839, "learning_rate": 4.138122639347924e-06, "epoch": 0.3511913357400722, "percentage": 17.57, "elapsed_time": "3:06:08", "remaining_time": "14:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 305, "total_steps": 1730, "loss": 0.8585, "learning_rate": 4.140499732244644e-06, "epoch": 0.3523465703971119, "percentage": 17.63, "elapsed_time": "3:06:42", "remaining_time": "14:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 306, "total_steps": 1730, "loss": 0.8369, "learning_rate": 4.142869044135967e-06, "epoch": 0.35350180505415163, "percentage": 17.69, "elapsed_time": "3:07:17", "remaining_time": "14:31:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 307, "total_steps": 1730, "loss": 0.8578, "learning_rate": 4.145230625795312e-06, "epoch": 0.35465703971119134, "percentage": 17.75, "elapsed_time": "3:07:51", "remaining_time": "14:30:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 308, "total_steps": 1730, "loss": 0.8727, "learning_rate": 4.147584527500741e-06, "epoch": 0.35581227436823104, "percentage": 17.8, "elapsed_time": "3:08:25", "remaining_time": "14:29:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 309, "total_steps": 1730, "loss": 0.8026, "learning_rate": 4.149930799041391e-06, "epoch": 0.35696750902527075, "percentage": 17.86, "elapsed_time": "3:08:58", "remaining_time": "14:29:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 1730, "loss": 0.8309, "learning_rate": 4.152269489723789e-06, "epoch": 0.35812274368231045, "percentage": 17.92, "elapsed_time": "3:09:32", "remaining_time": "14:28:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 311, "total_steps": 1730, "loss": 0.8524, "learning_rate": 4.154600648378063e-06, "epoch": 0.35927797833935016, "percentage": 17.98, "elapsed_time": "3:10:06", "remaining_time": "14:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 312, "total_steps": 1730, "loss": 0.8485, "learning_rate": 4.156924323364072e-06, "epoch": 0.3604332129963899, "percentage": 18.03, "elapsed_time": "3:10:41", "remaining_time": "14:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 313, "total_steps": 1730, "loss": 0.8654, "learning_rate": 4.159240562577414e-06, "epoch": 0.3615884476534296, "percentage": 18.09, "elapsed_time": "3:11:15", "remaining_time": "14:25:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 314, "total_steps": 1730, "loss": 0.8492, "learning_rate": 4.1615494134553584e-06, "epoch": 0.36274368231046933, "percentage": 18.15, "elapsed_time": "3:11:49", "remaining_time": "14:25:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 1730, "loss": 0.818, "learning_rate": 4.163850922982668e-06, "epoch": 0.36389891696750903, "percentage": 18.21, "elapsed_time": "3:12:23", "remaining_time": "14:24:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 316, "total_steps": 1730, "loss": 0.8586, "learning_rate": 4.166145137697341e-06, "epoch": 0.36505415162454874, "percentage": 18.27, "elapsed_time": "3:12:57", "remaining_time": "14:23:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 317, "total_steps": 1730, "loss": 0.8468, "learning_rate": 4.1684321036962525e-06, "epoch": 0.36620938628158844, "percentage": 18.32, "elapsed_time": "3:13:31", "remaining_time": "14:22:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 318, "total_steps": 1730, "loss": 0.8688, "learning_rate": 4.170711866640721e-06, "epoch": 0.36736462093862815, "percentage": 18.38, "elapsed_time": "3:14:05", "remaining_time": "14:21:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 319, "total_steps": 1730, "loss": 0.8521, "learning_rate": 4.172984471761969e-06, "epoch": 0.36851985559566786, "percentage": 18.44, "elapsed_time": "3:14:38", "remaining_time": "14:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 1730, "loss": 0.829, "learning_rate": 4.17524996386651e-06, "epoch": 0.36967509025270756, "percentage": 18.5, "elapsed_time": "3:15:12", "remaining_time": "14:20:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 321, "total_steps": 1730, "loss": 0.8676, "learning_rate": 4.177508387341454e-06, "epoch": 0.37083032490974727, "percentage": 18.55, "elapsed_time": "3:15:46", "remaining_time": "14:19:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 322, "total_steps": 1730, "loss": 0.8516, "learning_rate": 4.179759786159719e-06, "epoch": 0.371985559566787, "percentage": 18.61, "elapsed_time": "3:16:20", "remaining_time": "14:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 323, "total_steps": 1730, "loss": 0.8606, "learning_rate": 4.182004203885172e-06, "epoch": 0.37314079422382673, "percentage": 18.67, "elapsed_time": "3:16:54", "remaining_time": "14:17:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 324, "total_steps": 1730, "loss": 0.8272, "learning_rate": 4.1842416836776876e-06, "epoch": 0.37429602888086644, "percentage": 18.73, "elapsed_time": "3:17:28", "remaining_time": "14:16:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 325, "total_steps": 1730, "loss": 0.8438, "learning_rate": 4.1864722682981245e-06, "epoch": 0.37545126353790614, "percentage": 18.79, "elapsed_time": "3:18:02", "remaining_time": "14:16:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 326, "total_steps": 1730, "loss": 0.8485, "learning_rate": 4.188696000113232e-06, "epoch": 0.37660649819494585, "percentage": 18.84, "elapsed_time": "3:18:35", "remaining_time": "14:15:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 327, "total_steps": 1730, "loss": 0.8184, "learning_rate": 4.190912921100477e-06, "epoch": 0.37776173285198555, "percentage": 18.9, "elapsed_time": "3:19:09", "remaining_time": "14:14:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 328, "total_steps": 1730, "loss": 0.8609, "learning_rate": 4.193123072852799e-06, "epoch": 0.37891696750902526, "percentage": 18.96, "elapsed_time": "3:19:43", "remaining_time": "14:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 329, "total_steps": 1730, "loss": 0.8302, "learning_rate": 4.1953264965832905e-06, "epoch": 0.38007220216606497, "percentage": 19.02, "elapsed_time": "3:20:17", "remaining_time": "14:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 1730, "loss": 0.8491, "learning_rate": 4.197523233129813e-06, "epoch": 0.38122743682310467, "percentage": 19.08, "elapsed_time": "3:20:51", "remaining_time": "14:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 331, "total_steps": 1730, "loss": 0.8404, "learning_rate": 4.199713322959531e-06, "epoch": 0.38238267148014443, "percentage": 19.13, "elapsed_time": "3:21:24", "remaining_time": "14:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 332, "total_steps": 1730, "loss": 0.8558, "learning_rate": 4.201896806173394e-06, "epoch": 0.38353790613718414, "percentage": 19.19, "elapsed_time": "3:21:58", "remaining_time": "14:10:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 333, "total_steps": 1730, "loss": 0.8747, "learning_rate": 4.204073722510534e-06, "epoch": 0.38469314079422384, "percentage": 19.25, "elapsed_time": "3:22:33", "remaining_time": "14:09:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 334, "total_steps": 1730, "loss": 0.8521, "learning_rate": 4.206244111352608e-06, "epoch": 0.38584837545126355, "percentage": 19.31, "elapsed_time": "3:23:08", "remaining_time": "14:09:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 335, "total_steps": 1730, "loss": 0.8548, "learning_rate": 4.208408011728075e-06, "epoch": 0.38700361010830325, "percentage": 19.36, "elapsed_time": "3:23:42", "remaining_time": "14:08:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 336, "total_steps": 1730, "loss": 0.8474, "learning_rate": 4.210565462316407e-06, "epoch": 0.38815884476534296, "percentage": 19.42, "elapsed_time": "3:24:16", "remaining_time": "14:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 337, "total_steps": 1730, "loss": 0.8318, "learning_rate": 4.212716501452232e-06, "epoch": 0.38931407942238266, "percentage": 19.48, "elapsed_time": "3:24:50", "remaining_time": "14:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 338, "total_steps": 1730, "loss": 0.8558, "learning_rate": 4.214861167129425e-06, "epoch": 0.39046931407942237, "percentage": 19.54, "elapsed_time": "3:25:23", "remaining_time": "14:05:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 339, "total_steps": 1730, "loss": 0.8436, "learning_rate": 4.216999497005137e-06, "epoch": 0.3916245487364621, "percentage": 19.6, "elapsed_time": "3:25:57", "remaining_time": "14:05:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 1730, "loss": 0.845, "learning_rate": 4.219131528403759e-06, "epoch": 0.3927797833935018, "percentage": 19.65, "elapsed_time": "3:26:31", "remaining_time": "14:04:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 341, "total_steps": 1730, "loss": 0.8411, "learning_rate": 4.22125729832083e-06, "epoch": 0.39393501805054154, "percentage": 19.71, "elapsed_time": "3:27:05", "remaining_time": "14:03:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 342, "total_steps": 1730, "loss": 0.8485, "learning_rate": 4.223376843426892e-06, "epoch": 0.39509025270758125, "percentage": 19.77, "elapsed_time": "3:27:38", "remaining_time": "14:02:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 343, "total_steps": 1730, "loss": 0.8571, "learning_rate": 4.225490200071284e-06, "epoch": 0.39624548736462095, "percentage": 19.83, "elapsed_time": "3:28:13", "remaining_time": "14:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 344, "total_steps": 1730, "loss": 0.8426, "learning_rate": 4.227597404285883e-06, "epoch": 0.39740072202166066, "percentage": 19.88, "elapsed_time": "3:28:46", "remaining_time": "14:01:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 345, "total_steps": 1730, "loss": 0.876, "learning_rate": 4.229698491788791e-06, "epoch": 0.39855595667870036, "percentage": 19.94, "elapsed_time": "3:29:20", "remaining_time": "14:00:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 346, "total_steps": 1730, "loss": 0.861, "learning_rate": 4.231793497987962e-06, "epoch": 0.39971119133574007, "percentage": 20.0, "elapsed_time": "3:29:54", "remaining_time": "13:59:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 347, "total_steps": 1730, "loss": 0.8645, "learning_rate": 4.233882457984791e-06, "epoch": 0.4008664259927798, "percentage": 20.06, "elapsed_time": "3:30:27", "remaining_time": "13:58:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 348, "total_steps": 1730, "loss": 0.8447, "learning_rate": 4.235965406577636e-06, "epoch": 0.4020216606498195, "percentage": 20.12, "elapsed_time": "3:31:01", "remaining_time": "13:58:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 349, "total_steps": 1730, "loss": 0.8425, "learning_rate": 4.2380423782653e-06, "epoch": 0.4031768953068592, "percentage": 20.17, "elapsed_time": "3:31:35", "remaining_time": "13:57:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 1730, "loss": 0.8307, "learning_rate": 4.2401134072504595e-06, "epoch": 0.4043321299638989, "percentage": 20.23, "elapsed_time": "3:32:09", "remaining_time": "13:56:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 351, "total_steps": 1730, "loss": 0.8237, "learning_rate": 4.24217852744304e-06, "epoch": 0.40548736462093865, "percentage": 20.29, "elapsed_time": "3:32:43", "remaining_time": "13:55:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 352, "total_steps": 1730, "loss": 0.8605, "learning_rate": 4.244237772463552e-06, "epoch": 0.40664259927797836, "percentage": 20.35, "elapsed_time": "3:33:17", "remaining_time": "13:54:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 353, "total_steps": 1730, "loss": 0.8357, "learning_rate": 4.246291175646372e-06, "epoch": 0.40779783393501806, "percentage": 20.4, "elapsed_time": "3:33:51", "remaining_time": "13:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 354, "total_steps": 1730, "loss": 0.8348, "learning_rate": 4.2483387700429804e-06, "epoch": 0.40895306859205777, "percentage": 20.46, "elapsed_time": "3:34:26", "remaining_time": "13:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 355, "total_steps": 1730, "loss": 0.8392, "learning_rate": 4.2503805884251575e-06, "epoch": 0.41010830324909747, "percentage": 20.52, "elapsed_time": "3:35:00", "remaining_time": "13:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 356, "total_steps": 1730, "loss": 0.8405, "learning_rate": 4.252416663288126e-06, "epoch": 0.4112635379061372, "percentage": 20.58, "elapsed_time": "3:35:34", "remaining_time": "13:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 357, "total_steps": 1730, "loss": 0.8374, "learning_rate": 4.2544470268536555e-06, "epoch": 0.4124187725631769, "percentage": 20.64, "elapsed_time": "3:36:07", "remaining_time": "13:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 358, "total_steps": 1730, "loss": 0.8442, "learning_rate": 4.2564717110731246e-06, "epoch": 0.4135740072202166, "percentage": 20.69, "elapsed_time": "3:36:41", "remaining_time": "13:50:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 359, "total_steps": 1730, "loss": 0.8273, "learning_rate": 4.258490747630532e-06, "epoch": 0.4147292418772563, "percentage": 20.75, "elapsed_time": "3:37:15", "remaining_time": "13:49:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 1730, "loss": 0.8664, "learning_rate": 4.26050416794548e-06, "epoch": 0.41588447653429605, "percentage": 20.81, "elapsed_time": "3:37:49", "remaining_time": "13:48:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 361, "total_steps": 1730, "loss": 0.8351, "learning_rate": 4.262512003176097e-06, "epoch": 0.41703971119133576, "percentage": 20.87, "elapsed_time": "3:38:22", "remaining_time": "13:48:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 362, "total_steps": 1730, "loss": 0.8419, "learning_rate": 4.264514284221944e-06, "epoch": 0.41819494584837547, "percentage": 20.92, "elapsed_time": "3:38:56", "remaining_time": "13:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 363, "total_steps": 1730, "loss": 0.84, "learning_rate": 4.2665110417268545e-06, "epoch": 0.41935018050541517, "percentage": 20.98, "elapsed_time": "3:39:30", "remaining_time": "13:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 364, "total_steps": 1730, "loss": 0.8483, "learning_rate": 4.26850230608176e-06, "epoch": 0.4205054151624549, "percentage": 21.04, "elapsed_time": "3:40:04", "remaining_time": "13:45:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 365, "total_steps": 1730, "loss": 0.8371, "learning_rate": 4.270488107427459e-06, "epoch": 0.4216606498194946, "percentage": 21.1, "elapsed_time": "3:40:38", "remaining_time": "13:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 366, "total_steps": 1730, "loss": 0.8448, "learning_rate": 4.272468475657351e-06, "epoch": 0.4228158844765343, "percentage": 21.16, "elapsed_time": "3:41:12", "remaining_time": "13:44:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 367, "total_steps": 1730, "loss": 0.8522, "learning_rate": 4.27444344042015e-06, "epoch": 0.423971119133574, "percentage": 21.21, "elapsed_time": "3:41:46", "remaining_time": "13:43:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 368, "total_steps": 1730, "loss": 0.8348, "learning_rate": 4.27641303112253e-06, "epoch": 0.4251263537906137, "percentage": 21.27, "elapsed_time": "3:42:20", "remaining_time": "13:42:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 369, "total_steps": 1730, "loss": 0.8376, "learning_rate": 4.278377276931768e-06, "epoch": 0.4262815884476534, "percentage": 21.33, "elapsed_time": "3:42:54", "remaining_time": "13:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 1730, "loss": 0.8435, "learning_rate": 4.280336206778326e-06, "epoch": 0.42743682310469316, "percentage": 21.39, "elapsed_time": "3:43:27", "remaining_time": "13:41:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 371, "total_steps": 1730, "loss": 0.8374, "learning_rate": 4.2822898493584105e-06, "epoch": 0.42859205776173287, "percentage": 21.45, "elapsed_time": "3:44:01", "remaining_time": "13:40:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 372, "total_steps": 1730, "loss": 0.8169, "learning_rate": 4.2842382331364965e-06, "epoch": 0.4297472924187726, "percentage": 21.5, "elapsed_time": "3:44:34", "remaining_time": "13:39:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 373, "total_steps": 1730, "loss": 0.8561, "learning_rate": 4.2861813863478135e-06, "epoch": 0.4309025270758123, "percentage": 21.56, "elapsed_time": "3:45:08", "remaining_time": "13:39:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 374, "total_steps": 1730, "loss": 0.8299, "learning_rate": 4.288119337000801e-06, "epoch": 0.432057761732852, "percentage": 21.62, "elapsed_time": "3:45:42", "remaining_time": "13:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 375, "total_steps": 1730, "loss": 0.8273, "learning_rate": 4.290052112879532e-06, "epoch": 0.4332129963898917, "percentage": 21.68, "elapsed_time": "3:46:16", "remaining_time": "13:37:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 376, "total_steps": 1730, "loss": 0.8215, "learning_rate": 4.291979741546102e-06, "epoch": 0.4343682310469314, "percentage": 21.73, "elapsed_time": "3:46:49", "remaining_time": "13:36:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 377, "total_steps": 1730, "loss": 0.871, "learning_rate": 4.293902250342989e-06, "epoch": 0.4355234657039711, "percentage": 21.79, "elapsed_time": "3:47:23", "remaining_time": "13:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 378, "total_steps": 1730, "loss": 0.8582, "learning_rate": 4.295819666395376e-06, "epoch": 0.4366787003610108, "percentage": 21.85, "elapsed_time": "3:47:58", "remaining_time": "13:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 379, "total_steps": 1730, "loss": 0.8288, "learning_rate": 4.297732016613455e-06, "epoch": 0.43783393501805057, "percentage": 21.91, "elapsed_time": "3:48:32", "remaining_time": "13:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 1730, "loss": 0.8574, "learning_rate": 4.299639327694684e-06, "epoch": 0.4389891696750903, "percentage": 21.97, "elapsed_time": "3:49:06", "remaining_time": "13:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 381, "total_steps": 1730, "loss": 0.8337, "learning_rate": 4.301541626126033e-06, "epoch": 0.44014440433213, "percentage": 22.02, "elapsed_time": "3:49:40", "remaining_time": "13:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 382, "total_steps": 1730, "loss": 0.8388, "learning_rate": 4.303438938186182e-06, "epoch": 0.4412996389891697, "percentage": 22.08, "elapsed_time": "3:50:14", "remaining_time": "13:32:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 383, "total_steps": 1730, "loss": 0.8381, "learning_rate": 4.305331289947705e-06, "epoch": 0.4424548736462094, "percentage": 22.14, "elapsed_time": "3:50:48", "remaining_time": "13:31:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 384, "total_steps": 1730, "loss": 0.8297, "learning_rate": 4.307218707279219e-06, "epoch": 0.4436101083032491, "percentage": 22.2, "elapsed_time": "3:51:22", "remaining_time": "13:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 385, "total_steps": 1730, "loss": 0.8464, "learning_rate": 4.309101215847502e-06, "epoch": 0.4447653429602888, "percentage": 22.25, "elapsed_time": "3:51:56", "remaining_time": "13:30:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 386, "total_steps": 1730, "loss": 0.8307, "learning_rate": 4.310978841119592e-06, "epoch": 0.4459205776173285, "percentage": 22.31, "elapsed_time": "3:52:30", "remaining_time": "13:29:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 387, "total_steps": 1730, "loss": 0.8342, "learning_rate": 4.312851608364853e-06, "epoch": 0.4470758122743682, "percentage": 22.37, "elapsed_time": "3:53:04", "remaining_time": "13:28:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 388, "total_steps": 1730, "loss": 0.839, "learning_rate": 4.3147195426570124e-06, "epoch": 0.4482310469314079, "percentage": 22.43, "elapsed_time": "3:53:39", "remaining_time": "13:28:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 389, "total_steps": 1730, "loss": 0.8602, "learning_rate": 4.31658266887618e-06, "epoch": 0.4493862815884477, "percentage": 22.49, "elapsed_time": "3:54:13", "remaining_time": "13:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 1730, "loss": 0.8374, "learning_rate": 4.318441011710832e-06, "epoch": 0.4505415162454874, "percentage": 22.54, "elapsed_time": "3:54:47", "remaining_time": "13:26:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 391, "total_steps": 1730, "loss": 0.8458, "learning_rate": 4.3202945956597785e-06, "epoch": 0.4516967509025271, "percentage": 22.6, "elapsed_time": "3:55:21", "remaining_time": "13:25:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 392, "total_steps": 1730, "loss": 0.8238, "learning_rate": 4.322143445034095e-06, "epoch": 0.4528519855595668, "percentage": 22.66, "elapsed_time": "3:55:54", "remaining_time": "13:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 393, "total_steps": 1730, "loss": 0.8371, "learning_rate": 4.323987583959045e-06, "epoch": 0.4540072202166065, "percentage": 22.72, "elapsed_time": "3:56:29", "remaining_time": "13:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 394, "total_steps": 1730, "loss": 0.8201, "learning_rate": 4.325827036375958e-06, "epoch": 0.4551624548736462, "percentage": 22.77, "elapsed_time": "3:57:03", "remaining_time": "13:23:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 395, "total_steps": 1730, "loss": 0.8385, "learning_rate": 4.327661826044101e-06, "epoch": 0.4563176895306859, "percentage": 22.83, "elapsed_time": "3:57:37", "remaining_time": "13:23:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 396, "total_steps": 1730, "loss": 0.8013, "learning_rate": 4.329491976542521e-06, "epoch": 0.4574729241877256, "percentage": 22.89, "elapsed_time": "3:58:11", "remaining_time": "13:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 397, "total_steps": 1730, "loss": 0.8228, "learning_rate": 4.3313175112718595e-06, "epoch": 0.4586281588447653, "percentage": 22.95, "elapsed_time": "3:58:45", "remaining_time": "13:21:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 398, "total_steps": 1730, "loss": 0.8336, "learning_rate": 4.333138453456147e-06, "epoch": 0.459783393501805, "percentage": 23.01, "elapsed_time": "3:59:19", "remaining_time": "13:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 399, "total_steps": 1730, "loss": 0.8417, "learning_rate": 4.334954826144581e-06, "epoch": 0.4609386281588448, "percentage": 23.06, "elapsed_time": "3:59:53", "remaining_time": "13:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 1730, "loss": 0.843, "learning_rate": 4.336766652213271e-06, "epoch": 0.4620938628158845, "percentage": 23.12, "elapsed_time": "4:00:26", "remaining_time": "13:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 401, "total_steps": 1730, "loss": 0.8301, "learning_rate": 4.3385739543669715e-06, "epoch": 0.4632490974729242, "percentage": 23.18, "elapsed_time": "4:01:00", "remaining_time": "13:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 402, "total_steps": 1730, "loss": 0.8497, "learning_rate": 4.340376755140784e-06, "epoch": 0.4644043321299639, "percentage": 23.24, "elapsed_time": "4:01:35", "remaining_time": "13:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 403, "total_steps": 1730, "loss": 0.8252, "learning_rate": 4.34217507690185e-06, "epoch": 0.4655595667870036, "percentage": 23.29, "elapsed_time": "4:02:09", "remaining_time": "13:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 404, "total_steps": 1730, "loss": 0.8312, "learning_rate": 4.343968941851009e-06, "epoch": 0.4667148014440433, "percentage": 23.35, "elapsed_time": "4:02:43", "remaining_time": "13:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 405, "total_steps": 1730, "loss": 0.8177, "learning_rate": 4.345758372024448e-06, "epoch": 0.467870036101083, "percentage": 23.41, "elapsed_time": "4:03:17", "remaining_time": "13:15:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 406, "total_steps": 1730, "loss": 0.8258, "learning_rate": 4.347543389295324e-06, "epoch": 0.4690252707581227, "percentage": 23.47, "elapsed_time": "4:03:50", "remaining_time": "13:15:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 407, "total_steps": 1730, "loss": 0.8379, "learning_rate": 4.3493240153753665e-06, "epoch": 0.47018050541516243, "percentage": 23.53, "elapsed_time": "4:04:25", "remaining_time": "13:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 408, "total_steps": 1730, "loss": 0.8396, "learning_rate": 4.3511002718164665e-06, "epoch": 0.4713357400722022, "percentage": 23.58, "elapsed_time": "4:04:59", "remaining_time": "13:13:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 409, "total_steps": 1730, "loss": 0.8381, "learning_rate": 4.352872180012237e-06, "epoch": 0.4724909747292419, "percentage": 23.64, "elapsed_time": "4:05:32", "remaining_time": "13:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 1730, "loss": 0.8333, "learning_rate": 4.35463976119956e-06, "epoch": 0.4736462093862816, "percentage": 23.7, "elapsed_time": "4:06:07", "remaining_time": "13:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 411, "total_steps": 1730, "loss": 0.8191, "learning_rate": 4.356403036460116e-06, "epoch": 0.4748014440433213, "percentage": 23.76, "elapsed_time": "4:06:40", "remaining_time": "13:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 412, "total_steps": 1730, "loss": 0.8225, "learning_rate": 4.358162026721892e-06, "epoch": 0.475956678700361, "percentage": 23.82, "elapsed_time": "4:07:15", "remaining_time": "13:10:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 413, "total_steps": 1730, "loss": 0.804, "learning_rate": 4.359916752760669e-06, "epoch": 0.4771119133574007, "percentage": 23.87, "elapsed_time": "4:07:49", "remaining_time": "13:10:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 414, "total_steps": 1730, "loss": 0.8286, "learning_rate": 4.361667235201499e-06, "epoch": 0.4782671480144404, "percentage": 23.93, "elapsed_time": "4:08:22", "remaining_time": "13:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 415, "total_steps": 1730, "loss": 0.8229, "learning_rate": 4.363413494520154e-06, "epoch": 0.47942238267148013, "percentage": 23.99, "elapsed_time": "4:08:56", "remaining_time": "13:08:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 416, "total_steps": 1730, "loss": 0.8397, "learning_rate": 4.365155551044572e-06, "epoch": 0.48057761732851983, "percentage": 24.05, "elapsed_time": "4:09:29", "remaining_time": "13:08:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 417, "total_steps": 1730, "loss": 0.8356, "learning_rate": 4.366893424956263e-06, "epoch": 0.48173285198555954, "percentage": 24.1, "elapsed_time": "4:10:03", "remaining_time": "13:07:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 418, "total_steps": 1730, "loss": 0.8342, "learning_rate": 4.368627136291726e-06, "epoch": 0.4828880866425993, "percentage": 24.16, "elapsed_time": "4:10:37", "remaining_time": "13:06:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 419, "total_steps": 1730, "loss": 0.8481, "learning_rate": 4.370356704943825e-06, "epoch": 0.484043321299639, "percentage": 24.22, "elapsed_time": "4:11:10", "remaining_time": "13:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 1730, "loss": 0.8375, "learning_rate": 4.372082150663167e-06, "epoch": 0.4851985559566787, "percentage": 24.28, "elapsed_time": "4:11:44", "remaining_time": "13:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 421, "total_steps": 1730, "loss": 0.8259, "learning_rate": 4.3738034930594475e-06, "epoch": 0.4863537906137184, "percentage": 24.34, "elapsed_time": "4:12:17", "remaining_time": "13:04:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 422, "total_steps": 1730, "loss": 0.8394, "learning_rate": 4.3755207516027904e-06, "epoch": 0.4875090252707581, "percentage": 24.39, "elapsed_time": "4:12:52", "remaining_time": "13:03:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 423, "total_steps": 1730, "loss": 0.82, "learning_rate": 4.3772339456250705e-06, "epoch": 0.48866425992779783, "percentage": 24.45, "elapsed_time": "4:13:26", "remaining_time": "13:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 424, "total_steps": 1730, "loss": 0.8223, "learning_rate": 4.3789430943212215e-06, "epoch": 0.48981949458483753, "percentage": 24.51, "elapsed_time": "4:13:59", "remaining_time": "13:02:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 425, "total_steps": 1730, "loss": 0.8316, "learning_rate": 4.38064821675052e-06, "epoch": 0.49097472924187724, "percentage": 24.57, "elapsed_time": "4:14:33", "remaining_time": "13:01:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 426, "total_steps": 1730, "loss": 0.8497, "learning_rate": 4.382349331837865e-06, "epoch": 0.49212996389891694, "percentage": 24.62, "elapsed_time": "4:15:06", "remaining_time": "13:00:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 427, "total_steps": 1730, "loss": 0.8224, "learning_rate": 4.38404645837504e-06, "epoch": 0.4932851985559567, "percentage": 24.68, "elapsed_time": "4:15:41", "remaining_time": "13:00:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 428, "total_steps": 1730, "loss": 0.8055, "learning_rate": 4.385739615021954e-06, "epoch": 0.4944404332129964, "percentage": 24.74, "elapsed_time": "4:16:15", "remaining_time": "12:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 429, "total_steps": 1730, "loss": 0.85, "learning_rate": 4.387428820307874e-06, "epoch": 0.4955956678700361, "percentage": 24.8, "elapsed_time": "4:16:48", "remaining_time": "12:58:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 1730, "loss": 0.8343, "learning_rate": 4.389114092632645e-06, "epoch": 0.4967509025270758, "percentage": 24.86, "elapsed_time": "4:17:22", "remaining_time": "12:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 431, "total_steps": 1730, "loss": 0.8457, "learning_rate": 4.390795450267887e-06, "epoch": 0.4979061371841155, "percentage": 24.91, "elapsed_time": "4:17:56", "remaining_time": "12:57:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 432, "total_steps": 1730, "loss": 0.8307, "learning_rate": 4.392472911358188e-06, "epoch": 0.49906137184115523, "percentage": 24.97, "elapsed_time": "4:18:30", "remaining_time": "12:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 433, "total_steps": 1730, "loss": 0.8565, "learning_rate": 4.394146493922276e-06, "epoch": 0.500216606498195, "percentage": 25.03, "elapsed_time": "4:19:04", "remaining_time": "12:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 434, "total_steps": 1730, "loss": 0.8364, "learning_rate": 4.395816215854185e-06, "epoch": 0.5013718411552347, "percentage": 25.09, "elapsed_time": "4:19:38", "remaining_time": "12:55:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 435, "total_steps": 1730, "loss": 0.8266, "learning_rate": 4.397482094924396e-06, "epoch": 0.5025270758122744, "percentage": 25.14, "elapsed_time": "4:20:11", "remaining_time": "12:54:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 436, "total_steps": 1730, "loss": 0.8181, "learning_rate": 4.3991441487809775e-06, "epoch": 0.5036823104693141, "percentage": 25.2, "elapsed_time": "4:20:45", "remaining_time": "12:53:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 437, "total_steps": 1730, "loss": 0.7895, "learning_rate": 4.400802394950703e-06, "epoch": 0.5048375451263538, "percentage": 25.26, "elapsed_time": "4:21:19", "remaining_time": "12:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 438, "total_steps": 1730, "loss": 0.8364, "learning_rate": 4.402456850840167e-06, "epoch": 0.5059927797833935, "percentage": 25.32, "elapsed_time": "4:21:53", "remaining_time": "12:52:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 439, "total_steps": 1730, "loss": 0.8449, "learning_rate": 4.4041075337368695e-06, "epoch": 0.5071480144404332, "percentage": 25.38, "elapsed_time": "4:22:27", "remaining_time": "12:51:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 1730, "loss": 0.8422, "learning_rate": 4.405754460810312e-06, "epoch": 0.5083032490974729, "percentage": 25.43, "elapsed_time": "4:23:00", "remaining_time": "12:51:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 441, "total_steps": 1730, "loss": 0.851, "learning_rate": 4.407397649113065e-06, "epoch": 0.5094584837545126, "percentage": 25.49, "elapsed_time": "4:23:34", "remaining_time": "12:50:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 442, "total_steps": 1730, "loss": 0.8238, "learning_rate": 4.40903711558182e-06, "epoch": 0.5106137184115523, "percentage": 25.55, "elapsed_time": "4:24:08", "remaining_time": "12:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 443, "total_steps": 1730, "loss": 0.848, "learning_rate": 4.41067287703845e-06, "epoch": 0.511768953068592, "percentage": 25.61, "elapsed_time": "4:24:42", "remaining_time": "12:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 444, "total_steps": 1730, "loss": 0.8171, "learning_rate": 4.4123049501910335e-06, "epoch": 0.5129241877256318, "percentage": 25.66, "elapsed_time": "4:25:16", "remaining_time": "12:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 445, "total_steps": 1730, "loss": 0.8338, "learning_rate": 4.4139333516348865e-06, "epoch": 0.5140794223826715, "percentage": 25.72, "elapsed_time": "4:25:50", "remaining_time": "12:47:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 446, "total_steps": 1730, "loss": 0.8164, "learning_rate": 4.415558097853571e-06, "epoch": 0.5152346570397112, "percentage": 25.78, "elapsed_time": "4:26:24", "remaining_time": "12:46:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 447, "total_steps": 1730, "loss": 0.8414, "learning_rate": 4.4171792052198945e-06, "epoch": 0.5163898916967509, "percentage": 25.84, "elapsed_time": "4:26:57", "remaining_time": "12:46:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 448, "total_steps": 1730, "loss": 0.8043, "learning_rate": 4.418796689996907e-06, "epoch": 0.5175451263537906, "percentage": 25.9, "elapsed_time": "4:27:31", "remaining_time": "12:45:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 449, "total_steps": 1730, "loss": 0.8499, "learning_rate": 4.420410568338873e-06, "epoch": 0.5187003610108303, "percentage": 25.95, "elapsed_time": "4:28:05", "remaining_time": "12:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 1730, "loss": 0.8331, "learning_rate": 4.42202085629224e-06, "epoch": 0.51985559566787, "percentage": 26.01, "elapsed_time": "4:28:38", "remaining_time": "12:44:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 451, "total_steps": 1730, "loss": 0.8265, "learning_rate": 4.423627569796601e-06, "epoch": 0.5210108303249098, "percentage": 26.07, "elapsed_time": "4:29:12", "remaining_time": "12:43:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 452, "total_steps": 1730, "loss": 0.8276, "learning_rate": 4.425230724685638e-06, "epoch": 0.5221660649819495, "percentage": 26.13, "elapsed_time": "4:29:46", "remaining_time": "12:42:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 453, "total_steps": 1730, "loss": 0.8575, "learning_rate": 4.426830336688054e-06, "epoch": 0.5233212996389892, "percentage": 26.18, "elapsed_time": "4:30:20", "remaining_time": "12:42:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 454, "total_steps": 1730, "loss": 0.8255, "learning_rate": 4.428426421428507e-06, "epoch": 0.5244765342960289, "percentage": 26.24, "elapsed_time": "4:30:53", "remaining_time": "12:41:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 455, "total_steps": 1730, "loss": 0.8397, "learning_rate": 4.430018994428521e-06, "epoch": 0.5256317689530686, "percentage": 26.3, "elapsed_time": "4:31:28", "remaining_time": "12:40:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 456, "total_steps": 1730, "loss": 0.8377, "learning_rate": 4.431608071107392e-06, "epoch": 0.5267870036101083, "percentage": 26.36, "elapsed_time": "4:32:01", "remaining_time": "12:40:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 457, "total_steps": 1730, "loss": 0.8257, "learning_rate": 4.433193666783084e-06, "epoch": 0.527942238267148, "percentage": 26.42, "elapsed_time": "4:32:36", "remaining_time": "12:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 458, "total_steps": 1730, "loss": 0.8455, "learning_rate": 4.434775796673116e-06, "epoch": 0.5290974729241877, "percentage": 26.47, "elapsed_time": "4:33:09", "remaining_time": "12:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 459, "total_steps": 1730, "loss": 0.8263, "learning_rate": 4.4363544758954355e-06, "epoch": 0.5302527075812274, "percentage": 26.53, "elapsed_time": "4:33:43", "remaining_time": "12:37:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 1730, "loss": 0.8546, "learning_rate": 4.437929719469291e-06, "epoch": 0.5314079422382672, "percentage": 26.59, "elapsed_time": "4:34:18", "remaining_time": "12:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 461, "total_steps": 1730, "loss": 0.8367, "learning_rate": 4.439501542316081e-06, "epoch": 0.5325631768953069, "percentage": 26.65, "elapsed_time": "4:34:52", "remaining_time": "12:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 462, "total_steps": 1730, "loss": 0.8443, "learning_rate": 4.44106995926021e-06, "epoch": 0.5337184115523466, "percentage": 26.71, "elapsed_time": "4:35:26", "remaining_time": "12:35:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 463, "total_steps": 1730, "loss": 0.8341, "learning_rate": 4.442634985029922e-06, "epoch": 0.5348736462093863, "percentage": 26.76, "elapsed_time": "4:35:59", "remaining_time": "12:35:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 464, "total_steps": 1730, "loss": 0.8427, "learning_rate": 4.444196634258136e-06, "epoch": 0.536028880866426, "percentage": 26.82, "elapsed_time": "4:36:33", "remaining_time": "12:34:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 465, "total_steps": 1730, "loss": 0.8441, "learning_rate": 4.445754921483257e-06, "epoch": 0.5371841155234657, "percentage": 26.88, "elapsed_time": "4:37:07", "remaining_time": "12:33:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 466, "total_steps": 1730, "loss": 0.8342, "learning_rate": 4.44730986115e-06, "epoch": 0.5383393501805054, "percentage": 26.94, "elapsed_time": "4:37:41", "remaining_time": "12:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 467, "total_steps": 1730, "loss": 0.8453, "learning_rate": 4.448861467610187e-06, "epoch": 0.5394945848375451, "percentage": 26.99, "elapsed_time": "4:38:15", "remaining_time": "12:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 468, "total_steps": 1730, "loss": 0.8468, "learning_rate": 4.450409755123541e-06, "epoch": 0.5406498194945848, "percentage": 27.05, "elapsed_time": "4:38:48", "remaining_time": "12:31:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 469, "total_steps": 1730, "loss": 0.8352, "learning_rate": 4.4519547378584725e-06, "epoch": 0.5418050541516245, "percentage": 27.11, "elapsed_time": "4:39:22", "remaining_time": "12:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 1730, "loss": 0.8255, "learning_rate": 4.453496429892863e-06, "epoch": 0.5429602888086643, "percentage": 27.17, "elapsed_time": "4:39:56", "remaining_time": "12:30:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 471, "total_steps": 1730, "loss": 0.8033, "learning_rate": 4.455034845214828e-06, "epoch": 0.544115523465704, "percentage": 27.23, "elapsed_time": "4:40:30", "remaining_time": "12:29:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 472, "total_steps": 1730, "loss": 0.827, "learning_rate": 4.45656999772348e-06, "epoch": 0.5452707581227437, "percentage": 27.28, "elapsed_time": "4:41:04", "remaining_time": "12:29:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 473, "total_steps": 1730, "loss": 0.8585, "learning_rate": 4.458101901229686e-06, "epoch": 0.5464259927797834, "percentage": 27.34, "elapsed_time": "4:41:39", "remaining_time": "12:28:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 474, "total_steps": 1730, "loss": 0.8228, "learning_rate": 4.459630569456809e-06, "epoch": 0.5475812274368231, "percentage": 27.4, "elapsed_time": "4:42:12", "remaining_time": "12:27:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 475, "total_steps": 1730, "loss": 0.8308, "learning_rate": 4.461156016041445e-06, "epoch": 0.5487364620938628, "percentage": 27.46, "elapsed_time": "4:42:45", "remaining_time": "12:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 476, "total_steps": 1730, "loss": 0.841, "learning_rate": 4.4626782545341565e-06, "epoch": 0.5498916967509025, "percentage": 27.51, "elapsed_time": "4:43:20", "remaining_time": "12:26:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 477, "total_steps": 1730, "loss": 0.8265, "learning_rate": 4.4641972984001906e-06, "epoch": 0.5510469314079423, "percentage": 27.57, "elapsed_time": "4:43:53", "remaining_time": "12:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 478, "total_steps": 1730, "loss": 0.8231, "learning_rate": 4.465713161020199e-06, "epoch": 0.552202166064982, "percentage": 27.63, "elapsed_time": "4:44:27", "remaining_time": "12:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 479, "total_steps": 1730, "loss": 0.8266, "learning_rate": 4.46722585569094e-06, "epoch": 0.5533574007220217, "percentage": 27.69, "elapsed_time": "4:45:00", "remaining_time": "12:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 1730, "loss": 0.8296, "learning_rate": 4.468735395625979e-06, "epoch": 0.5545126353790614, "percentage": 27.75, "elapsed_time": "4:45:34", "remaining_time": "12:23:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 481, "total_steps": 1730, "loss": 0.8345, "learning_rate": 4.470241793956387e-06, "epoch": 0.5556678700361011, "percentage": 27.8, "elapsed_time": "4:46:08", "remaining_time": "12:23:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 482, "total_steps": 1730, "loss": 0.8371, "learning_rate": 4.471745063731417e-06, "epoch": 0.5568231046931408, "percentage": 27.86, "elapsed_time": "4:46:42", "remaining_time": "12:22:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 483, "total_steps": 1730, "loss": 0.8183, "learning_rate": 4.473245217919187e-06, "epoch": 0.5579783393501805, "percentage": 27.92, "elapsed_time": "4:47:15", "remaining_time": "12:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 484, "total_steps": 1730, "loss": 0.8317, "learning_rate": 4.474742269407355e-06, "epoch": 0.5591335740072202, "percentage": 27.98, "elapsed_time": "4:47:49", "remaining_time": "12:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 485, "total_steps": 1730, "loss": 0.8414, "learning_rate": 4.476236231003773e-06, "epoch": 0.5602888086642599, "percentage": 28.03, "elapsed_time": "4:48:22", "remaining_time": "12:20:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 486, "total_steps": 1730, "loss": 0.8004, "learning_rate": 4.477727115437156e-06, "epoch": 0.5614440433212996, "percentage": 28.09, "elapsed_time": "4:48:56", "remaining_time": "12:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 487, "total_steps": 1730, "loss": 0.7967, "learning_rate": 4.479214935357724e-06, "epoch": 0.5625992779783393, "percentage": 28.15, "elapsed_time": "4:49:30", "remaining_time": "12:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 488, "total_steps": 1730, "loss": 0.841, "learning_rate": 4.480699703337852e-06, "epoch": 0.563754512635379, "percentage": 28.21, "elapsed_time": "4:50:05", "remaining_time": "12:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 489, "total_steps": 1730, "loss": 0.8369, "learning_rate": 4.4821814318727016e-06, "epoch": 0.5649097472924187, "percentage": 28.27, "elapsed_time": "4:50:38", "remaining_time": "12:17:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 1730, "loss": 0.8405, "learning_rate": 4.4836601333808566e-06, "epoch": 0.5660649819494585, "percentage": 28.32, "elapsed_time": "4:51:12", "remaining_time": "12:16:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 491, "total_steps": 1730, "loss": 0.8106, "learning_rate": 4.485135820204948e-06, "epoch": 0.5672202166064982, "percentage": 28.38, "elapsed_time": "4:51:46", "remaining_time": "12:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 492, "total_steps": 1730, "loss": 0.7992, "learning_rate": 4.4866085046122675e-06, "epoch": 0.568375451263538, "percentage": 28.44, "elapsed_time": "4:52:19", "remaining_time": "12:15:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 493, "total_steps": 1730, "loss": 0.8227, "learning_rate": 4.488078198795384e-06, "epoch": 0.5695306859205777, "percentage": 28.5, "elapsed_time": "4:52:53", "remaining_time": "12:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 494, "total_steps": 1730, "loss": 0.8377, "learning_rate": 4.4895449148727455e-06, "epoch": 0.5706859205776174, "percentage": 28.55, "elapsed_time": "4:53:27", "remaining_time": "12:14:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 495, "total_steps": 1730, "loss": 0.789, "learning_rate": 4.491008664889282e-06, "epoch": 0.5718411552346571, "percentage": 28.61, "elapsed_time": "4:54:01", "remaining_time": "12:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 496, "total_steps": 1730, "loss": 0.8288, "learning_rate": 4.492469460816997e-06, "epoch": 0.5729963898916968, "percentage": 28.67, "elapsed_time": "4:54:35", "remaining_time": "12:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 497, "total_steps": 1730, "loss": 0.8194, "learning_rate": 4.493927314555554e-06, "epoch": 0.5741516245487365, "percentage": 28.73, "elapsed_time": "4:55:08", "remaining_time": "12:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 498, "total_steps": 1730, "loss": 0.8136, "learning_rate": 4.495382237932863e-06, "epoch": 0.5753068592057762, "percentage": 28.79, "elapsed_time": "4:55:42", "remaining_time": "12:11:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 499, "total_steps": 1730, "loss": 0.8239, "learning_rate": 4.496834242705651e-06, "epoch": 0.5764620938628159, "percentage": 28.84, "elapsed_time": "4:56:16", "remaining_time": "12:10:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 1730, "loss": 0.8234, "learning_rate": 4.498283340560032e-06, "epoch": 0.5776173285198556, "percentage": 28.9, "elapsed_time": "4:56:50", "remaining_time": "12:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 501, "total_steps": 1730, "loss": 0.8167, "learning_rate": 4.4997295431120764e-06, "epoch": 0.5787725631768953, "percentage": 28.96, "elapsed_time": "5:10:45", "remaining_time": "12:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 502, "total_steps": 1730, "loss": 0.8012, "learning_rate": 4.5011728619083665e-06, "epoch": 0.579927797833935, "percentage": 29.02, "elapsed_time": "5:11:18", "remaining_time": "12:41:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 503, "total_steps": 1730, "loss": 0.8248, "learning_rate": 4.502613308426546e-06, "epoch": 0.5810830324909747, "percentage": 29.08, "elapsed_time": "5:11:52", "remaining_time": "12:40:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 504, "total_steps": 1730, "loss": 0.8298, "learning_rate": 4.504050894075876e-06, "epoch": 0.5822382671480144, "percentage": 29.13, "elapsed_time": "5:12:26", "remaining_time": "12:40:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 505, "total_steps": 1730, "loss": 0.8228, "learning_rate": 4.5054856301977696e-06, "epoch": 0.5833935018050541, "percentage": 29.19, "elapsed_time": "5:13:00", "remaining_time": "12:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 506, "total_steps": 1730, "loss": 0.8222, "learning_rate": 4.506917528066332e-06, "epoch": 0.5845487364620938, "percentage": 29.25, "elapsed_time": "5:13:33", "remaining_time": "12:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 507, "total_steps": 1730, "loss": 0.8455, "learning_rate": 4.5083465988888945e-06, "epoch": 0.5857039711191335, "percentage": 29.31, "elapsed_time": "5:14:07", "remaining_time": "12:37:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 508, "total_steps": 1730, "loss": 0.8269, "learning_rate": 4.509772853806533e-06, "epoch": 0.5868592057761732, "percentage": 29.36, "elapsed_time": "5:14:42", "remaining_time": "12:37:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 509, "total_steps": 1730, "loss": 0.817, "learning_rate": 4.511196303894598e-06, "epoch": 0.588014440433213, "percentage": 29.42, "elapsed_time": "5:15:17", "remaining_time": "12:36:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 1730, "loss": 0.8352, "learning_rate": 4.512616960163228e-06, "epoch": 0.5891696750902528, "percentage": 29.48, "elapsed_time": "5:15:50", "remaining_time": "12:35:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 511, "total_steps": 1730, "loss": 0.8209, "learning_rate": 4.514034833557855e-06, "epoch": 0.5903249097472925, "percentage": 29.54, "elapsed_time": "5:16:24", "remaining_time": "12:34:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 512, "total_steps": 1730, "loss": 0.8199, "learning_rate": 4.515449934959719e-06, "epoch": 0.5914801444043322, "percentage": 29.6, "elapsed_time": "5:16:58", "remaining_time": "12:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 513, "total_steps": 1730, "loss": 0.8396, "learning_rate": 4.516862275186361e-06, "epoch": 0.5926353790613719, "percentage": 29.65, "elapsed_time": "5:17:32", "remaining_time": "12:33:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 514, "total_steps": 1730, "loss": 0.8314, "learning_rate": 4.518271864992127e-06, "epoch": 0.5937906137184116, "percentage": 29.71, "elapsed_time": "5:18:07", "remaining_time": "12:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 515, "total_steps": 1730, "loss": 0.8063, "learning_rate": 4.519678715068652e-06, "epoch": 0.5949458483754513, "percentage": 29.77, "elapsed_time": "5:18:40", "remaining_time": "12:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 516, "total_steps": 1730, "loss": 0.8279, "learning_rate": 4.521082836045353e-06, "epoch": 0.596101083032491, "percentage": 29.83, "elapsed_time": "5:19:14", "remaining_time": "12:31:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 517, "total_steps": 1730, "loss": 0.8217, "learning_rate": 4.5224842384899045e-06, "epoch": 0.5972563176895307, "percentage": 29.88, "elapsed_time": "5:19:48", "remaining_time": "12:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 518, "total_steps": 1730, "loss": 0.8465, "learning_rate": 4.523882932908722e-06, "epoch": 0.5984115523465704, "percentage": 29.94, "elapsed_time": "5:20:22", "remaining_time": "12:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 519, "total_steps": 1730, "loss": 0.8448, "learning_rate": 4.52527892974743e-06, "epoch": 0.5995667870036101, "percentage": 30.0, "elapsed_time": "5:20:55", "remaining_time": "12:28:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 1730, "loss": 0.8216, "learning_rate": 4.526672239391333e-06, "epoch": 0.6007220216606498, "percentage": 30.06, "elapsed_time": "5:21:29", "remaining_time": "12:28:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 521, "total_steps": 1730, "loss": 0.8007, "learning_rate": 4.528062872165875e-06, "epoch": 0.6018772563176895, "percentage": 30.12, "elapsed_time": "5:22:03", "remaining_time": "12:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 522, "total_steps": 1730, "loss": 0.8185, "learning_rate": 4.529450838337104e-06, "epoch": 0.6030324909747292, "percentage": 30.17, "elapsed_time": "5:22:37", "remaining_time": "12:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 523, "total_steps": 1730, "loss": 0.8377, "learning_rate": 4.5308361481121244e-06, "epoch": 0.6041877256317689, "percentage": 30.23, "elapsed_time": "5:23:10", "remaining_time": "12:25:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 524, "total_steps": 1730, "loss": 0.8197, "learning_rate": 4.532218811639545e-06, "epoch": 0.6053429602888086, "percentage": 30.29, "elapsed_time": "5:23:44", "remaining_time": "12:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 525, "total_steps": 1730, "loss": 0.8146, "learning_rate": 4.533598839009929e-06, "epoch": 0.6064981949458483, "percentage": 30.35, "elapsed_time": "5:24:23", "remaining_time": "12:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 526, "total_steps": 1730, "loss": 0.8324, "learning_rate": 4.5349762402562325e-06, "epoch": 0.607653429602888, "percentage": 30.4, "elapsed_time": "5:24:59", "remaining_time": "12:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 527, "total_steps": 1730, "loss": 0.8299, "learning_rate": 4.5363510253542444e-06, "epoch": 0.6088086642599277, "percentage": 30.46, "elapsed_time": "5:25:34", "remaining_time": "12:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 528, "total_steps": 1730, "loss": 0.8373, "learning_rate": 4.537723204223021e-06, "epoch": 0.6099638989169676, "percentage": 30.52, "elapsed_time": "5:26:08", "remaining_time": "12:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 529, "total_steps": 1730, "loss": 0.8064, "learning_rate": 4.53909278672531e-06, "epoch": 0.6111191335740073, "percentage": 30.58, "elapsed_time": "5:26:42", "remaining_time": "12:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 1730, "loss": 0.834, "learning_rate": 4.540459782667983e-06, "epoch": 0.612274368231047, "percentage": 30.64, "elapsed_time": "5:27:16", "remaining_time": "12:21:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 531, "total_steps": 1730, "loss": 0.8341, "learning_rate": 4.541824201802449e-06, "epoch": 0.6134296028880867, "percentage": 30.69, "elapsed_time": "5:27:50", "remaining_time": "12:20:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 532, "total_steps": 1730, "loss": 0.8356, "learning_rate": 4.543186053825081e-06, "epoch": 0.6145848375451264, "percentage": 30.75, "elapsed_time": "5:28:24", "remaining_time": "12:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 533, "total_steps": 1730, "loss": 0.8118, "learning_rate": 4.544545348377621e-06, "epoch": 0.6157400722021661, "percentage": 30.81, "elapsed_time": "5:28:59", "remaining_time": "12:18:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 534, "total_steps": 1730, "loss": 0.8397, "learning_rate": 4.545902095047594e-06, "epoch": 0.6168953068592058, "percentage": 30.87, "elapsed_time": "5:29:33", "remaining_time": "12:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 535, "total_steps": 1730, "loss": 0.8422, "learning_rate": 4.547256303368714e-06, "epoch": 0.6180505415162455, "percentage": 30.92, "elapsed_time": "5:30:06", "remaining_time": "12:17:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 536, "total_steps": 1730, "loss": 0.8224, "learning_rate": 4.5486079828212835e-06, "epoch": 0.6192057761732852, "percentage": 30.98, "elapsed_time": "5:30:41", "remaining_time": "12:16:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 537, "total_steps": 1730, "loss": 0.7988, "learning_rate": 4.549957142832593e-06, "epoch": 0.6203610108303249, "percentage": 31.04, "elapsed_time": "5:31:15", "remaining_time": "12:15:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 538, "total_steps": 1730, "loss": 0.8397, "learning_rate": 4.5513037927773155e-06, "epoch": 0.6215162454873646, "percentage": 31.1, "elapsed_time": "5:31:49", "remaining_time": "12:15:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 539, "total_steps": 1730, "loss": 0.8421, "learning_rate": 4.552647941977898e-06, "epoch": 0.6226714801444043, "percentage": 31.16, "elapsed_time": "5:32:23", "remaining_time": "12:14:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 1730, "loss": 0.8129, "learning_rate": 4.553989599704948e-06, "epoch": 0.623826714801444, "percentage": 31.21, "elapsed_time": "5:32:57", "remaining_time": "12:13:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 541, "total_steps": 1730, "loss": 0.8049, "learning_rate": 4.555328775177616e-06, "epoch": 0.6249819494584837, "percentage": 31.27, "elapsed_time": "5:33:31", "remaining_time": "12:12:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 542, "total_steps": 1730, "loss": 0.8255, "learning_rate": 4.556665477563979e-06, "epoch": 0.6261371841155234, "percentage": 31.33, "elapsed_time": "5:34:05", "remaining_time": "12:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 543, "total_steps": 1730, "loss": 0.8172, "learning_rate": 4.557999715981412e-06, "epoch": 0.6272924187725631, "percentage": 31.39, "elapsed_time": "5:34:39", "remaining_time": "12:11:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 544, "total_steps": 1730, "loss": 0.8336, "learning_rate": 4.559331499496967e-06, "epoch": 0.6284476534296028, "percentage": 31.45, "elapsed_time": "5:35:12", "remaining_time": "12:10:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 545, "total_steps": 1730, "loss": 0.7958, "learning_rate": 4.560660837127738e-06, "epoch": 0.6296028880866426, "percentage": 31.5, "elapsed_time": "5:35:46", "remaining_time": "12:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 546, "total_steps": 1730, "loss": 0.8313, "learning_rate": 4.5619877378412295e-06, "epoch": 0.6307581227436823, "percentage": 31.56, "elapsed_time": "5:36:20", "remaining_time": "12:09:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 547, "total_steps": 1730, "loss": 0.8257, "learning_rate": 4.563312210555719e-06, "epoch": 0.6319133574007221, "percentage": 31.62, "elapsed_time": "5:36:54", "remaining_time": "12:08:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 548, "total_steps": 1730, "loss": 0.8292, "learning_rate": 4.564634264140616e-06, "epoch": 0.6330685920577618, "percentage": 31.68, "elapsed_time": "5:37:28", "remaining_time": "12:07:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 549, "total_steps": 1730, "loss": 0.828, "learning_rate": 4.5659539074168204e-06, "epoch": 0.6342238267148015, "percentage": 31.73, "elapsed_time": "5:38:01", "remaining_time": "12:07:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 1730, "loss": 0.829, "learning_rate": 4.5672711491570735e-06, "epoch": 0.6353790613718412, "percentage": 31.79, "elapsed_time": "5:38:35", "remaining_time": "12:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 551, "total_steps": 1730, "loss": 0.8323, "learning_rate": 4.568585998086309e-06, "epoch": 0.6365342960288809, "percentage": 31.85, "elapsed_time": "5:39:09", "remaining_time": "12:05:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 552, "total_steps": 1730, "loss": 0.8424, "learning_rate": 4.569898462881998e-06, "epoch": 0.6376895306859206, "percentage": 31.91, "elapsed_time": "5:39:43", "remaining_time": "12:04:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 553, "total_steps": 1730, "loss": 0.8471, "learning_rate": 4.571208552174497e-06, "epoch": 0.6388447653429603, "percentage": 31.97, "elapsed_time": "5:40:17", "remaining_time": "12:04:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 554, "total_steps": 1730, "loss": 0.8277, "learning_rate": 4.572516274547383e-06, "epoch": 0.64, "percentage": 32.02, "elapsed_time": "5:40:50", "remaining_time": "12:03:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 555, "total_steps": 1730, "loss": 0.8458, "learning_rate": 4.573821638537794e-06, "epoch": 0.6411552346570397, "percentage": 32.08, "elapsed_time": "5:41:24", "remaining_time": "12:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 556, "total_steps": 1730, "loss": 0.8196, "learning_rate": 4.5751246526367635e-06, "epoch": 0.6423104693140794, "percentage": 32.14, "elapsed_time": "5:41:58", "remaining_time": "12:02:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 557, "total_steps": 1730, "loss": 0.8235, "learning_rate": 4.576425325289549e-06, "epoch": 0.6434657039711191, "percentage": 32.2, "elapsed_time": "5:42:32", "remaining_time": "12:01:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 558, "total_steps": 1730, "loss": 0.7819, "learning_rate": 4.577723664895965e-06, "epoch": 0.6446209386281588, "percentage": 32.25, "elapsed_time": "5:43:06", "remaining_time": "12:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 559, "total_steps": 1730, "loss": 0.8063, "learning_rate": 4.579019679810706e-06, "epoch": 0.6457761732851985, "percentage": 32.31, "elapsed_time": "5:43:40", "remaining_time": "11:59:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 1730, "loss": 0.8145, "learning_rate": 4.5803133783436676e-06, "epoch": 0.6469314079422382, "percentage": 32.37, "elapsed_time": "5:44:13", "remaining_time": "11:59:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 561, "total_steps": 1730, "loss": 0.7849, "learning_rate": 4.5816047687602695e-06, "epoch": 0.648086642599278, "percentage": 32.43, "elapsed_time": "5:44:47", "remaining_time": "11:58:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 562, "total_steps": 1730, "loss": 0.8262, "learning_rate": 4.582893859281769e-06, "epoch": 0.6492418772563177, "percentage": 32.49, "elapsed_time": "5:45:22", "remaining_time": "11:57:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 563, "total_steps": 1730, "loss": 0.8371, "learning_rate": 4.584180658085578e-06, "epoch": 0.6503971119133574, "percentage": 32.54, "elapsed_time": "5:45:56", "remaining_time": "11:57:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 564, "total_steps": 1730, "loss": 0.8258, "learning_rate": 4.585465173305571e-06, "epoch": 0.6515523465703971, "percentage": 32.6, "elapsed_time": "5:46:29", "remaining_time": "11:56:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 565, "total_steps": 1730, "loss": 0.8289, "learning_rate": 4.586747413032399e-06, "epoch": 0.6527075812274368, "percentage": 32.66, "elapsed_time": "5:47:03", "remaining_time": "11:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 566, "total_steps": 1730, "loss": 0.8208, "learning_rate": 4.588027385313786e-06, "epoch": 0.6538628158844766, "percentage": 32.72, "elapsed_time": "5:47:37", "remaining_time": "11:54:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 567, "total_steps": 1730, "loss": 0.8236, "learning_rate": 4.589305098154845e-06, "epoch": 0.6550180505415163, "percentage": 32.77, "elapsed_time": "5:48:12", "remaining_time": "11:54:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 568, "total_steps": 1730, "loss": 0.8397, "learning_rate": 4.5905805595183656e-06, "epoch": 0.656173285198556, "percentage": 32.83, "elapsed_time": "5:48:46", "remaining_time": "11:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 569, "total_steps": 1730, "loss": 0.8077, "learning_rate": 4.59185377732512e-06, "epoch": 0.6573285198555957, "percentage": 32.89, "elapsed_time": "5:49:19", "remaining_time": "11:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 570, "total_steps": 1730, "loss": 0.828, "learning_rate": 4.5931247594541535e-06, "epoch": 0.6584837545126354, "percentage": 32.95, "elapsed_time": "5:49:53", "remaining_time": "11:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 571, "total_steps": 1730, "loss": 0.8053, "learning_rate": 4.594393513743081e-06, "epoch": 0.6596389891696751, "percentage": 33.01, "elapsed_time": "5:50:27", "remaining_time": "11:51:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 572, "total_steps": 1730, "loss": 0.8308, "learning_rate": 4.595660047988374e-06, "epoch": 0.6607942238267148, "percentage": 33.06, "elapsed_time": "5:51:02", "remaining_time": "11:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 573, "total_steps": 1730, "loss": 0.8376, "learning_rate": 4.59692436994565e-06, "epoch": 0.6619494584837545, "percentage": 33.12, "elapsed_time": "5:51:36", "remaining_time": "11:49:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 574, "total_steps": 1730, "loss": 0.8343, "learning_rate": 4.598186487329957e-06, "epoch": 0.6631046931407942, "percentage": 33.18, "elapsed_time": "5:52:09", "remaining_time": "11:49:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 575, "total_steps": 1730, "loss": 0.8169, "learning_rate": 4.599446407816052e-06, "epoch": 0.6642599277978339, "percentage": 33.24, "elapsed_time": "5:52:43", "remaining_time": "11:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 576, "total_steps": 1730, "loss": 0.8414, "learning_rate": 4.600704139038687e-06, "epoch": 0.6654151624548736, "percentage": 33.29, "elapsed_time": "5:53:17", "remaining_time": "11:47:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 577, "total_steps": 1730, "loss": 0.8144, "learning_rate": 4.601959688592886e-06, "epoch": 0.6665703971119133, "percentage": 33.35, "elapsed_time": "5:53:51", "remaining_time": "11:47:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 578, "total_steps": 1730, "loss": 0.8086, "learning_rate": 4.603213064034216e-06, "epoch": 0.667725631768953, "percentage": 33.41, "elapsed_time": "5:54:25", "remaining_time": "11:46:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 579, "total_steps": 1730, "loss": 0.8266, "learning_rate": 4.6044642728790615e-06, "epoch": 0.6688808664259928, "percentage": 33.47, "elapsed_time": "5:54:58", "remaining_time": "11:45:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 580, "total_steps": 1730, "loss": 0.8365, "learning_rate": 4.605713322604896e-06, "epoch": 0.6700361010830325, "percentage": 33.53, "elapsed_time": "5:55:32", "remaining_time": "11:44:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 581, "total_steps": 1730, "loss": 0.8273, "learning_rate": 4.606960220650551e-06, "epoch": 0.6711913357400722, "percentage": 33.58, "elapsed_time": "5:56:06", "remaining_time": "11:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 582, "total_steps": 1730, "loss": 0.8169, "learning_rate": 4.608204974416482e-06, "epoch": 0.6723465703971119, "percentage": 33.64, "elapsed_time": "5:56:40", "remaining_time": "11:43:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 583, "total_steps": 1730, "loss": 0.8256, "learning_rate": 4.609447591265024e-06, "epoch": 0.6735018050541516, "percentage": 33.7, "elapsed_time": "5:57:14", "remaining_time": "11:42:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 584, "total_steps": 1730, "loss": 0.8546, "learning_rate": 4.610688078520667e-06, "epoch": 0.6746570397111913, "percentage": 33.76, "elapsed_time": "5:57:48", "remaining_time": "11:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 585, "total_steps": 1730, "loss": 0.829, "learning_rate": 4.611926443470302e-06, "epoch": 0.675812274368231, "percentage": 33.82, "elapsed_time": "5:58:22", "remaining_time": "11:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 586, "total_steps": 1730, "loss": 0.8206, "learning_rate": 4.613162693363485e-06, "epoch": 0.6769675090252708, "percentage": 33.87, "elapsed_time": "5:58:56", "remaining_time": "11:40:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 587, "total_steps": 1730, "loss": 0.8214, "learning_rate": 4.614396835412691e-06, "epoch": 0.6781227436823105, "percentage": 33.93, "elapsed_time": "5:59:30", "remaining_time": "11:40:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 588, "total_steps": 1730, "loss": 0.8128, "learning_rate": 4.6156288767935645e-06, "epoch": 0.6792779783393502, "percentage": 33.99, "elapsed_time": "6:00:04", "remaining_time": "11:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 589, "total_steps": 1730, "loss": 0.8269, "learning_rate": 4.61685882464517e-06, "epoch": 0.6804332129963899, "percentage": 34.05, "elapsed_time": "6:00:38", "remaining_time": "11:38:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 590, "total_steps": 1730, "loss": 0.817, "learning_rate": 4.61808668607024e-06, "epoch": 0.6815884476534296, "percentage": 34.1, "elapsed_time": "6:01:11", "remaining_time": "11:37:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 591, "total_steps": 1730, "loss": 0.8168, "learning_rate": 4.619312468135426e-06, "epoch": 0.6827436823104693, "percentage": 34.16, "elapsed_time": "6:01:46", "remaining_time": "11:37:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 592, "total_steps": 1730, "loss": 0.8208, "learning_rate": 4.620536177871534e-06, "epoch": 0.683898916967509, "percentage": 34.22, "elapsed_time": "6:02:19", "remaining_time": "11:36:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 593, "total_steps": 1730, "loss": 0.8032, "learning_rate": 4.621757822273772e-06, "epoch": 0.6850541516245487, "percentage": 34.28, "elapsed_time": "6:02:53", "remaining_time": "11:35:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 594, "total_steps": 1730, "loss": 0.8234, "learning_rate": 4.62297740830199e-06, "epoch": 0.6862093862815885, "percentage": 34.34, "elapsed_time": "6:03:27", "remaining_time": "11:35:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 595, "total_steps": 1730, "loss": 0.8205, "learning_rate": 4.624194942880917e-06, "epoch": 0.6873646209386282, "percentage": 34.39, "elapsed_time": "6:04:00", "remaining_time": "11:34:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 596, "total_steps": 1730, "loss": 0.8372, "learning_rate": 4.625410432900395e-06, "epoch": 0.6885198555956679, "percentage": 34.45, "elapsed_time": "6:04:34", "remaining_time": "11:33:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 597, "total_steps": 1730, "loss": 0.813, "learning_rate": 4.626623885215616e-06, "epoch": 0.6896750902527076, "percentage": 34.51, "elapsed_time": "6:05:09", "remaining_time": "11:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 598, "total_steps": 1730, "loss": 0.801, "learning_rate": 4.627835306647352e-06, "epoch": 0.6908303249097473, "percentage": 34.57, "elapsed_time": "6:05:43", "remaining_time": "11:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 599, "total_steps": 1730, "loss": 0.818, "learning_rate": 4.6290447039821865e-06, "epoch": 0.691985559566787, "percentage": 34.62, "elapsed_time": "6:06:17", "remaining_time": "11:31:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 1730, "loss": 0.8189, "learning_rate": 4.63025208397274e-06, "epoch": 0.6931407942238267, "percentage": 34.68, "elapsed_time": "6:06:52", "remaining_time": "11:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 601, "total_steps": 1730, "loss": 0.8217, "learning_rate": 4.631457453337899e-06, "epoch": 0.6942960288808664, "percentage": 34.74, "elapsed_time": "6:07:26", "remaining_time": "11:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 602, "total_steps": 1730, "loss": 0.8413, "learning_rate": 4.632660818763041e-06, "epoch": 0.6954512635379061, "percentage": 34.8, "elapsed_time": "6:08:00", "remaining_time": "11:29:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 603, "total_steps": 1730, "loss": 0.8437, "learning_rate": 4.633862186900253e-06, "epoch": 0.6966064981949458, "percentage": 34.86, "elapsed_time": "6:08:34", "remaining_time": "11:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 604, "total_steps": 1730, "loss": 0.8396, "learning_rate": 4.635061564368554e-06, "epoch": 0.6977617328519855, "percentage": 34.91, "elapsed_time": "6:09:08", "remaining_time": "11:28:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 605, "total_steps": 1730, "loss": 0.828, "learning_rate": 4.636258957754115e-06, "epoch": 0.6989169675090253, "percentage": 34.97, "elapsed_time": "6:09:41", "remaining_time": "11:27:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 606, "total_steps": 1730, "loss": 0.8403, "learning_rate": 4.6374543736104774e-06, "epoch": 0.700072202166065, "percentage": 35.03, "elapsed_time": "6:10:15", "remaining_time": "11:26:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 607, "total_steps": 1730, "loss": 0.8206, "learning_rate": 4.638647818458763e-06, "epoch": 0.7012274368231047, "percentage": 35.09, "elapsed_time": "6:10:49", "remaining_time": "11:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 608, "total_steps": 1730, "loss": 0.8203, "learning_rate": 4.639839298787892e-06, "epoch": 0.7023826714801444, "percentage": 35.14, "elapsed_time": "6:11:23", "remaining_time": "11:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 609, "total_steps": 1730, "loss": 0.8127, "learning_rate": 4.641028821054792e-06, "epoch": 0.7035379061371841, "percentage": 35.2, "elapsed_time": "6:11:56", "remaining_time": "11:24:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 610, "total_steps": 1730, "loss": 0.8218, "learning_rate": 4.642216391684613e-06, "epoch": 0.7046931407942238, "percentage": 35.26, "elapsed_time": "6:12:30", "remaining_time": "11:23:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 611, "total_steps": 1730, "loss": 0.7877, "learning_rate": 4.643402017070924e-06, "epoch": 0.7058483754512636, "percentage": 35.32, "elapsed_time": "6:13:04", "remaining_time": "11:23:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 612, "total_steps": 1730, "loss": 0.8062, "learning_rate": 4.644585703575936e-06, "epoch": 0.7070036101083033, "percentage": 35.38, "elapsed_time": "6:13:37", "remaining_time": "11:22:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 613, "total_steps": 1730, "loss": 0.8068, "learning_rate": 4.645767457530693e-06, "epoch": 0.708158844765343, "percentage": 35.43, "elapsed_time": "6:14:11", "remaining_time": "11:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 614, "total_steps": 1730, "loss": 0.8185, "learning_rate": 4.64694728523528e-06, "epoch": 0.7093140794223827, "percentage": 35.49, "elapsed_time": "6:14:48", "remaining_time": "11:21:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 615, "total_steps": 1730, "loss": 0.8305, "learning_rate": 4.648125192959028e-06, "epoch": 0.7104693140794224, "percentage": 35.55, "elapsed_time": "6:15:22", "remaining_time": "11:20:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 616, "total_steps": 1730, "loss": 0.8176, "learning_rate": 4.649301186940709e-06, "epoch": 0.7116245487364621, "percentage": 35.61, "elapsed_time": "6:15:56", "remaining_time": "11:19:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 617, "total_steps": 1730, "loss": 0.8011, "learning_rate": 4.650475273388737e-06, "epoch": 0.7127797833935018, "percentage": 35.66, "elapsed_time": "6:16:30", "remaining_time": "11:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 618, "total_steps": 1730, "loss": 0.8319, "learning_rate": 4.65164745848136e-06, "epoch": 0.7139350180505415, "percentage": 35.72, "elapsed_time": "6:17:04", "remaining_time": "11:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 619, "total_steps": 1730, "loss": 0.8394, "learning_rate": 4.652817748366864e-06, "epoch": 0.7150902527075812, "percentage": 35.78, "elapsed_time": "6:17:37", "remaining_time": "11:17:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 620, "total_steps": 1730, "loss": 0.825, "learning_rate": 4.653986149163757e-06, "epoch": 0.7162454873646209, "percentage": 35.84, "elapsed_time": "6:18:12", "remaining_time": "11:17:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 621, "total_steps": 1730, "loss": 0.7891, "learning_rate": 4.655152666960967e-06, "epoch": 0.7174007220216606, "percentage": 35.9, "elapsed_time": "6:18:45", "remaining_time": "11:16:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 622, "total_steps": 1730, "loss": 0.8105, "learning_rate": 4.656317307818032e-06, "epoch": 0.7185559566787003, "percentage": 35.95, "elapsed_time": "6:19:19", "remaining_time": "11:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 623, "total_steps": 1730, "loss": 0.8125, "learning_rate": 4.657480077765284e-06, "epoch": 0.71971119133574, "percentage": 36.01, "elapsed_time": "6:19:52", "remaining_time": "11:15:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 624, "total_steps": 1730, "loss": 0.8385, "learning_rate": 4.6586409828040405e-06, "epoch": 0.7208664259927798, "percentage": 36.07, "elapsed_time": "6:20:26", "remaining_time": "11:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 625, "total_steps": 1730, "loss": 0.8221, "learning_rate": 4.659800028906792e-06, "epoch": 0.7220216606498195, "percentage": 36.13, "elapsed_time": "6:21:00", "remaining_time": "11:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 626, "total_steps": 1730, "loss": 0.824, "learning_rate": 4.660957222017384e-06, "epoch": 0.7231768953068592, "percentage": 36.18, "elapsed_time": "6:21:33", "remaining_time": "11:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 627, "total_steps": 1730, "loss": 0.813, "learning_rate": 4.662112568051194e-06, "epoch": 0.724332129963899, "percentage": 36.24, "elapsed_time": "6:22:07", "remaining_time": "11:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 628, "total_steps": 1730, "loss": 0.8229, "learning_rate": 4.663266072895327e-06, "epoch": 0.7254873646209387, "percentage": 36.3, "elapsed_time": "6:22:41", "remaining_time": "11:11:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 629, "total_steps": 1730, "loss": 0.8201, "learning_rate": 4.664417742408782e-06, "epoch": 0.7266425992779784, "percentage": 36.36, "elapsed_time": "6:23:15", "remaining_time": "11:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 1730, "loss": 0.8048, "learning_rate": 4.6655675824226375e-06, "epoch": 0.7277978339350181, "percentage": 36.42, "elapsed_time": "6:23:49", "remaining_time": "11:10:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 631, "total_steps": 1730, "loss": 0.8145, "learning_rate": 4.666715598740224e-06, "epoch": 0.7289530685920578, "percentage": 36.47, "elapsed_time": "6:24:23", "remaining_time": "11:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 632, "total_steps": 1730, "loss": 0.8236, "learning_rate": 4.667861797137309e-06, "epoch": 0.7301083032490975, "percentage": 36.53, "elapsed_time": "6:24:57", "remaining_time": "11:08:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 633, "total_steps": 1730, "loss": 0.8416, "learning_rate": 4.669006183362259e-06, "epoch": 0.7312635379061372, "percentage": 36.59, "elapsed_time": "6:25:31", "remaining_time": "11:08:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 634, "total_steps": 1730, "loss": 0.8004, "learning_rate": 4.670148763136221e-06, "epoch": 0.7324187725631769, "percentage": 36.65, "elapsed_time": "6:26:04", "remaining_time": "11:07:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 635, "total_steps": 1730, "loss": 0.8249, "learning_rate": 4.6712895421532935e-06, "epoch": 0.7335740072202166, "percentage": 36.71, "elapsed_time": "6:26:39", "remaining_time": "11:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 636, "total_steps": 1730, "loss": 0.8346, "learning_rate": 4.672428526080691e-06, "epoch": 0.7347292418772563, "percentage": 36.76, "elapsed_time": "6:27:12", "remaining_time": "11:06:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 637, "total_steps": 1730, "loss": 0.8206, "learning_rate": 4.673565720558918e-06, "epoch": 0.735884476534296, "percentage": 36.82, "elapsed_time": "6:27:46", "remaining_time": "11:05:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 638, "total_steps": 1730, "loss": 0.8278, "learning_rate": 4.674701131201937e-06, "epoch": 0.7370397111913357, "percentage": 36.88, "elapsed_time": "6:28:19", "remaining_time": "11:04:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 639, "total_steps": 1730, "loss": 0.8051, "learning_rate": 4.675834763597334e-06, "epoch": 0.7381949458483754, "percentage": 36.94, "elapsed_time": "6:28:53", "remaining_time": "11:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 640, "total_steps": 1730, "loss": 0.8131, "learning_rate": 4.676966623306479e-06, "epoch": 0.7393501805054151, "percentage": 36.99, "elapsed_time": "6:29:28", "remaining_time": "11:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 641, "total_steps": 1730, "loss": 0.834, "learning_rate": 4.678096715864696e-06, "epoch": 0.7405054151624548, "percentage": 37.05, "elapsed_time": "6:30:01", "remaining_time": "11:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 642, "total_steps": 1730, "loss": 0.808, "learning_rate": 4.679225046781422e-06, "epoch": 0.7416606498194945, "percentage": 37.11, "elapsed_time": "6:30:35", "remaining_time": "11:01:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 643, "total_steps": 1730, "loss": 0.8236, "learning_rate": 4.6803516215403704e-06, "epoch": 0.7428158844765343, "percentage": 37.17, "elapsed_time": "6:31:09", "remaining_time": "11:01:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 644, "total_steps": 1730, "loss": 0.8343, "learning_rate": 4.6814764455996875e-06, "epoch": 0.743971119133574, "percentage": 37.23, "elapsed_time": "6:31:43", "remaining_time": "11:00:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 645, "total_steps": 1730, "loss": 0.8165, "learning_rate": 4.682599524392114e-06, "epoch": 0.7451263537906138, "percentage": 37.28, "elapsed_time": "6:32:17", "remaining_time": "10:59:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 646, "total_steps": 1730, "loss": 0.8284, "learning_rate": 4.683720863325141e-06, "epoch": 0.7462815884476535, "percentage": 37.34, "elapsed_time": "6:32:51", "remaining_time": "10:59:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 647, "total_steps": 1730, "loss": 0.8213, "learning_rate": 4.6848404677811685e-06, "epoch": 0.7474368231046932, "percentage": 37.4, "elapsed_time": "6:33:25", "remaining_time": "10:58:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 648, "total_steps": 1730, "loss": 0.8399, "learning_rate": 4.685958343117656e-06, "epoch": 0.7485920577617329, "percentage": 37.46, "elapsed_time": "6:33:58", "remaining_time": "10:57:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 649, "total_steps": 1730, "loss": 0.8254, "learning_rate": 4.687074494667283e-06, "epoch": 0.7497472924187726, "percentage": 37.51, "elapsed_time": "6:34:32", "remaining_time": "10:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 1730, "loss": 0.8283, "learning_rate": 4.688188927738093e-06, "epoch": 0.7509025270758123, "percentage": 37.57, "elapsed_time": "6:35:06", "remaining_time": "10:56:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 651, "total_steps": 1730, "loss": 0.8334, "learning_rate": 4.689301647613653e-06, "epoch": 0.752057761732852, "percentage": 37.63, "elapsed_time": "6:35:40", "remaining_time": "10:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 652, "total_steps": 1730, "loss": 0.8195, "learning_rate": 4.690412659553201e-06, "epoch": 0.7532129963898917, "percentage": 37.69, "elapsed_time": "6:36:14", "remaining_time": "10:55:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 653, "total_steps": 1730, "loss": 0.8164, "learning_rate": 4.69152196879179e-06, "epoch": 0.7543682310469314, "percentage": 37.75, "elapsed_time": "6:36:48", "remaining_time": "10:54:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 654, "total_steps": 1730, "loss": 0.8112, "learning_rate": 4.692629580540446e-06, "epoch": 0.7555234657039711, "percentage": 37.8, "elapsed_time": "6:37:21", "remaining_time": "10:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 655, "total_steps": 1730, "loss": 0.8228, "learning_rate": 4.693735499986305e-06, "epoch": 0.7566787003610108, "percentage": 37.86, "elapsed_time": "6:37:55", "remaining_time": "10:53:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 656, "total_steps": 1730, "loss": 0.8169, "learning_rate": 4.694839732292768e-06, "epoch": 0.7578339350180505, "percentage": 37.92, "elapsed_time": "6:38:29", "remaining_time": "10:52:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 657, "total_steps": 1730, "loss": 0.8274, "learning_rate": 4.695942282599635e-06, "epoch": 0.7589891696750902, "percentage": 37.98, "elapsed_time": "6:39:03", "remaining_time": "10:51:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 658, "total_steps": 1730, "loss": 0.8127, "learning_rate": 4.69704315602326e-06, "epoch": 0.7601444043321299, "percentage": 38.03, "elapsed_time": "6:39:37", "remaining_time": "10:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 659, "total_steps": 1730, "loss": 0.8053, "learning_rate": 4.698142357656684e-06, "epoch": 0.7612996389891696, "percentage": 38.09, "elapsed_time": "6:40:10", "remaining_time": "10:50:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 660, "total_steps": 1730, "loss": 0.8049, "learning_rate": 4.699239892569782e-06, "epoch": 0.7624548736462093, "percentage": 38.15, "elapsed_time": "6:40:44", "remaining_time": "10:49:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 661, "total_steps": 1730, "loss": 0.8098, "learning_rate": 4.700335765809401e-06, "epoch": 0.763610108303249, "percentage": 38.21, "elapsed_time": "6:41:18", "remaining_time": "10:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 662, "total_steps": 1730, "loss": 0.8203, "learning_rate": 4.701429982399501e-06, "epoch": 0.7647653429602889, "percentage": 38.27, "elapsed_time": "6:41:53", "remaining_time": "10:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 663, "total_steps": 1730, "loss": 0.8174, "learning_rate": 4.702522547341289e-06, "epoch": 0.7659205776173286, "percentage": 38.32, "elapsed_time": "6:42:27", "remaining_time": "10:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 664, "total_steps": 1730, "loss": 0.8111, "learning_rate": 4.703613465613363e-06, "epoch": 0.7670758122743683, "percentage": 38.38, "elapsed_time": "6:43:01", "remaining_time": "10:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 665, "total_steps": 1730, "loss": 0.7999, "learning_rate": 4.704702742171842e-06, "epoch": 0.768231046931408, "percentage": 38.44, "elapsed_time": "6:43:34", "remaining_time": "10:46:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 666, "total_steps": 1730, "loss": 0.8332, "learning_rate": 4.705790381950503e-06, "epoch": 0.7693862815884477, "percentage": 38.5, "elapsed_time": "6:44:08", "remaining_time": "10:45:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 667, "total_steps": 1730, "loss": 0.8179, "learning_rate": 4.706876389860915e-06, "epoch": 0.7705415162454874, "percentage": 38.55, "elapsed_time": "6:44:42", "remaining_time": "10:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 668, "total_steps": 1730, "loss": 0.7875, "learning_rate": 4.707960770792576e-06, "epoch": 0.7716967509025271, "percentage": 38.61, "elapsed_time": "6:45:15", "remaining_time": "10:44:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 669, "total_steps": 1730, "loss": 0.8029, "learning_rate": 4.709043529613039e-06, "epoch": 0.7728519855595668, "percentage": 38.67, "elapsed_time": "6:45:49", "remaining_time": "10:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 670, "total_steps": 1730, "loss": 0.8184, "learning_rate": 4.710124671168044e-06, "epoch": 0.7740072202166065, "percentage": 38.73, "elapsed_time": "6:46:24", "remaining_time": "10:42:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 671, "total_steps": 1730, "loss": 0.8192, "learning_rate": 4.7112042002816544e-06, "epoch": 0.7751624548736462, "percentage": 38.79, "elapsed_time": "6:46:58", "remaining_time": "10:42:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 672, "total_steps": 1730, "loss": 0.827, "learning_rate": 4.7122821217563755e-06, "epoch": 0.7763176895306859, "percentage": 38.84, "elapsed_time": "6:47:31", "remaining_time": "10:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 673, "total_steps": 1730, "loss": 0.8072, "learning_rate": 4.7133584403732955e-06, "epoch": 0.7774729241877256, "percentage": 38.9, "elapsed_time": "6:48:05", "remaining_time": "10:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 674, "total_steps": 1730, "loss": 0.8111, "learning_rate": 4.7144331608922e-06, "epoch": 0.7786281588447653, "percentage": 38.96, "elapsed_time": "6:48:39", "remaining_time": "10:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 675, "total_steps": 1730, "loss": 0.8077, "learning_rate": 4.715506288051709e-06, "epoch": 0.779783393501805, "percentage": 39.02, "elapsed_time": "6:49:13", "remaining_time": "10:39:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 676, "total_steps": 1730, "loss": 0.8429, "learning_rate": 4.716577826569394e-06, "epoch": 0.7809386281588447, "percentage": 39.08, "elapsed_time": "6:49:47", "remaining_time": "10:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 677, "total_steps": 1730, "loss": 0.8125, "learning_rate": 4.717647781141908e-06, "epoch": 0.7820938628158844, "percentage": 39.13, "elapsed_time": "6:50:22", "remaining_time": "10:38:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 678, "total_steps": 1730, "loss": 0.8131, "learning_rate": 4.7187161564451065e-06, "epoch": 0.7832490974729241, "percentage": 39.19, "elapsed_time": "6:50:56", "remaining_time": "10:37:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 679, "total_steps": 1730, "loss": 0.8292, "learning_rate": 4.71978295713417e-06, "epoch": 0.7844043321299639, "percentage": 39.25, "elapsed_time": "6:51:30", "remaining_time": "10:36:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 680, "total_steps": 1730, "loss": 0.8032, "learning_rate": 4.720848187843727e-06, "epoch": 0.7855595667870036, "percentage": 39.31, "elapsed_time": "6:52:04", "remaining_time": "10:36:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 681, "total_steps": 1730, "loss": 0.8287, "learning_rate": 4.721911853187975e-06, "epoch": 0.7867148014440434, "percentage": 39.36, "elapsed_time": "6:52:38", "remaining_time": "10:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 682, "total_steps": 1730, "loss": 0.8098, "learning_rate": 4.722973957760799e-06, "epoch": 0.7878700361010831, "percentage": 39.42, "elapsed_time": "6:53:12", "remaining_time": "10:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 683, "total_steps": 1730, "loss": 0.8303, "learning_rate": 4.724034506135888e-06, "epoch": 0.7890252707581228, "percentage": 39.48, "elapsed_time": "6:53:46", "remaining_time": "10:34:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 684, "total_steps": 1730, "loss": 0.7875, "learning_rate": 4.725093502866861e-06, "epoch": 0.7901805054151625, "percentage": 39.54, "elapsed_time": "6:54:21", "remaining_time": "10:33:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 685, "total_steps": 1730, "loss": 0.7986, "learning_rate": 4.7261509524873765e-06, "epoch": 0.7913357400722022, "percentage": 39.6, "elapsed_time": "6:54:54", "remaining_time": "10:32:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 686, "total_steps": 1730, "loss": 0.8168, "learning_rate": 4.727206859511253e-06, "epoch": 0.7924909747292419, "percentage": 39.65, "elapsed_time": "6:55:28", "remaining_time": "10:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 687, "total_steps": 1730, "loss": 0.8061, "learning_rate": 4.7282612284325845e-06, "epoch": 0.7936462093862816, "percentage": 39.71, "elapsed_time": "6:56:03", "remaining_time": "10:31:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 688, "total_steps": 1730, "loss": 0.8077, "learning_rate": 4.729314063725853e-06, "epoch": 0.7948014440433213, "percentage": 39.77, "elapsed_time": "6:56:37", "remaining_time": "10:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 689, "total_steps": 1730, "loss": 0.8161, "learning_rate": 4.730365369846044e-06, "epoch": 0.795956678700361, "percentage": 39.83, "elapsed_time": "6:57:10", "remaining_time": "10:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 690, "total_steps": 1730, "loss": 0.8042, "learning_rate": 4.73141515122876e-06, "epoch": 0.7971119133574007, "percentage": 39.88, "elapsed_time": "6:57:44", "remaining_time": "10:29:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 691, "total_steps": 1730, "loss": 0.7871, "learning_rate": 4.732463412290331e-06, "epoch": 0.7982671480144404, "percentage": 39.94, "elapsed_time": "6:58:17", "remaining_time": "10:28:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 692, "total_steps": 1730, "loss": 0.8163, "learning_rate": 4.73351015742793e-06, "epoch": 0.7994223826714801, "percentage": 40.0, "elapsed_time": "6:58:51", "remaining_time": "10:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 693, "total_steps": 1730, "loss": 0.8073, "learning_rate": 4.734555391019678e-06, "epoch": 0.8005776173285198, "percentage": 40.06, "elapsed_time": "6:59:25", "remaining_time": "10:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 694, "total_steps": 1730, "loss": 0.8186, "learning_rate": 4.735599117424759e-06, "epoch": 0.8017328519855595, "percentage": 40.12, "elapsed_time": "6:59:59", "remaining_time": "10:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 695, "total_steps": 1730, "loss": 0.8198, "learning_rate": 4.736641340983524e-06, "epoch": 0.8028880866425993, "percentage": 40.17, "elapsed_time": "7:00:33", "remaining_time": "10:26:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 696, "total_steps": 1730, "loss": 0.7954, "learning_rate": 4.737682066017604e-06, "epoch": 0.804043321299639, "percentage": 40.23, "elapsed_time": "7:01:07", "remaining_time": "10:25:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 697, "total_steps": 1730, "loss": 0.8197, "learning_rate": 4.738721296830016e-06, "epoch": 0.8051985559566787, "percentage": 40.29, "elapsed_time": "7:01:41", "remaining_time": "10:24:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 698, "total_steps": 1730, "loss": 0.8361, "learning_rate": 4.739759037705269e-06, "epoch": 0.8063537906137184, "percentage": 40.35, "elapsed_time": "7:02:14", "remaining_time": "10:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 699, "total_steps": 1730, "loss": 0.8055, "learning_rate": 4.740795292909469e-06, "epoch": 0.8075090252707581, "percentage": 40.4, "elapsed_time": "7:02:48", "remaining_time": "10:23:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 1730, "loss": 0.7907, "learning_rate": 4.741830066690428e-06, "epoch": 0.8086642599277978, "percentage": 40.46, "elapsed_time": "7:03:21", "remaining_time": "10:22:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 701, "total_steps": 1730, "loss": 0.8235, "learning_rate": 4.742863363277765e-06, "epoch": 0.8098194945848376, "percentage": 40.52, "elapsed_time": "7:03:55", "remaining_time": "10:22:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 702, "total_steps": 1730, "loss": 0.8076, "learning_rate": 4.743895186883009e-06, "epoch": 0.8109747292418773, "percentage": 40.58, "elapsed_time": "7:04:29", "remaining_time": "10:21:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 703, "total_steps": 1730, "loss": 0.8316, "learning_rate": 4.744925541699707e-06, "epoch": 0.812129963898917, "percentage": 40.64, "elapsed_time": "7:05:03", "remaining_time": "10:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 704, "total_steps": 1730, "loss": 0.8075, "learning_rate": 4.74595443190352e-06, "epoch": 0.8132851985559567, "percentage": 40.69, "elapsed_time": "7:05:37", "remaining_time": "10:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 705, "total_steps": 1730, "loss": 0.8421, "learning_rate": 4.746981861652332e-06, "epoch": 0.8144404332129964, "percentage": 40.75, "elapsed_time": "7:06:10", "remaining_time": "10:19:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 706, "total_steps": 1730, "loss": 0.8132, "learning_rate": 4.7480078350863404e-06, "epoch": 0.8155956678700361, "percentage": 40.81, "elapsed_time": "7:06:44", "remaining_time": "10:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 707, "total_steps": 1730, "loss": 0.8326, "learning_rate": 4.749032356328167e-06, "epoch": 0.8167509025270758, "percentage": 40.87, "elapsed_time": "7:07:18", "remaining_time": "10:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 708, "total_steps": 1730, "loss": 0.8118, "learning_rate": 4.750055429482949e-06, "epoch": 0.8179061371841155, "percentage": 40.92, "elapsed_time": "7:07:52", "remaining_time": "10:17:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 709, "total_steps": 1730, "loss": 0.816, "learning_rate": 4.751077058638445e-06, "epoch": 0.8190613718411552, "percentage": 40.98, "elapsed_time": "7:08:26", "remaining_time": "10:16:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 710, "total_steps": 1730, "loss": 0.8061, "learning_rate": 4.752097247865126e-06, "epoch": 0.8202166064981949, "percentage": 41.04, "elapsed_time": "7:09:00", "remaining_time": "10:16:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 711, "total_steps": 1730, "loss": 0.7946, "learning_rate": 4.753116001216277e-06, "epoch": 0.8213718411552346, "percentage": 41.1, "elapsed_time": "7:09:34", "remaining_time": "10:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 712, "total_steps": 1730, "loss": 0.8379, "learning_rate": 4.754133322728095e-06, "epoch": 0.8225270758122744, "percentage": 41.16, "elapsed_time": "7:10:08", "remaining_time": "10:15:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 713, "total_steps": 1730, "loss": 0.8101, "learning_rate": 4.755149216419776e-06, "epoch": 0.8236823104693141, "percentage": 41.21, "elapsed_time": "7:10:42", "remaining_time": "10:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 714, "total_steps": 1730, "loss": 0.8225, "learning_rate": 4.756163686293624e-06, "epoch": 0.8248375451263538, "percentage": 41.27, "elapsed_time": "7:11:16", "remaining_time": "10:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 715, "total_steps": 1730, "loss": 0.848, "learning_rate": 4.757176736335135e-06, "epoch": 0.8259927797833935, "percentage": 41.33, "elapsed_time": "7:11:50", "remaining_time": "10:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 716, "total_steps": 1730, "loss": 0.8426, "learning_rate": 4.758188370513093e-06, "epoch": 0.8271480144404332, "percentage": 41.39, "elapsed_time": "7:12:24", "remaining_time": "10:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 717, "total_steps": 1730, "loss": 0.8306, "learning_rate": 4.759198592779668e-06, "epoch": 0.8283032490974729, "percentage": 41.45, "elapsed_time": "7:12:57", "remaining_time": "10:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 718, "total_steps": 1730, "loss": 0.825, "learning_rate": 4.760207407070501e-06, "epoch": 0.8294584837545126, "percentage": 41.5, "elapsed_time": "7:13:32", "remaining_time": "10:11:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 719, "total_steps": 1730, "loss": 0.8071, "learning_rate": 4.761214817304805e-06, "epoch": 0.8306137184115523, "percentage": 41.56, "elapsed_time": "7:14:06", "remaining_time": "10:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 720, "total_steps": 1730, "loss": 0.8158, "learning_rate": 4.7622208273854484e-06, "epoch": 0.8317689530685921, "percentage": 41.62, "elapsed_time": "7:14:40", "remaining_time": "10:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 721, "total_steps": 1730, "loss": 0.8226, "learning_rate": 4.763225441199049e-06, "epoch": 0.8329241877256318, "percentage": 41.68, "elapsed_time": "7:15:14", "remaining_time": "10:09:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 722, "total_steps": 1730, "loss": 0.8025, "learning_rate": 4.764228662616066e-06, "epoch": 0.8340794223826715, "percentage": 41.73, "elapsed_time": "7:15:48", "remaining_time": "10:08:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 723, "total_steps": 1730, "loss": 0.842, "learning_rate": 4.765230495490885e-06, "epoch": 0.8352346570397112, "percentage": 41.79, "elapsed_time": "7:16:22", "remaining_time": "10:07:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 724, "total_steps": 1730, "loss": 0.8135, "learning_rate": 4.766230943661912e-06, "epoch": 0.8363898916967509, "percentage": 41.85, "elapsed_time": "7:16:56", "remaining_time": "10:07:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 725, "total_steps": 1730, "loss": 0.8087, "learning_rate": 4.767230010951657e-06, "epoch": 0.8375451263537906, "percentage": 41.91, "elapsed_time": "7:17:29", "remaining_time": "10:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 726, "total_steps": 1730, "loss": 0.8242, "learning_rate": 4.768227701166823e-06, "epoch": 0.8387003610108303, "percentage": 41.97, "elapsed_time": "7:18:04", "remaining_time": "10:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 727, "total_steps": 1730, "loss": 0.8418, "learning_rate": 4.769224018098397e-06, "epoch": 0.83985559566787, "percentage": 42.02, "elapsed_time": "7:18:38", "remaining_time": "10:05:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 728, "total_steps": 1730, "loss": 0.8013, "learning_rate": 4.770218965521729e-06, "epoch": 0.8410108303249098, "percentage": 42.08, "elapsed_time": "7:19:12", "remaining_time": "10:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 729, "total_steps": 1730, "loss": 0.7984, "learning_rate": 4.771212547196624e-06, "epoch": 0.8421660649819495, "percentage": 42.14, "elapsed_time": "7:19:46", "remaining_time": "10:03:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 730, "total_steps": 1730, "loss": 0.809, "learning_rate": 4.772204766867427e-06, "epoch": 0.8433212996389892, "percentage": 42.2, "elapsed_time": "7:20:20", "remaining_time": "10:03:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 731, "total_steps": 1730, "loss": 0.8186, "learning_rate": 4.773195628263101e-06, "epoch": 0.8444765342960289, "percentage": 42.25, "elapsed_time": "7:20:54", "remaining_time": "10:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 732, "total_steps": 1730, "loss": 0.8111, "learning_rate": 4.77418513509732e-06, "epoch": 0.8456317689530686, "percentage": 42.31, "elapsed_time": "7:21:28", "remaining_time": "10:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 733, "total_steps": 1730, "loss": 0.8218, "learning_rate": 4.775173291068547e-06, "epoch": 0.8467870036101083, "percentage": 42.37, "elapsed_time": "7:22:02", "remaining_time": "10:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 734, "total_steps": 1730, "loss": 0.8107, "learning_rate": 4.776160099860117e-06, "epoch": 0.847942238267148, "percentage": 42.43, "elapsed_time": "7:22:37", "remaining_time": "10:00:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 735, "total_steps": 1730, "loss": 0.8088, "learning_rate": 4.777145565140325e-06, "epoch": 0.8490974729241877, "percentage": 42.49, "elapsed_time": "7:23:11", "remaining_time": "9:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 736, "total_steps": 1730, "loss": 0.7977, "learning_rate": 4.778129690562499e-06, "epoch": 0.8502527075812274, "percentage": 42.54, "elapsed_time": "7:23:45", "remaining_time": "9:59:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 737, "total_steps": 1730, "loss": 0.8105, "learning_rate": 4.7791124797650865e-06, "epoch": 0.8514079422382671, "percentage": 42.6, "elapsed_time": "7:24:19", "remaining_time": "9:58:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 738, "total_steps": 1730, "loss": 0.825, "learning_rate": 4.780093936371737e-06, "epoch": 0.8525631768953068, "percentage": 42.66, "elapsed_time": "7:24:54", "remaining_time": "9:58:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 739, "total_steps": 1730, "loss": 0.8088, "learning_rate": 4.781074063991377e-06, "epoch": 0.8537184115523466, "percentage": 42.72, "elapsed_time": "7:25:27", "remaining_time": "9:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 740, "total_steps": 1730, "loss": 0.7909, "learning_rate": 4.782052866218294e-06, "epoch": 0.8548736462093863, "percentage": 42.77, "elapsed_time": "7:26:01", "remaining_time": "9:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 741, "total_steps": 1730, "loss": 0.8036, "learning_rate": 4.783030346632214e-06, "epoch": 0.856028880866426, "percentage": 42.83, "elapsed_time": "7:26:35", "remaining_time": "9:56:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 742, "total_steps": 1730, "loss": 0.8118, "learning_rate": 4.784006508798379e-06, "epoch": 0.8571841155234657, "percentage": 42.89, "elapsed_time": "7:27:09", "remaining_time": "9:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 743, "total_steps": 1730, "loss": 0.8319, "learning_rate": 4.7849813562676265e-06, "epoch": 0.8583393501805054, "percentage": 42.95, "elapsed_time": "7:27:42", "remaining_time": "9:54:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 744, "total_steps": 1730, "loss": 0.8153, "learning_rate": 4.785954892576465e-06, "epoch": 0.8594945848375452, "percentage": 43.01, "elapsed_time": "7:28:16", "remaining_time": "9:54:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 745, "total_steps": 1730, "loss": 0.8164, "learning_rate": 4.786927121247155e-06, "epoch": 0.8606498194945849, "percentage": 43.06, "elapsed_time": "7:28:49", "remaining_time": "9:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 746, "total_steps": 1730, "loss": 0.7877, "learning_rate": 4.787898045787781e-06, "epoch": 0.8618050541516246, "percentage": 43.12, "elapsed_time": "7:29:23", "remaining_time": "9:52:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 747, "total_steps": 1730, "loss": 0.8096, "learning_rate": 4.788867669692332e-06, "epoch": 0.8629602888086643, "percentage": 43.18, "elapsed_time": "7:29:58", "remaining_time": "9:52:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 748, "total_steps": 1730, "loss": 0.791, "learning_rate": 4.78983599644077e-06, "epoch": 0.864115523465704, "percentage": 43.24, "elapsed_time": "7:30:31", "remaining_time": "9:51:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 749, "total_steps": 1730, "loss": 0.7906, "learning_rate": 4.790803029499111e-06, "epoch": 0.8652707581227437, "percentage": 43.29, "elapsed_time": "7:31:04", "remaining_time": "9:50:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 1730, "loss": 0.7749, "learning_rate": 4.7917687723195e-06, "epoch": 0.8664259927797834, "percentage": 43.35, "elapsed_time": "7:31:38", "remaining_time": "9:50:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 751, "total_steps": 1730, "loss": 0.7991, "learning_rate": 4.792733228340281e-06, "epoch": 0.8675812274368231, "percentage": 43.41, "elapsed_time": "7:45:04", "remaining_time": "10:06:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 752, "total_steps": 1730, "loss": 0.7999, "learning_rate": 4.793696400986071e-06, "epoch": 0.8687364620938628, "percentage": 43.47, "elapsed_time": "7:45:38", "remaining_time": "10:05:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 753, "total_steps": 1730, "loss": 0.8337, "learning_rate": 4.794658293667835e-06, "epoch": 0.8698916967509025, "percentage": 43.53, "elapsed_time": "7:46:11", "remaining_time": "10:04:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 754, "total_steps": 1730, "loss": 0.8128, "learning_rate": 4.795618909782958e-06, "epoch": 0.8710469314079422, "percentage": 43.58, "elapsed_time": "7:46:45", "remaining_time": "10:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 755, "total_steps": 1730, "loss": 0.8088, "learning_rate": 4.7965782527153145e-06, "epoch": 0.8722021660649819, "percentage": 43.64, "elapsed_time": "7:47:18", "remaining_time": "10:03:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 756, "total_steps": 1730, "loss": 0.8195, "learning_rate": 4.797536325835345e-06, "epoch": 0.8733574007220216, "percentage": 43.7, "elapsed_time": "7:47:53", "remaining_time": "10:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 757, "total_steps": 1730, "loss": 0.8067, "learning_rate": 4.798493132500121e-06, "epoch": 0.8745126353790613, "percentage": 43.76, "elapsed_time": "7:48:27", "remaining_time": "10:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 758, "total_steps": 1730, "loss": 0.8032, "learning_rate": 4.799448676053423e-06, "epoch": 0.8756678700361011, "percentage": 43.82, "elapsed_time": "7:49:01", "remaining_time": "10:01:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 759, "total_steps": 1730, "loss": 0.8369, "learning_rate": 4.800402959825802e-06, "epoch": 0.8768231046931408, "percentage": 43.87, "elapsed_time": "7:49:34", "remaining_time": "10:00:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 760, "total_steps": 1730, "loss": 0.8112, "learning_rate": 4.801355987134653e-06, "epoch": 0.8779783393501805, "percentage": 43.93, "elapsed_time": "7:50:09", "remaining_time": "10:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 761, "total_steps": 1730, "loss": 0.819, "learning_rate": 4.802307761284289e-06, "epoch": 0.8791335740072203, "percentage": 43.99, "elapsed_time": "7:50:42", "remaining_time": "9:59:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 762, "total_steps": 1730, "loss": 0.8149, "learning_rate": 4.803258285566001e-06, "epoch": 0.88028880866426, "percentage": 44.05, "elapsed_time": "7:51:16", "remaining_time": "9:58:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 763, "total_steps": 1730, "loss": 0.8095, "learning_rate": 4.804207563258135e-06, "epoch": 0.8814440433212997, "percentage": 44.1, "elapsed_time": "7:51:50", "remaining_time": "9:57:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 764, "total_steps": 1730, "loss": 0.8188, "learning_rate": 4.80515559762615e-06, "epoch": 0.8825992779783394, "percentage": 44.16, "elapsed_time": "7:52:23", "remaining_time": "9:57:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 765, "total_steps": 1730, "loss": 0.8248, "learning_rate": 4.806102391922697e-06, "epoch": 0.8837545126353791, "percentage": 44.22, "elapsed_time": "7:52:57", "remaining_time": "9:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 766, "total_steps": 1730, "loss": 0.8083, "learning_rate": 4.8070479493876735e-06, "epoch": 0.8849097472924188, "percentage": 44.28, "elapsed_time": "7:53:31", "remaining_time": "9:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 767, "total_steps": 1730, "loss": 0.8104, "learning_rate": 4.8079922732483016e-06, "epoch": 0.8860649819494585, "percentage": 44.34, "elapsed_time": "7:54:04", "remaining_time": "9:55:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 768, "total_steps": 1730, "loss": 0.8083, "learning_rate": 4.808935366719187e-06, "epoch": 0.8872202166064982, "percentage": 44.39, "elapsed_time": "7:54:38", "remaining_time": "9:54:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 769, "total_steps": 1730, "loss": 0.8181, "learning_rate": 4.8098772330023855e-06, "epoch": 0.8883754512635379, "percentage": 44.45, "elapsed_time": "7:55:11", "remaining_time": "9:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 1730, "loss": 0.8166, "learning_rate": 4.81081787528747e-06, "epoch": 0.8895306859205776, "percentage": 44.51, "elapsed_time": "7:55:46", "remaining_time": "9:53:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 771, "total_steps": 1730, "loss": 0.8061, "learning_rate": 4.8117572967515955e-06, "epoch": 0.8906859205776173, "percentage": 44.57, "elapsed_time": "7:56:19", "remaining_time": "9:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 772, "total_steps": 1730, "loss": 0.796, "learning_rate": 4.812695500559561e-06, "epoch": 0.891841155234657, "percentage": 44.62, "elapsed_time": "7:56:53", "remaining_time": "9:51:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 773, "total_steps": 1730, "loss": 0.8269, "learning_rate": 4.813632489863876e-06, "epoch": 0.8929963898916967, "percentage": 44.68, "elapsed_time": "7:57:27", "remaining_time": "9:51:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 774, "total_steps": 1730, "loss": 0.8166, "learning_rate": 4.814568267804822e-06, "epoch": 0.8941516245487364, "percentage": 44.74, "elapsed_time": "7:58:02", "remaining_time": "9:50:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 775, "total_steps": 1730, "loss": 0.8006, "learning_rate": 4.815502837510518e-06, "epoch": 0.8953068592057761, "percentage": 44.8, "elapsed_time": "7:58:36", "remaining_time": "9:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 776, "total_steps": 1730, "loss": 0.7987, "learning_rate": 4.816436202096981e-06, "epoch": 0.8964620938628158, "percentage": 44.86, "elapsed_time": "7:59:13", "remaining_time": "9:49:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 777, "total_steps": 1730, "loss": 0.8148, "learning_rate": 4.817368364668191e-06, "epoch": 0.8976173285198557, "percentage": 44.91, "elapsed_time": "7:59:50", "remaining_time": "9:48:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 778, "total_steps": 1730, "loss": 0.833, "learning_rate": 4.8182993283161485e-06, "epoch": 0.8987725631768954, "percentage": 44.97, "elapsed_time": "8:00:23", "remaining_time": "9:47:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 779, "total_steps": 1730, "loss": 0.8245, "learning_rate": 4.819229096120941e-06, "epoch": 0.8999277978339351, "percentage": 45.03, "elapsed_time": "8:00:57", "remaining_time": "9:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 780, "total_steps": 1730, "loss": 0.826, "learning_rate": 4.820157671150801e-06, "epoch": 0.9010830324909748, "percentage": 45.09, "elapsed_time": "8:01:32", "remaining_time": "9:46:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 781, "total_steps": 1730, "loss": 0.8322, "learning_rate": 4.821085056462168e-06, "epoch": 0.9022382671480145, "percentage": 45.14, "elapsed_time": "8:02:06", "remaining_time": "9:45:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 782, "total_steps": 1730, "loss": 0.8305, "learning_rate": 4.822011255099747e-06, "epoch": 0.9033935018050542, "percentage": 45.2, "elapsed_time": "8:02:39", "remaining_time": "9:45:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 783, "total_steps": 1730, "loss": 0.8119, "learning_rate": 4.8229362700965724e-06, "epoch": 0.9045487364620939, "percentage": 45.26, "elapsed_time": "8:03:13", "remaining_time": "9:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 784, "total_steps": 1730, "loss": 0.8334, "learning_rate": 4.823860104474065e-06, "epoch": 0.9057039711191336, "percentage": 45.32, "elapsed_time": "8:03:47", "remaining_time": "9:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 785, "total_steps": 1730, "loss": 0.8148, "learning_rate": 4.8247827612420875e-06, "epoch": 0.9068592057761733, "percentage": 45.38, "elapsed_time": "8:04:21", "remaining_time": "9:43:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 786, "total_steps": 1730, "loss": 0.8228, "learning_rate": 4.825704243399014e-06, "epoch": 0.908014440433213, "percentage": 45.43, "elapsed_time": "8:04:55", "remaining_time": "9:42:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 787, "total_steps": 1730, "loss": 0.8027, "learning_rate": 4.8266245539317745e-06, "epoch": 0.9091696750902527, "percentage": 45.49, "elapsed_time": "8:05:29", "remaining_time": "9:41:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 788, "total_steps": 1730, "loss": 0.796, "learning_rate": 4.827543695815926e-06, "epoch": 0.9103249097472924, "percentage": 45.55, "elapsed_time": "8:06:03", "remaining_time": "9:41:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 789, "total_steps": 1730, "loss": 0.8125, "learning_rate": 4.828461672015701e-06, "epoch": 0.9114801444043321, "percentage": 45.61, "elapsed_time": "8:06:37", "remaining_time": "9:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 790, "total_steps": 1730, "loss": 0.7954, "learning_rate": 4.82937848548407e-06, "epoch": 0.9126353790613718, "percentage": 45.66, "elapsed_time": "8:07:11", "remaining_time": "9:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 791, "total_steps": 1730, "loss": 0.8045, "learning_rate": 4.830294139162795e-06, "epoch": 0.9137906137184115, "percentage": 45.72, "elapsed_time": "8:07:45", "remaining_time": "9:39:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 792, "total_steps": 1730, "loss": 0.8072, "learning_rate": 4.83120863598249e-06, "epoch": 0.9149458483754512, "percentage": 45.78, "elapsed_time": "8:08:18", "remaining_time": "9:38:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 793, "total_steps": 1730, "loss": 0.7935, "learning_rate": 4.832121978862673e-06, "epoch": 0.9161010830324909, "percentage": 45.84, "elapsed_time": "8:08:52", "remaining_time": "9:37:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 794, "total_steps": 1730, "loss": 0.7944, "learning_rate": 4.833034170711828e-06, "epoch": 0.9172563176895306, "percentage": 45.9, "elapsed_time": "8:09:25", "remaining_time": "9:36:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 795, "total_steps": 1730, "loss": 0.8029, "learning_rate": 4.833945214427451e-06, "epoch": 0.9184115523465703, "percentage": 45.95, "elapsed_time": "8:10:00", "remaining_time": "9:36:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 796, "total_steps": 1730, "loss": 0.8342, "learning_rate": 4.834855112896116e-06, "epoch": 0.91956678700361, "percentage": 46.01, "elapsed_time": "8:10:34", "remaining_time": "9:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 797, "total_steps": 1730, "loss": 0.7986, "learning_rate": 4.835763868993521e-06, "epoch": 0.9207220216606499, "percentage": 46.07, "elapsed_time": "8:11:08", "remaining_time": "9:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 798, "total_steps": 1730, "loss": 0.8021, "learning_rate": 4.83667148558455e-06, "epoch": 0.9218772563176896, "percentage": 46.13, "elapsed_time": "8:11:41", "remaining_time": "9:34:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 799, "total_steps": 1730, "loss": 0.8305, "learning_rate": 4.8375779655233195e-06, "epoch": 0.9230324909747293, "percentage": 46.18, "elapsed_time": "8:12:15", "remaining_time": "9:33:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 1730, "loss": 0.8141, "learning_rate": 4.83848331165324e-06, "epoch": 0.924187725631769, "percentage": 46.24, "elapsed_time": "8:12:49", "remaining_time": "9:32:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 801, "total_steps": 1730, "loss": 0.809, "learning_rate": 4.839387526807064e-06, "epoch": 0.9253429602888087, "percentage": 46.3, "elapsed_time": "8:13:22", "remaining_time": "9:32:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 802, "total_steps": 1730, "loss": 0.8075, "learning_rate": 4.84029061380694e-06, "epoch": 0.9264981949458484, "percentage": 46.36, "elapsed_time": "8:13:56", "remaining_time": "9:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 803, "total_steps": 1730, "loss": 0.8116, "learning_rate": 4.841192575464469e-06, "epoch": 0.9276534296028881, "percentage": 46.42, "elapsed_time": "8:14:30", "remaining_time": "9:30:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 804, "total_steps": 1730, "loss": 0.8085, "learning_rate": 4.842093414580753e-06, "epoch": 0.9288086642599278, "percentage": 46.47, "elapsed_time": "8:15:04", "remaining_time": "9:30:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 805, "total_steps": 1730, "loss": 0.8202, "learning_rate": 4.842993133946448e-06, "epoch": 0.9299638989169675, "percentage": 46.53, "elapsed_time": "8:15:38", "remaining_time": "9:29:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 806, "total_steps": 1730, "loss": 0.8222, "learning_rate": 4.8438917363418184e-06, "epoch": 0.9311191335740072, "percentage": 46.59, "elapsed_time": "8:16:12", "remaining_time": "9:28:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 807, "total_steps": 1730, "loss": 0.8009, "learning_rate": 4.844789224536785e-06, "epoch": 0.9322743682310469, "percentage": 46.65, "elapsed_time": "8:16:46", "remaining_time": "9:28:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 808, "total_steps": 1730, "loss": 0.8129, "learning_rate": 4.845685601290977e-06, "epoch": 0.9334296028880866, "percentage": 46.71, "elapsed_time": "8:17:20", "remaining_time": "9:27:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 809, "total_steps": 1730, "loss": 0.8084, "learning_rate": 4.846580869353787e-06, "epoch": 0.9345848375451263, "percentage": 46.76, "elapsed_time": "8:17:53", "remaining_time": "9:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 810, "total_steps": 1730, "loss": 0.8058, "learning_rate": 4.847475031464417e-06, "epoch": 0.935740072202166, "percentage": 46.82, "elapsed_time": "8:18:27", "remaining_time": "9:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 811, "total_steps": 1730, "loss": 0.8, "learning_rate": 4.848368090351928e-06, "epoch": 0.9368953068592057, "percentage": 46.88, "elapsed_time": "8:19:01", "remaining_time": "9:25:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 812, "total_steps": 1730, "loss": 0.8071, "learning_rate": 4.849260048735293e-06, "epoch": 0.9380505415162455, "percentage": 46.94, "elapsed_time": "8:19:36", "remaining_time": "9:24:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 813, "total_steps": 1730, "loss": 0.8173, "learning_rate": 4.8501509093234474e-06, "epoch": 0.9392057761732852, "percentage": 46.99, "elapsed_time": "8:20:10", "remaining_time": "9:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 814, "total_steps": 1730, "loss": 0.8057, "learning_rate": 4.851040674815336e-06, "epoch": 0.9403610108303249, "percentage": 47.05, "elapsed_time": "8:20:44", "remaining_time": "9:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 815, "total_steps": 1730, "loss": 0.7952, "learning_rate": 4.851929347899962e-06, "epoch": 0.9415162454873646, "percentage": 47.11, "elapsed_time": "8:21:17", "remaining_time": "9:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 816, "total_steps": 1730, "loss": 0.815, "learning_rate": 4.852816931256436e-06, "epoch": 0.9426714801444044, "percentage": 47.17, "elapsed_time": "8:21:51", "remaining_time": "9:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 817, "total_steps": 1730, "loss": 0.8169, "learning_rate": 4.853703427554027e-06, "epoch": 0.9438267148014441, "percentage": 47.23, "elapsed_time": "8:22:25", "remaining_time": "9:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 818, "total_steps": 1730, "loss": 0.8134, "learning_rate": 4.854588839452205e-06, "epoch": 0.9449819494584838, "percentage": 47.28, "elapsed_time": "8:22:59", "remaining_time": "9:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 819, "total_steps": 1730, "loss": 0.8198, "learning_rate": 4.855473169600699e-06, "epoch": 0.9461371841155235, "percentage": 47.34, "elapsed_time": "8:23:32", "remaining_time": "9:20:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 820, "total_steps": 1730, "loss": 0.8426, "learning_rate": 4.856356420639528e-06, "epoch": 0.9472924187725632, "percentage": 47.4, "elapsed_time": "8:24:06", "remaining_time": "9:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 821, "total_steps": 1730, "loss": 0.8025, "learning_rate": 4.857238595199068e-06, "epoch": 0.9484476534296029, "percentage": 47.46, "elapsed_time": "8:24:40", "remaining_time": "9:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 822, "total_steps": 1730, "loss": 0.8267, "learning_rate": 4.858119695900084e-06, "epoch": 0.9496028880866426, "percentage": 47.51, "elapsed_time": "8:25:14", "remaining_time": "9:18:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 823, "total_steps": 1730, "loss": 0.7936, "learning_rate": 4.858999725353784e-06, "epoch": 0.9507581227436823, "percentage": 47.57, "elapsed_time": "8:25:48", "remaining_time": "9:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 824, "total_steps": 1730, "loss": 0.8245, "learning_rate": 4.859878686161861e-06, "epoch": 0.951913357400722, "percentage": 47.63, "elapsed_time": "8:26:23", "remaining_time": "9:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 825, "total_steps": 1730, "loss": 0.8036, "learning_rate": 4.860756580916543e-06, "epoch": 0.9530685920577617, "percentage": 47.69, "elapsed_time": "8:26:56", "remaining_time": "9:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 826, "total_steps": 1730, "loss": 0.8132, "learning_rate": 4.861633412200637e-06, "epoch": 0.9542238267148014, "percentage": 47.75, "elapsed_time": "8:27:30", "remaining_time": "9:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 827, "total_steps": 1730, "loss": 0.8189, "learning_rate": 4.862509182587578e-06, "epoch": 0.9553790613718411, "percentage": 47.8, "elapsed_time": "8:28:04", "remaining_time": "9:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 828, "total_steps": 1730, "loss": 0.8056, "learning_rate": 4.8633838946414675e-06, "epoch": 0.9565342960288808, "percentage": 47.86, "elapsed_time": "8:28:38", "remaining_time": "9:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 829, "total_steps": 1730, "loss": 0.8108, "learning_rate": 4.864257550917123e-06, "epoch": 0.9576895306859206, "percentage": 47.92, "elapsed_time": "8:29:12", "remaining_time": "9:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 830, "total_steps": 1730, "loss": 0.8031, "learning_rate": 4.8651301539601235e-06, "epoch": 0.9588447653429603, "percentage": 47.98, "elapsed_time": "8:29:46", "remaining_time": "9:12:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 831, "total_steps": 1730, "loss": 0.8199, "learning_rate": 4.866001706306853e-06, "epoch": 0.96, "percentage": 48.03, "elapsed_time": "8:30:20", "remaining_time": "9:12:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 832, "total_steps": 1730, "loss": 0.8175, "learning_rate": 4.866872210484541e-06, "epoch": 0.9611552346570397, "percentage": 48.09, "elapsed_time": "8:30:53", "remaining_time": "9:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 833, "total_steps": 1730, "loss": 0.7998, "learning_rate": 4.867741669011313e-06, "epoch": 0.9623104693140794, "percentage": 48.15, "elapsed_time": "8:31:27", "remaining_time": "9:10:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 834, "total_steps": 1730, "loss": 0.7809, "learning_rate": 4.868610084396232e-06, "epoch": 0.9634657039711191, "percentage": 48.21, "elapsed_time": "8:32:01", "remaining_time": "9:10:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 835, "total_steps": 1730, "loss": 0.8219, "learning_rate": 4.869477459139337e-06, "epoch": 0.9646209386281589, "percentage": 48.27, "elapsed_time": "8:32:36", "remaining_time": "9:09:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 836, "total_steps": 1730, "loss": 0.807, "learning_rate": 4.8703437957316945e-06, "epoch": 0.9657761732851986, "percentage": 48.32, "elapsed_time": "8:33:09", "remaining_time": "9:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 837, "total_steps": 1730, "loss": 0.8213, "learning_rate": 4.871209096655434e-06, "epoch": 0.9669314079422383, "percentage": 48.38, "elapsed_time": "8:33:43", "remaining_time": "9:08:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 838, "total_steps": 1730, "loss": 0.8167, "learning_rate": 4.872073364383795e-06, "epoch": 0.968086642599278, "percentage": 48.44, "elapsed_time": "8:34:17", "remaining_time": "9:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 839, "total_steps": 1730, "loss": 0.7926, "learning_rate": 4.872936601381167e-06, "epoch": 0.9692418772563177, "percentage": 48.5, "elapsed_time": "8:34:51", "remaining_time": "9:06:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 1730, "loss": 0.769, "learning_rate": 4.873798810103137e-06, "epoch": 0.9703971119133574, "percentage": 48.55, "elapsed_time": "8:35:25", "remaining_time": "9:06:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 841, "total_steps": 1730, "loss": 0.8033, "learning_rate": 4.874659992996521e-06, "epoch": 0.9715523465703971, "percentage": 48.61, "elapsed_time": "8:35:59", "remaining_time": "9:05:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 842, "total_steps": 1730, "loss": 0.7991, "learning_rate": 4.875520152499416e-06, "epoch": 0.9727075812274368, "percentage": 48.67, "elapsed_time": "8:36:33", "remaining_time": "9:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 843, "total_steps": 1730, "loss": 0.811, "learning_rate": 4.876379291041238e-06, "epoch": 0.9738628158844765, "percentage": 48.73, "elapsed_time": "8:37:06", "remaining_time": "9:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 844, "total_steps": 1730, "loss": 0.7795, "learning_rate": 4.87723741104276e-06, "epoch": 0.9750180505415162, "percentage": 48.79, "elapsed_time": "8:37:40", "remaining_time": "9:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 845, "total_steps": 1730, "loss": 0.8024, "learning_rate": 4.878094514916154e-06, "epoch": 0.976173285198556, "percentage": 48.84, "elapsed_time": "8:38:14", "remaining_time": "9:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 846, "total_steps": 1730, "loss": 0.8273, "learning_rate": 4.87895060506504e-06, "epoch": 0.9773285198555957, "percentage": 48.9, "elapsed_time": "8:38:48", "remaining_time": "9:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 847, "total_steps": 1730, "loss": 0.8249, "learning_rate": 4.879805683884512e-06, "epoch": 0.9784837545126354, "percentage": 48.96, "elapsed_time": "8:39:22", "remaining_time": "9:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 848, "total_steps": 1730, "loss": 0.8009, "learning_rate": 4.88065975376119e-06, "epoch": 0.9796389891696751, "percentage": 49.02, "elapsed_time": "8:39:55", "remaining_time": "9:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 849, "total_steps": 1730, "loss": 0.8114, "learning_rate": 4.881512817073255e-06, "epoch": 0.9807942238267148, "percentage": 49.08, "elapsed_time": "8:40:29", "remaining_time": "9:00:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 1730, "loss": 0.7919, "learning_rate": 4.882364876190489e-06, "epoch": 0.9819494584837545, "percentage": 49.13, "elapsed_time": "8:41:03", "remaining_time": "8:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 851, "total_steps": 1730, "loss": 0.7986, "learning_rate": 4.883215933474314e-06, "epoch": 0.9831046931407942, "percentage": 49.19, "elapsed_time": "8:41:37", "remaining_time": "8:58:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 852, "total_steps": 1730, "loss": 0.8142, "learning_rate": 4.884065991277834e-06, "epoch": 0.9842599277978339, "percentage": 49.25, "elapsed_time": "8:42:11", "remaining_time": "8:58:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 853, "total_steps": 1730, "loss": 0.7958, "learning_rate": 4.8849150519458725e-06, "epoch": 0.9854151624548736, "percentage": 49.31, "elapsed_time": "8:42:45", "remaining_time": "8:57:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 854, "total_steps": 1730, "loss": 0.8132, "learning_rate": 4.88576311781501e-06, "epoch": 0.9865703971119134, "percentage": 49.36, "elapsed_time": "8:43:19", "remaining_time": "8:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 855, "total_steps": 1730, "loss": 0.8156, "learning_rate": 4.886610191213622e-06, "epoch": 0.9877256317689531, "percentage": 49.42, "elapsed_time": "8:43:53", "remaining_time": "8:56:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 856, "total_steps": 1730, "loss": 0.8221, "learning_rate": 4.8874562744619224e-06, "epoch": 0.9888808664259928, "percentage": 49.48, "elapsed_time": "8:44:27", "remaining_time": "8:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 857, "total_steps": 1730, "loss": 0.8267, "learning_rate": 4.888301369871998e-06, "epoch": 0.9900361010830325, "percentage": 49.54, "elapsed_time": "8:45:02", "remaining_time": "8:54:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 858, "total_steps": 1730, "loss": 0.8206, "learning_rate": 4.8891454797478435e-06, "epoch": 0.9911913357400722, "percentage": 49.6, "elapsed_time": "8:45:36", "remaining_time": "8:54:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 859, "total_steps": 1730, "loss": 0.8466, "learning_rate": 4.889988606385404e-06, "epoch": 0.9923465703971119, "percentage": 49.65, "elapsed_time": "8:46:09", "remaining_time": "8:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 860, "total_steps": 1730, "loss": 0.801, "learning_rate": 4.890830752072613e-06, "epoch": 0.9935018050541516, "percentage": 49.71, "elapsed_time": "8:46:43", "remaining_time": "8:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 861, "total_steps": 1730, "loss": 0.7935, "learning_rate": 4.891671919089425e-06, "epoch": 0.9946570397111913, "percentage": 49.77, "elapsed_time": "8:47:17", "remaining_time": "8:52:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 862, "total_steps": 1730, "loss": 0.8104, "learning_rate": 4.892512109707855e-06, "epoch": 0.995812274368231, "percentage": 49.83, "elapsed_time": "8:47:51", "remaining_time": "8:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 863, "total_steps": 1730, "loss": 0.7755, "learning_rate": 4.893351326192016e-06, "epoch": 0.9969675090252708, "percentage": 49.88, "elapsed_time": "8:48:26", "remaining_time": "8:50:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 864, "total_steps": 1730, "loss": 0.783, "learning_rate": 4.8941895707981555e-06, "epoch": 0.9981227436823105, "percentage": 49.94, "elapsed_time": "8:48:59", "remaining_time": "8:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 865, "total_steps": 1730, "loss": 0.7952, "learning_rate": 4.895026845774691e-06, "epoch": 0.9992779783393502, "percentage": 50.0, "elapsed_time": "8:49:33", "remaining_time": "8:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 866, "total_steps": 1730, "loss": 1.0888, "learning_rate": 4.895863153362244e-06, "epoch": 1.00043321299639, "percentage": 50.06, "elapsed_time": "8:50:07", "remaining_time": "8:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 867, "total_steps": 1730, "loss": 0.8026, "learning_rate": 4.8966984957936845e-06, "epoch": 1.0015884476534296, "percentage": 50.12, "elapsed_time": "8:50:40", "remaining_time": "8:48:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 868, "total_steps": 1730, "loss": 0.7892, "learning_rate": 4.897532875294154e-06, "epoch": 1.0027436823104694, "percentage": 50.17, "elapsed_time": "8:51:14", "remaining_time": "8:47:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 869, "total_steps": 1730, "loss": 0.7766, "learning_rate": 4.898366294081111e-06, "epoch": 1.003898916967509, "percentage": 50.23, "elapsed_time": "8:51:48", "remaining_time": "8:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 870, "total_steps": 1730, "loss": 0.794, "learning_rate": 4.899198754364365e-06, "epoch": 1.0050541516245488, "percentage": 50.29, "elapsed_time": "8:52:22", "remaining_time": "8:46:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 871, "total_steps": 1730, "loss": 0.787, "learning_rate": 4.900030258346106e-06, "epoch": 1.0062093862815884, "percentage": 50.35, "elapsed_time": "8:52:56", "remaining_time": "8:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 872, "total_steps": 1730, "loss": 0.7726, "learning_rate": 4.900860808220946e-06, "epoch": 1.0073646209386282, "percentage": 50.4, "elapsed_time": "8:53:29", "remaining_time": "8:44:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 873, "total_steps": 1730, "loss": 0.7672, "learning_rate": 4.90169040617595e-06, "epoch": 1.0085198555956678, "percentage": 50.46, "elapsed_time": "8:54:03", "remaining_time": "8:44:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 874, "total_steps": 1730, "loss": 0.7804, "learning_rate": 4.902519054390672e-06, "epoch": 1.0096750902527076, "percentage": 50.52, "elapsed_time": "8:54:37", "remaining_time": "8:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 875, "total_steps": 1730, "loss": 0.7895, "learning_rate": 4.9033467550371886e-06, "epoch": 1.0108303249097472, "percentage": 50.58, "elapsed_time": "8:55:12", "remaining_time": "8:42:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 876, "total_steps": 1730, "loss": 0.7916, "learning_rate": 4.904173510280135e-06, "epoch": 1.011985559566787, "percentage": 50.64, "elapsed_time": "8:55:45", "remaining_time": "8:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 877, "total_steps": 1730, "loss": 0.7975, "learning_rate": 4.904999322276735e-06, "epoch": 1.0131407942238266, "percentage": 50.69, "elapsed_time": "8:56:19", "remaining_time": "8:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 878, "total_steps": 1730, "loss": 0.7881, "learning_rate": 4.905824193176839e-06, "epoch": 1.0142960288808665, "percentage": 50.75, "elapsed_time": "8:56:53", "remaining_time": "8:40:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 879, "total_steps": 1730, "loss": 0.7897, "learning_rate": 4.906648125122953e-06, "epoch": 1.015451263537906, "percentage": 50.81, "elapsed_time": "8:57:27", "remaining_time": "8:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 880, "total_steps": 1730, "loss": 0.7735, "learning_rate": 4.907471120250281e-06, "epoch": 1.0166064981949459, "percentage": 50.87, "elapsed_time": "8:58:00", "remaining_time": "8:39:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 881, "total_steps": 1730, "loss": 0.788, "learning_rate": 4.9082931806867475e-06, "epoch": 1.0177617328519855, "percentage": 50.92, "elapsed_time": "8:58:35", "remaining_time": "8:39:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 882, "total_steps": 1730, "loss": 0.7902, "learning_rate": 4.909114308553034e-06, "epoch": 1.0189169675090253, "percentage": 50.98, "elapsed_time": "8:59:09", "remaining_time": "8:38:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 883, "total_steps": 1730, "loss": 0.8, "learning_rate": 4.909934505962614e-06, "epoch": 1.020072202166065, "percentage": 51.04, "elapsed_time": "8:59:43", "remaining_time": "8:37:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 884, "total_steps": 1730, "loss": 0.7957, "learning_rate": 4.9107537750217884e-06, "epoch": 1.0212274368231047, "percentage": 51.1, "elapsed_time": "9:00:16", "remaining_time": "8:37:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 885, "total_steps": 1730, "loss": 0.7986, "learning_rate": 4.9115721178297095e-06, "epoch": 1.0223826714801445, "percentage": 51.16, "elapsed_time": "9:00:50", "remaining_time": "8:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 886, "total_steps": 1730, "loss": 0.7611, "learning_rate": 4.9123895364784185e-06, "epoch": 1.023537906137184, "percentage": 51.21, "elapsed_time": "9:01:24", "remaining_time": "8:35:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 887, "total_steps": 1730, "loss": 0.808, "learning_rate": 4.913206033052878e-06, "epoch": 1.024693140794224, "percentage": 51.27, "elapsed_time": "9:01:58", "remaining_time": "8:35:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 888, "total_steps": 1730, "loss": 0.7432, "learning_rate": 4.914021609631002e-06, "epoch": 1.0258483754512635, "percentage": 51.33, "elapsed_time": "9:02:31", "remaining_time": "8:34:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 889, "total_steps": 1730, "loss": 0.7872, "learning_rate": 4.914836268283691e-06, "epoch": 1.0270036101083033, "percentage": 51.39, "elapsed_time": "9:03:05", "remaining_time": "8:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 890, "total_steps": 1730, "loss": 0.7876, "learning_rate": 4.915650011074855e-06, "epoch": 1.028158844765343, "percentage": 51.45, "elapsed_time": "9:03:40", "remaining_time": "8:33:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 891, "total_steps": 1730, "loss": 0.7919, "learning_rate": 4.916462840061458e-06, "epoch": 1.0293140794223827, "percentage": 51.5, "elapsed_time": "9:04:13", "remaining_time": "8:32:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 892, "total_steps": 1730, "loss": 0.7961, "learning_rate": 4.917274757293539e-06, "epoch": 1.0304693140794223, "percentage": 51.56, "elapsed_time": "9:04:47", "remaining_time": "8:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 893, "total_steps": 1730, "loss": 0.7908, "learning_rate": 4.918085764814244e-06, "epoch": 1.0316245487364621, "percentage": 51.62, "elapsed_time": "9:05:21", "remaining_time": "8:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 894, "total_steps": 1730, "loss": 0.7752, "learning_rate": 4.918895864659863e-06, "epoch": 1.0327797833935017, "percentage": 51.68, "elapsed_time": "9:05:55", "remaining_time": "8:30:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 895, "total_steps": 1730, "loss": 0.8114, "learning_rate": 4.919705058859854e-06, "epoch": 1.0339350180505416, "percentage": 51.73, "elapsed_time": "9:06:29", "remaining_time": "8:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 896, "total_steps": 1730, "loss": 0.801, "learning_rate": 4.920513349436876e-06, "epoch": 1.0350902527075811, "percentage": 51.79, "elapsed_time": "9:07:03", "remaining_time": "8:29:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 897, "total_steps": 1730, "loss": 0.7736, "learning_rate": 4.921320738406821e-06, "epoch": 1.036245487364621, "percentage": 51.85, "elapsed_time": "9:07:37", "remaining_time": "8:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 898, "total_steps": 1730, "loss": 0.7968, "learning_rate": 4.922127227778841e-06, "epoch": 1.0374007220216606, "percentage": 51.91, "elapsed_time": "9:08:11", "remaining_time": "8:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 899, "total_steps": 1730, "loss": 0.7695, "learning_rate": 4.922932819555381e-06, "epoch": 1.0385559566787004, "percentage": 51.97, "elapsed_time": "9:08:45", "remaining_time": "8:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 1730, "loss": 0.7764, "learning_rate": 4.923737515732209e-06, "epoch": 1.03971119133574, "percentage": 52.02, "elapsed_time": "9:09:19", "remaining_time": "8:26:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 901, "total_steps": 1730, "loss": 0.7881, "learning_rate": 4.924541318298439e-06, "epoch": 1.0408664259927798, "percentage": 52.08, "elapsed_time": "9:09:53", "remaining_time": "8:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 902, "total_steps": 1730, "loss": 0.791, "learning_rate": 4.925344229236571e-06, "epoch": 1.0420216606498194, "percentage": 52.14, "elapsed_time": "9:10:26", "remaining_time": "8:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 903, "total_steps": 1730, "loss": 0.778, "learning_rate": 4.926146250522511e-06, "epoch": 1.0431768953068592, "percentage": 52.2, "elapsed_time": "9:11:00", "remaining_time": "8:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 904, "total_steps": 1730, "loss": 0.7784, "learning_rate": 4.926947384125606e-06, "epoch": 1.044332129963899, "percentage": 52.25, "elapsed_time": "9:11:34", "remaining_time": "8:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 905, "total_steps": 1730, "loss": 0.7729, "learning_rate": 4.927747632008672e-06, "epoch": 1.0454873646209386, "percentage": 52.31, "elapsed_time": "9:12:08", "remaining_time": "8:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 906, "total_steps": 1730, "loss": 0.7846, "learning_rate": 4.928546996128022e-06, "epoch": 1.0466425992779784, "percentage": 52.37, "elapsed_time": "9:12:42", "remaining_time": "8:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 907, "total_steps": 1730, "loss": 0.7672, "learning_rate": 4.929345478433492e-06, "epoch": 1.047797833935018, "percentage": 52.43, "elapsed_time": "9:13:16", "remaining_time": "8:22:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 908, "total_steps": 1730, "loss": 0.777, "learning_rate": 4.930143080868476e-06, "epoch": 1.0489530685920578, "percentage": 52.49, "elapsed_time": "9:13:50", "remaining_time": "8:21:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 909, "total_steps": 1730, "loss": 0.8104, "learning_rate": 4.930939805369947e-06, "epoch": 1.0501083032490974, "percentage": 52.54, "elapsed_time": "9:14:23", "remaining_time": "8:20:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 1730, "loss": 0.7729, "learning_rate": 4.931735653868489e-06, "epoch": 1.0512635379061372, "percentage": 52.6, "elapsed_time": "9:14:58", "remaining_time": "8:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 911, "total_steps": 1730, "loss": 0.7957, "learning_rate": 4.932530628288331e-06, "epoch": 1.0524187725631768, "percentage": 52.66, "elapsed_time": "9:15:31", "remaining_time": "8:19:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 912, "total_steps": 1730, "loss": 0.7988, "learning_rate": 4.933324730547361e-06, "epoch": 1.0535740072202167, "percentage": 52.72, "elapsed_time": "9:16:05", "remaining_time": "8:18:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 913, "total_steps": 1730, "loss": 0.7637, "learning_rate": 4.934117962557165e-06, "epoch": 1.0547292418772563, "percentage": 52.77, "elapsed_time": "9:16:39", "remaining_time": "8:18:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 914, "total_steps": 1730, "loss": 0.77, "learning_rate": 4.934910326223052e-06, "epoch": 1.055884476534296, "percentage": 52.83, "elapsed_time": "9:17:13", "remaining_time": "8:17:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 915, "total_steps": 1730, "loss": 0.7778, "learning_rate": 4.93570182344408e-06, "epoch": 1.0570397111913357, "percentage": 52.89, "elapsed_time": "9:17:46", "remaining_time": "8:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 916, "total_steps": 1730, "loss": 0.7879, "learning_rate": 4.936492456113085e-06, "epoch": 1.0581949458483755, "percentage": 52.95, "elapsed_time": "9:18:21", "remaining_time": "8:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 917, "total_steps": 1730, "loss": 0.7698, "learning_rate": 4.937282226116702e-06, "epoch": 1.059350180505415, "percentage": 53.01, "elapsed_time": "9:18:55", "remaining_time": "8:15:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 918, "total_steps": 1730, "loss": 0.7637, "learning_rate": 4.938071135335405e-06, "epoch": 1.060505415162455, "percentage": 53.06, "elapsed_time": "9:19:28", "remaining_time": "8:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 919, "total_steps": 1730, "loss": 0.8057, "learning_rate": 4.938859185643519e-06, "epoch": 1.0616606498194945, "percentage": 53.12, "elapsed_time": "9:20:03", "remaining_time": "8:14:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 920, "total_steps": 1730, "loss": 0.7773, "learning_rate": 4.93964637890926e-06, "epoch": 1.0628158844765343, "percentage": 53.18, "elapsed_time": "9:20:36", "remaining_time": "8:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 921, "total_steps": 1730, "loss": 0.7912, "learning_rate": 4.9404327169947486e-06, "epoch": 1.0639711191335741, "percentage": 53.24, "elapsed_time": "9:21:10", "remaining_time": "8:12:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 922, "total_steps": 1730, "loss": 0.7873, "learning_rate": 4.941218201756049e-06, "epoch": 1.0651263537906137, "percentage": 53.29, "elapsed_time": "9:21:44", "remaining_time": "8:12:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 923, "total_steps": 1730, "loss": 0.7853, "learning_rate": 4.942002835043187e-06, "epoch": 1.0662815884476535, "percentage": 53.35, "elapsed_time": "9:22:18", "remaining_time": "8:11:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 924, "total_steps": 1730, "loss": 0.7853, "learning_rate": 4.9427866187001785e-06, "epoch": 1.0674368231046931, "percentage": 53.41, "elapsed_time": "9:22:52", "remaining_time": "8:10:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 925, "total_steps": 1730, "loss": 0.7851, "learning_rate": 4.943569554565055e-06, "epoch": 1.068592057761733, "percentage": 53.47, "elapsed_time": "9:23:26", "remaining_time": "8:10:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 926, "total_steps": 1730, "loss": 0.7881, "learning_rate": 4.9443516444698915e-06, "epoch": 1.0697472924187725, "percentage": 53.53, "elapsed_time": "9:24:00", "remaining_time": "8:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 927, "total_steps": 1730, "loss": 0.813, "learning_rate": 4.945132890240829e-06, "epoch": 1.0709025270758123, "percentage": 53.58, "elapsed_time": "9:24:34", "remaining_time": "8:09:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 928, "total_steps": 1730, "loss": 0.7998, "learning_rate": 4.9459132936981044e-06, "epoch": 1.072057761732852, "percentage": 53.64, "elapsed_time": "9:25:08", "remaining_time": "8:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 929, "total_steps": 1730, "loss": 0.764, "learning_rate": 4.94669285665607e-06, "epoch": 1.0732129963898918, "percentage": 53.7, "elapsed_time": "9:25:42", "remaining_time": "8:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 930, "total_steps": 1730, "loss": 0.7734, "learning_rate": 4.9474715809232256e-06, "epoch": 1.0743682310469314, "percentage": 53.76, "elapsed_time": "9:26:15", "remaining_time": "8:07:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 931, "total_steps": 1730, "loss": 0.7959, "learning_rate": 4.948249468302239e-06, "epoch": 1.0755234657039712, "percentage": 53.82, "elapsed_time": "9:26:50", "remaining_time": "8:06:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 932, "total_steps": 1730, "loss": 0.7987, "learning_rate": 4.9490265205899695e-06, "epoch": 1.0766787003610108, "percentage": 53.87, "elapsed_time": "9:27:23", "remaining_time": "8:05:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 933, "total_steps": 1730, "loss": 0.8067, "learning_rate": 4.949802739577501e-06, "epoch": 1.0778339350180506, "percentage": 53.93, "elapsed_time": "9:27:57", "remaining_time": "8:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 934, "total_steps": 1730, "loss": 0.7855, "learning_rate": 4.950578127050157e-06, "epoch": 1.0789891696750902, "percentage": 53.99, "elapsed_time": "9:28:31", "remaining_time": "8:04:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 935, "total_steps": 1730, "loss": 0.7821, "learning_rate": 4.95135268478753e-06, "epoch": 1.08014440433213, "percentage": 54.05, "elapsed_time": "9:29:07", "remaining_time": "8:03:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 936, "total_steps": 1730, "loss": 0.7954, "learning_rate": 4.952126414563509e-06, "epoch": 1.0812996389891696, "percentage": 54.1, "elapsed_time": "9:29:40", "remaining_time": "8:03:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 937, "total_steps": 1730, "loss": 0.771, "learning_rate": 4.952899318146298e-06, "epoch": 1.0824548736462094, "percentage": 54.16, "elapsed_time": "9:30:14", "remaining_time": "8:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 938, "total_steps": 1730, "loss": 0.7737, "learning_rate": 4.953671397298441e-06, "epoch": 1.083610108303249, "percentage": 54.22, "elapsed_time": "9:30:47", "remaining_time": "8:01:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 939, "total_steps": 1730, "loss": 0.7702, "learning_rate": 4.954442653776852e-06, "epoch": 1.0847653429602888, "percentage": 54.28, "elapsed_time": "9:31:22", "remaining_time": "8:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 940, "total_steps": 1730, "loss": 0.772, "learning_rate": 4.955213089332832e-06, "epoch": 1.0859205776173284, "percentage": 54.34, "elapsed_time": "9:31:55", "remaining_time": "8:00:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 941, "total_steps": 1730, "loss": 0.7828, "learning_rate": 4.955982705712095e-06, "epoch": 1.0870758122743682, "percentage": 54.39, "elapsed_time": "9:32:29", "remaining_time": "8:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 942, "total_steps": 1730, "loss": 0.7848, "learning_rate": 4.956751504654796e-06, "epoch": 1.088231046931408, "percentage": 54.45, "elapsed_time": "9:33:03", "remaining_time": "7:59:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 943, "total_steps": 1730, "loss": 0.7655, "learning_rate": 4.957519487895548e-06, "epoch": 1.0893862815884476, "percentage": 54.51, "elapsed_time": "9:33:37", "remaining_time": "7:58:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 944, "total_steps": 1730, "loss": 0.773, "learning_rate": 4.958286657163448e-06, "epoch": 1.0905415162454875, "percentage": 54.57, "elapsed_time": "9:34:11", "remaining_time": "7:58:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 945, "total_steps": 1730, "loss": 0.7755, "learning_rate": 4.959053014182106e-06, "epoch": 1.091696750902527, "percentage": 54.62, "elapsed_time": "9:34:44", "remaining_time": "7:57:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 946, "total_steps": 1730, "loss": 0.8009, "learning_rate": 4.959818560669656e-06, "epoch": 1.0928519855595669, "percentage": 54.68, "elapsed_time": "9:35:18", "remaining_time": "7:56:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 947, "total_steps": 1730, "loss": 0.7705, "learning_rate": 4.96058329833879e-06, "epoch": 1.0940072202166065, "percentage": 54.74, "elapsed_time": "9:35:52", "remaining_time": "7:56:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 948, "total_steps": 1730, "loss": 0.7727, "learning_rate": 4.9613472288967775e-06, "epoch": 1.0951624548736463, "percentage": 54.8, "elapsed_time": "9:36:26", "remaining_time": "7:55:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 949, "total_steps": 1730, "loss": 0.7921, "learning_rate": 4.962110354045489e-06, "epoch": 1.0963176895306859, "percentage": 54.86, "elapsed_time": "9:37:00", "remaining_time": "7:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 1730, "loss": 0.7827, "learning_rate": 4.962872675481414e-06, "epoch": 1.0974729241877257, "percentage": 54.91, "elapsed_time": "9:37:34", "remaining_time": "7:54:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 951, "total_steps": 1730, "loss": 0.7663, "learning_rate": 4.96363419489569e-06, "epoch": 1.0986281588447653, "percentage": 54.97, "elapsed_time": "9:38:08", "remaining_time": "7:53:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 952, "total_steps": 1730, "loss": 0.7735, "learning_rate": 4.964394913974124e-06, "epoch": 1.099783393501805, "percentage": 55.03, "elapsed_time": "9:38:42", "remaining_time": "7:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 953, "total_steps": 1730, "loss": 0.8092, "learning_rate": 4.965154834397211e-06, "epoch": 1.1009386281588447, "percentage": 55.09, "elapsed_time": "9:39:16", "remaining_time": "7:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 954, "total_steps": 1730, "loss": 0.791, "learning_rate": 4.965913957840159e-06, "epoch": 1.1020938628158845, "percentage": 55.14, "elapsed_time": "9:39:50", "remaining_time": "7:51:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 955, "total_steps": 1730, "loss": 0.7682, "learning_rate": 4.966672285972911e-06, "epoch": 1.103249097472924, "percentage": 55.2, "elapsed_time": "9:40:24", "remaining_time": "7:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 956, "total_steps": 1730, "loss": 0.7934, "learning_rate": 4.967429820460167e-06, "epoch": 1.104404332129964, "percentage": 55.26, "elapsed_time": "9:40:58", "remaining_time": "7:50:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 957, "total_steps": 1730, "loss": 0.7758, "learning_rate": 4.968186562961406e-06, "epoch": 1.1055595667870035, "percentage": 55.32, "elapsed_time": "9:41:32", "remaining_time": "7:49:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 958, "total_steps": 1730, "loss": 0.7949, "learning_rate": 4.968942515130908e-06, "epoch": 1.1067148014440433, "percentage": 55.38, "elapsed_time": "9:42:06", "remaining_time": "7:49:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 959, "total_steps": 1730, "loss": 0.801, "learning_rate": 4.969697678617774e-06, "epoch": 1.1078700361010831, "percentage": 55.43, "elapsed_time": "9:42:40", "remaining_time": "7:48:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 960, "total_steps": 1730, "loss": 0.7872, "learning_rate": 4.970452055065948e-06, "epoch": 1.1090252707581227, "percentage": 55.49, "elapsed_time": "9:43:14", "remaining_time": "7:47:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 961, "total_steps": 1730, "loss": 0.8076, "learning_rate": 4.971205646114243e-06, "epoch": 1.1101805054151626, "percentage": 55.55, "elapsed_time": "9:43:48", "remaining_time": "7:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 962, "total_steps": 1730, "loss": 0.7646, "learning_rate": 4.9719584533963555e-06, "epoch": 1.1113357400722021, "percentage": 55.61, "elapsed_time": "9:44:22", "remaining_time": "7:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 963, "total_steps": 1730, "loss": 0.7704, "learning_rate": 4.9727104785408915e-06, "epoch": 1.112490974729242, "percentage": 55.66, "elapsed_time": "9:44:56", "remaining_time": "7:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 964, "total_steps": 1730, "loss": 0.7787, "learning_rate": 4.973461723171385e-06, "epoch": 1.1136462093862816, "percentage": 55.72, "elapsed_time": "9:45:30", "remaining_time": "7:45:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 965, "total_steps": 1730, "loss": 0.7824, "learning_rate": 4.974212188906321e-06, "epoch": 1.1148014440433214, "percentage": 55.78, "elapsed_time": "9:46:04", "remaining_time": "7:44:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 966, "total_steps": 1730, "loss": 0.8069, "learning_rate": 4.974961877359156e-06, "epoch": 1.115956678700361, "percentage": 55.84, "elapsed_time": "9:46:38", "remaining_time": "7:43:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 967, "total_steps": 1730, "loss": 0.7603, "learning_rate": 4.975710790138337e-06, "epoch": 1.1171119133574008, "percentage": 55.9, "elapsed_time": "9:47:12", "remaining_time": "7:43:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 968, "total_steps": 1730, "loss": 0.7884, "learning_rate": 4.976458928847323e-06, "epoch": 1.1182671480144404, "percentage": 55.95, "elapsed_time": "9:47:45", "remaining_time": "7:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 969, "total_steps": 1730, "loss": 0.7902, "learning_rate": 4.977206295084609e-06, "epoch": 1.1194223826714802, "percentage": 56.01, "elapsed_time": "9:48:20", "remaining_time": "7:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 970, "total_steps": 1730, "loss": 0.7927, "learning_rate": 4.977952890443742e-06, "epoch": 1.1205776173285198, "percentage": 56.07, "elapsed_time": "9:48:54", "remaining_time": "7:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 971, "total_steps": 1730, "loss": 0.8075, "learning_rate": 4.978698716513342e-06, "epoch": 1.1217328519855596, "percentage": 56.13, "elapsed_time": "9:49:28", "remaining_time": "7:40:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 972, "total_steps": 1730, "loss": 0.767, "learning_rate": 4.9794437748771245e-06, "epoch": 1.1228880866425992, "percentage": 56.18, "elapsed_time": "9:50:02", "remaining_time": "7:40:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 973, "total_steps": 1730, "loss": 0.8103, "learning_rate": 4.98018806711392e-06, "epoch": 1.124043321299639, "percentage": 56.24, "elapsed_time": "9:50:35", "remaining_time": "7:39:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 974, "total_steps": 1730, "loss": 0.7939, "learning_rate": 4.980931594797693e-06, "epoch": 1.1251985559566786, "percentage": 56.3, "elapsed_time": "9:51:10", "remaining_time": "7:38:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 975, "total_steps": 1730, "loss": 0.7986, "learning_rate": 4.981674359497562e-06, "epoch": 1.1263537906137184, "percentage": 56.36, "elapsed_time": "9:51:44", "remaining_time": "7:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 976, "total_steps": 1730, "loss": 0.7765, "learning_rate": 4.98241636277782e-06, "epoch": 1.1275090252707582, "percentage": 56.42, "elapsed_time": "9:52:17", "remaining_time": "7:37:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 977, "total_steps": 1730, "loss": 0.7786, "learning_rate": 4.9831576061979556e-06, "epoch": 1.1286642599277978, "percentage": 56.47, "elapsed_time": "9:52:51", "remaining_time": "7:36:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 978, "total_steps": 1730, "loss": 0.7663, "learning_rate": 4.98389809131267e-06, "epoch": 1.1298194945848374, "percentage": 56.53, "elapsed_time": "9:53:24", "remaining_time": "7:36:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 979, "total_steps": 1730, "loss": 0.8018, "learning_rate": 4.984637819671897e-06, "epoch": 1.1309747292418773, "percentage": 56.59, "elapsed_time": "9:53:58", "remaining_time": "7:35:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 1730, "loss": 0.8052, "learning_rate": 4.985376792820825e-06, "epoch": 1.132129963898917, "percentage": 56.65, "elapsed_time": "9:54:32", "remaining_time": "7:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 981, "total_steps": 1730, "loss": 0.7608, "learning_rate": 4.986115012299915e-06, "epoch": 1.1332851985559567, "percentage": 56.71, "elapsed_time": "9:55:06", "remaining_time": "7:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 982, "total_steps": 1730, "loss": 0.8069, "learning_rate": 4.986852479644916e-06, "epoch": 1.1344404332129965, "percentage": 56.76, "elapsed_time": "9:55:39", "remaining_time": "7:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 983, "total_steps": 1730, "loss": 0.7694, "learning_rate": 4.987589196386893e-06, "epoch": 1.135595667870036, "percentage": 56.82, "elapsed_time": "9:56:13", "remaining_time": "7:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 984, "total_steps": 1730, "loss": 0.7738, "learning_rate": 4.988325164052236e-06, "epoch": 1.136750902527076, "percentage": 56.88, "elapsed_time": "9:56:47", "remaining_time": "7:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 985, "total_steps": 1730, "loss": 0.7624, "learning_rate": 4.989060384162687e-06, "epoch": 1.1379061371841155, "percentage": 56.94, "elapsed_time": "9:57:21", "remaining_time": "7:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 986, "total_steps": 1730, "loss": 0.7827, "learning_rate": 4.989794858235352e-06, "epoch": 1.1390613718411553, "percentage": 56.99, "elapsed_time": "9:57:54", "remaining_time": "7:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 987, "total_steps": 1730, "loss": 0.7849, "learning_rate": 4.990528587782728e-06, "epoch": 1.140216606498195, "percentage": 57.05, "elapsed_time": "9:58:28", "remaining_time": "7:30:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 988, "total_steps": 1730, "loss": 0.8019, "learning_rate": 4.991261574312715e-06, "epoch": 1.1413718411552347, "percentage": 57.11, "elapsed_time": "9:59:01", "remaining_time": "7:29:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 989, "total_steps": 1730, "loss": 0.8075, "learning_rate": 4.991993819328633e-06, "epoch": 1.1425270758122743, "percentage": 57.17, "elapsed_time": "9:59:35", "remaining_time": "7:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 990, "total_steps": 1730, "loss": 0.7916, "learning_rate": 4.992725324329251e-06, "epoch": 1.1436823104693141, "percentage": 57.23, "elapsed_time": "10:00:09", "remaining_time": "7:28:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 991, "total_steps": 1730, "loss": 0.7943, "learning_rate": 4.993456090808793e-06, "epoch": 1.1448375451263537, "percentage": 57.28, "elapsed_time": "10:00:42", "remaining_time": "7:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 992, "total_steps": 1730, "loss": 0.7993, "learning_rate": 4.994186120256964e-06, "epoch": 1.1459927797833935, "percentage": 57.34, "elapsed_time": "10:01:16", "remaining_time": "7:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 993, "total_steps": 1730, "loss": 0.7806, "learning_rate": 4.99491541415897e-06, "epoch": 1.1471480144404331, "percentage": 57.4, "elapsed_time": "10:01:51", "remaining_time": "7:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 994, "total_steps": 1730, "loss": 0.7753, "learning_rate": 4.995643973995523e-06, "epoch": 1.148303249097473, "percentage": 57.46, "elapsed_time": "10:02:25", "remaining_time": "7:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 995, "total_steps": 1730, "loss": 0.7487, "learning_rate": 4.996371801242876e-06, "epoch": 1.1494584837545125, "percentage": 57.51, "elapsed_time": "10:02:59", "remaining_time": "7:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 996, "total_steps": 1730, "loss": 0.7776, "learning_rate": 4.997098897372832e-06, "epoch": 1.1506137184115524, "percentage": 57.57, "elapsed_time": "10:03:33", "remaining_time": "7:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 997, "total_steps": 1730, "loss": 0.7718, "learning_rate": 4.99782526385276e-06, "epoch": 1.1517689530685922, "percentage": 57.63, "elapsed_time": "10:04:07", "remaining_time": "7:24:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 998, "total_steps": 1730, "loss": 0.7849, "learning_rate": 4.998550902145619e-06, "epoch": 1.1529241877256318, "percentage": 57.69, "elapsed_time": "10:04:40", "remaining_time": "7:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 999, "total_steps": 1730, "loss": 0.7944, "learning_rate": 4.999275813709971e-06, "epoch": 1.1540794223826714, "percentage": 57.75, "elapsed_time": "10:05:14", "remaining_time": "7:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 1730, "loss": 0.8039, "learning_rate": 5e-06, "epoch": 1.1552346570397112, "percentage": 57.8, "elapsed_time": "10:05:47", "remaining_time": "7:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1001, "total_steps": 1730, "loss": 0.792, "learning_rate": 4.999976851655541e-06, "epoch": 1.156389891696751, "percentage": 57.86, "elapsed_time": "10:21:05", "remaining_time": "7:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1002, "total_steps": 1730, "loss": 0.7816, "learning_rate": 4.999907407050885e-06, "epoch": 1.1575451263537906, "percentage": 57.92, "elapsed_time": "10:21:40", "remaining_time": "7:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1003, "total_steps": 1730, "loss": 0.7473, "learning_rate": 4.999791667472181e-06, "epoch": 1.1587003610108304, "percentage": 57.98, "elapsed_time": "10:22:13", "remaining_time": "7:31:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1004, "total_steps": 1730, "loss": 0.7964, "learning_rate": 4.999629635062988e-06, "epoch": 1.15985559566787, "percentage": 58.03, "elapsed_time": "10:22:47", "remaining_time": "7:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1005, "total_steps": 1730, "loss": 0.7885, "learning_rate": 4.999421312824233e-06, "epoch": 1.1610108303249098, "percentage": 58.09, "elapsed_time": "10:23:21", "remaining_time": "7:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1006, "total_steps": 1730, "loss": 0.7553, "learning_rate": 4.99916670461415e-06, "epoch": 1.1621660649819494, "percentage": 58.15, "elapsed_time": "10:23:55", "remaining_time": "7:29:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1007, "total_steps": 1730, "loss": 0.757, "learning_rate": 4.998865815148222e-06, "epoch": 1.1633212996389892, "percentage": 58.21, "elapsed_time": "10:24:29", "remaining_time": "7:28:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1008, "total_steps": 1730, "loss": 0.793, "learning_rate": 4.998518649999077e-06, "epoch": 1.1644765342960288, "percentage": 58.27, "elapsed_time": "10:25:04", "remaining_time": "7:27:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1009, "total_steps": 1730, "loss": 0.7684, "learning_rate": 4.998125215596399e-06, "epoch": 1.1656317689530686, "percentage": 58.32, "elapsed_time": "10:25:37", "remaining_time": "7:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1010, "total_steps": 1730, "loss": 0.794, "learning_rate": 4.9976855192268e-06, "epoch": 1.1667870036101082, "percentage": 58.38, "elapsed_time": "10:26:11", "remaining_time": "7:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1011, "total_steps": 1730, "loss": 0.7872, "learning_rate": 4.997199569033688e-06, "epoch": 1.167942238267148, "percentage": 58.44, "elapsed_time": "10:26:45", "remaining_time": "7:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1012, "total_steps": 1730, "loss": 0.797, "learning_rate": 4.996667374017118e-06, "epoch": 1.1690974729241876, "percentage": 58.5, "elapsed_time": "10:27:19", "remaining_time": "7:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1013, "total_steps": 1730, "loss": 0.7912, "learning_rate": 4.996088944033622e-06, "epoch": 1.1702527075812275, "percentage": 58.55, "elapsed_time": "10:27:53", "remaining_time": "7:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1014, "total_steps": 1730, "loss": 0.7714, "learning_rate": 4.995464289796029e-06, "epoch": 1.171407942238267, "percentage": 58.61, "elapsed_time": "10:28:27", "remaining_time": "7:23:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1015, "total_steps": 1730, "loss": 0.7755, "learning_rate": 4.994793422873265e-06, "epoch": 1.1725631768953069, "percentage": 58.67, "elapsed_time": "10:29:01", "remaining_time": "7:23:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1016, "total_steps": 1730, "loss": 0.8052, "learning_rate": 4.994076355690139e-06, "epoch": 1.1737184115523465, "percentage": 58.73, "elapsed_time": "10:29:35", "remaining_time": "7:22:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1017, "total_steps": 1730, "loss": 0.7955, "learning_rate": 4.993313101527112e-06, "epoch": 1.1748736462093863, "percentage": 58.79, "elapsed_time": "10:30:09", "remaining_time": "7:21:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1018, "total_steps": 1730, "loss": 0.7595, "learning_rate": 4.992503674520057e-06, "epoch": 1.176028880866426, "percentage": 58.84, "elapsed_time": "10:30:43", "remaining_time": "7:21:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1019, "total_steps": 1730, "loss": 0.7812, "learning_rate": 4.991648089659987e-06, "epoch": 1.1771841155234657, "percentage": 58.9, "elapsed_time": "10:31:16", "remaining_time": "7:20:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1020, "total_steps": 1730, "loss": 0.7884, "learning_rate": 4.990746362792786e-06, "epoch": 1.1783393501805055, "percentage": 58.96, "elapsed_time": "10:31:50", "remaining_time": "7:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1021, "total_steps": 1730, "loss": 0.7999, "learning_rate": 4.989798510618911e-06, "epoch": 1.179494584837545, "percentage": 59.02, "elapsed_time": "10:32:24", "remaining_time": "7:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1022, "total_steps": 1730, "loss": 0.7949, "learning_rate": 4.988804550693086e-06, "epoch": 1.180649819494585, "percentage": 59.08, "elapsed_time": "10:32:58", "remaining_time": "7:18:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1023, "total_steps": 1730, "loss": 0.793, "learning_rate": 4.9877645014239686e-06, "epoch": 1.1818050541516245, "percentage": 59.13, "elapsed_time": "10:33:32", "remaining_time": "7:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1024, "total_steps": 1730, "loss": 0.7915, "learning_rate": 4.9866783820738255e-06, "epoch": 1.1829602888086643, "percentage": 59.19, "elapsed_time": "10:34:07", "remaining_time": "7:17:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1025, "total_steps": 1730, "loss": 0.7678, "learning_rate": 4.985546212758157e-06, "epoch": 1.184115523465704, "percentage": 59.25, "elapsed_time": "10:34:41", "remaining_time": "7:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1026, "total_steps": 1730, "loss": 0.79, "learning_rate": 4.984368014445336e-06, "epoch": 1.1852707581227437, "percentage": 59.31, "elapsed_time": "10:35:16", "remaining_time": "7:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1027, "total_steps": 1730, "loss": 0.7638, "learning_rate": 4.983143808956219e-06, "epoch": 1.1864259927797833, "percentage": 59.36, "elapsed_time": "10:35:50", "remaining_time": "7:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1028, "total_steps": 1730, "loss": 0.7906, "learning_rate": 4.981873618963737e-06, "epoch": 1.1875812274368232, "percentage": 59.42, "elapsed_time": "10:36:24", "remaining_time": "7:14:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1029, "total_steps": 1730, "loss": 0.7743, "learning_rate": 4.980557467992476e-06, "epoch": 1.1887364620938627, "percentage": 59.48, "elapsed_time": "10:36:57", "remaining_time": "7:13:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1030, "total_steps": 1730, "loss": 0.7917, "learning_rate": 4.97919538041825e-06, "epoch": 1.1898916967509026, "percentage": 59.54, "elapsed_time": "10:37:31", "remaining_time": "7:13:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1031, "total_steps": 1730, "loss": 0.774, "learning_rate": 4.977787381467638e-06, "epoch": 1.1910469314079422, "percentage": 59.6, "elapsed_time": "10:38:05", "remaining_time": "7:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1032, "total_steps": 1730, "loss": 0.7989, "learning_rate": 4.976333497217524e-06, "epoch": 1.192202166064982, "percentage": 59.65, "elapsed_time": "10:38:38", "remaining_time": "7:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1033, "total_steps": 1730, "loss": 0.7832, "learning_rate": 4.974833754594611e-06, "epoch": 1.1933574007220216, "percentage": 59.71, "elapsed_time": "10:39:12", "remaining_time": "7:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1034, "total_steps": 1730, "loss": 0.7991, "learning_rate": 4.9732881813749236e-06, "epoch": 1.1945126353790614, "percentage": 59.77, "elapsed_time": "10:39:46", "remaining_time": "7:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1035, "total_steps": 1730, "loss": 0.7917, "learning_rate": 4.9716968061832935e-06, "epoch": 1.1956678700361012, "percentage": 59.83, "elapsed_time": "10:40:19", "remaining_time": "7:09:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1036, "total_steps": 1730, "loss": 0.7765, "learning_rate": 4.9700596584928275e-06, "epoch": 1.1968231046931408, "percentage": 59.88, "elapsed_time": "10:40:53", "remaining_time": "7:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1037, "total_steps": 1730, "loss": 0.7871, "learning_rate": 4.968376768624368e-06, "epoch": 1.1979783393501804, "percentage": 59.94, "elapsed_time": "10:41:27", "remaining_time": "7:08:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1038, "total_steps": 1730, "loss": 0.7858, "learning_rate": 4.96664816774592e-06, "epoch": 1.1991335740072202, "percentage": 60.0, "elapsed_time": "10:42:01", "remaining_time": "7:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1039, "total_steps": 1730, "loss": 0.7938, "learning_rate": 4.964873887872085e-06, "epoch": 1.20028880866426, "percentage": 60.06, "elapsed_time": "10:42:35", "remaining_time": "7:07:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1040, "total_steps": 1730, "loss": 0.7776, "learning_rate": 4.963053961863463e-06, "epoch": 1.2014440433212996, "percentage": 60.12, "elapsed_time": "10:43:09", "remaining_time": "7:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1041, "total_steps": 1730, "loss": 0.7741, "learning_rate": 4.961188423426042e-06, "epoch": 1.2025992779783394, "percentage": 60.17, "elapsed_time": "10:43:43", "remaining_time": "7:06:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1042, "total_steps": 1730, "loss": 0.7667, "learning_rate": 4.959277307110582e-06, "epoch": 1.203754512635379, "percentage": 60.23, "elapsed_time": "10:44:16", "remaining_time": "7:05:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1043, "total_steps": 1730, "loss": 0.7894, "learning_rate": 4.957320648311961e-06, "epoch": 1.2049097472924188, "percentage": 60.29, "elapsed_time": "10:44:50", "remaining_time": "7:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1044, "total_steps": 1730, "loss": 0.7812, "learning_rate": 4.955318483268535e-06, "epoch": 1.2060649819494584, "percentage": 60.35, "elapsed_time": "10:45:24", "remaining_time": "7:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1045, "total_steps": 1730, "loss": 0.7585, "learning_rate": 4.953270849061456e-06, "epoch": 1.2072202166064983, "percentage": 60.4, "elapsed_time": "10:45:57", "remaining_time": "7:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1046, "total_steps": 1730, "loss": 0.8091, "learning_rate": 4.951177783613991e-06, "epoch": 1.2083754512635378, "percentage": 60.46, "elapsed_time": "10:46:31", "remaining_time": "7:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1047, "total_steps": 1730, "loss": 0.7956, "learning_rate": 4.9490393256908144e-06, "epoch": 1.2095306859205777, "percentage": 60.52, "elapsed_time": "10:47:05", "remaining_time": "7:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1048, "total_steps": 1730, "loss": 0.7779, "learning_rate": 4.946855514897297e-06, "epoch": 1.2106859205776173, "percentage": 60.58, "elapsed_time": "10:47:39", "remaining_time": "7:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1049, "total_steps": 1730, "loss": 0.7993, "learning_rate": 4.944626391678766e-06, "epoch": 1.211841155234657, "percentage": 60.64, "elapsed_time": "10:48:13", "remaining_time": "7:00:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 1730, "loss": 0.812, "learning_rate": 4.942351997319761e-06, "epoch": 1.2129963898916967, "percentage": 60.69, "elapsed_time": "10:48:47", "remaining_time": "7:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1051, "total_steps": 1730, "loss": 0.7558, "learning_rate": 4.940032373943262e-06, "epoch": 1.2141516245487365, "percentage": 60.75, "elapsed_time": "10:49:21", "remaining_time": "6:59:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1052, "total_steps": 1730, "loss": 0.7781, "learning_rate": 4.937667564509923e-06, "epoch": 1.215306859205776, "percentage": 60.81, "elapsed_time": "10:49:54", "remaining_time": "6:58:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1053, "total_steps": 1730, "loss": 0.7916, "learning_rate": 4.935257612817259e-06, "epoch": 1.216462093862816, "percentage": 60.87, "elapsed_time": "10:50:29", "remaining_time": "6:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1054, "total_steps": 1730, "loss": 0.7979, "learning_rate": 4.932802563498847e-06, "epoch": 1.2176173285198555, "percentage": 60.92, "elapsed_time": "10:51:02", "remaining_time": "6:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1055, "total_steps": 1730, "loss": 0.7984, "learning_rate": 4.9303024620234966e-06, "epoch": 1.2187725631768953, "percentage": 60.98, "elapsed_time": "10:51:36", "remaining_time": "6:56:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1056, "total_steps": 1730, "loss": 0.7986, "learning_rate": 4.927757354694406e-06, "epoch": 1.2199277978339351, "percentage": 61.04, "elapsed_time": "10:52:10", "remaining_time": "6:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1057, "total_steps": 1730, "loss": 0.7763, "learning_rate": 4.925167288648305e-06, "epoch": 1.2210830324909747, "percentage": 61.1, "elapsed_time": "10:52:44", "remaining_time": "6:55:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1058, "total_steps": 1730, "loss": 0.7967, "learning_rate": 4.922532311854585e-06, "epoch": 1.2222382671480145, "percentage": 61.16, "elapsed_time": "10:53:17", "remaining_time": "6:54:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1059, "total_steps": 1730, "loss": 0.7926, "learning_rate": 4.919852473114405e-06, "epoch": 1.2233935018050541, "percentage": 61.21, "elapsed_time": "10:53:51", "remaining_time": "6:54:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1060, "total_steps": 1730, "loss": 0.783, "learning_rate": 4.917127822059792e-06, "epoch": 1.224548736462094, "percentage": 61.27, "elapsed_time": "10:54:25", "remaining_time": "6:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1061, "total_steps": 1730, "loss": 0.7954, "learning_rate": 4.9143584091527236e-06, "epoch": 1.2257039711191335, "percentage": 61.33, "elapsed_time": "10:54:59", "remaining_time": "6:52:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1062, "total_steps": 1730, "loss": 0.7875, "learning_rate": 4.911544285684186e-06, "epoch": 1.2268592057761734, "percentage": 61.39, "elapsed_time": "10:55:32", "remaining_time": "6:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1063, "total_steps": 1730, "loss": 0.7618, "learning_rate": 4.9086855037732315e-06, "epoch": 1.228014440433213, "percentage": 61.45, "elapsed_time": "10:56:06", "remaining_time": "6:51:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1064, "total_steps": 1730, "loss": 0.7513, "learning_rate": 4.9057821163660085e-06, "epoch": 1.2291696750902528, "percentage": 61.5, "elapsed_time": "10:56:40", "remaining_time": "6:51:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1065, "total_steps": 1730, "loss": 0.7825, "learning_rate": 4.9028341772347845e-06, "epoch": 1.2303249097472924, "percentage": 61.56, "elapsed_time": "10:57:15", "remaining_time": "6:50:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1066, "total_steps": 1730, "loss": 0.7784, "learning_rate": 4.899841740976947e-06, "epoch": 1.2314801444043322, "percentage": 61.62, "elapsed_time": "10:57:48", "remaining_time": "6:49:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1067, "total_steps": 1730, "loss": 0.8057, "learning_rate": 4.8968048630139945e-06, "epoch": 1.2326353790613718, "percentage": 61.68, "elapsed_time": "10:58:22", "remaining_time": "6:49:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1068, "total_steps": 1730, "loss": 0.778, "learning_rate": 4.89372359959051e-06, "epoch": 1.2337906137184116, "percentage": 61.73, "elapsed_time": "10:58:56", "remaining_time": "6:48:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1069, "total_steps": 1730, "loss": 0.7719, "learning_rate": 4.890598007773116e-06, "epoch": 1.2349458483754512, "percentage": 61.79, "elapsed_time": "10:59:30", "remaining_time": "6:47:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1070, "total_steps": 1730, "loss": 0.7898, "learning_rate": 4.887428145449425e-06, "epoch": 1.236101083032491, "percentage": 61.85, "elapsed_time": "11:00:05", "remaining_time": "6:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1071, "total_steps": 1730, "loss": 0.7586, "learning_rate": 4.884214071326957e-06, "epoch": 1.2372563176895306, "percentage": 61.91, "elapsed_time": "11:00:38", "remaining_time": "6:46:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1072, "total_steps": 1730, "loss": 0.7779, "learning_rate": 4.880955844932061e-06, "epoch": 1.2384115523465704, "percentage": 61.97, "elapsed_time": "11:01:12", "remaining_time": "6:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1073, "total_steps": 1730, "loss": 0.7774, "learning_rate": 4.877653526608811e-06, "epoch": 1.2395667870036102, "percentage": 62.02, "elapsed_time": "11:01:45", "remaining_time": "6:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1074, "total_steps": 1730, "loss": 0.7714, "learning_rate": 4.874307177517882e-06, "epoch": 1.2407220216606498, "percentage": 62.08, "elapsed_time": "11:02:19", "remaining_time": "6:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1075, "total_steps": 1730, "loss": 0.7951, "learning_rate": 4.870916859635426e-06, "epoch": 1.2418772563176894, "percentage": 62.14, "elapsed_time": "11:02:53", "remaining_time": "6:43:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1076, "total_steps": 1730, "loss": 0.8094, "learning_rate": 4.86748263575192e-06, "epoch": 1.2430324909747292, "percentage": 62.2, "elapsed_time": "11:03:27", "remaining_time": "6:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1077, "total_steps": 1730, "loss": 0.7828, "learning_rate": 4.864004569471e-06, "epoch": 1.244187725631769, "percentage": 62.25, "elapsed_time": "11:04:01", "remaining_time": "6:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1078, "total_steps": 1730, "loss": 0.8106, "learning_rate": 4.860482725208291e-06, "epoch": 1.2453429602888086, "percentage": 62.31, "elapsed_time": "11:04:34", "remaining_time": "6:41:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1079, "total_steps": 1730, "loss": 0.7893, "learning_rate": 4.856917168190205e-06, "epoch": 1.2464981949458485, "percentage": 62.37, "elapsed_time": "11:05:08", "remaining_time": "6:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1080, "total_steps": 1730, "loss": 0.749, "learning_rate": 4.853307964452739e-06, "epoch": 1.247653429602888, "percentage": 62.43, "elapsed_time": "11:05:41", "remaining_time": "6:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1081, "total_steps": 1730, "loss": 0.8041, "learning_rate": 4.849655180840253e-06, "epoch": 1.2488086642599279, "percentage": 62.49, "elapsed_time": "11:06:15", "remaining_time": "6:40:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1082, "total_steps": 1730, "loss": 0.7455, "learning_rate": 4.8459588850042255e-06, "epoch": 1.2499638989169675, "percentage": 62.54, "elapsed_time": "11:06:49", "remaining_time": "6:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1083, "total_steps": 1730, "loss": 0.7995, "learning_rate": 4.8422191454020055e-06, "epoch": 1.2511191335740073, "percentage": 62.6, "elapsed_time": "11:07:23", "remaining_time": "6:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1084, "total_steps": 1730, "loss": 0.7776, "learning_rate": 4.838436031295543e-06, "epoch": 1.2522743682310469, "percentage": 62.66, "elapsed_time": "11:07:57", "remaining_time": "6:38:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1085, "total_steps": 1730, "loss": 0.7755, "learning_rate": 4.834609612750108e-06, "epoch": 1.2534296028880867, "percentage": 62.72, "elapsed_time": "11:08:31", "remaining_time": "6:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1086, "total_steps": 1730, "loss": 0.7815, "learning_rate": 4.8307399606329906e-06, "epoch": 1.2545848375451263, "percentage": 62.77, "elapsed_time": "11:09:05", "remaining_time": "6:36:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1087, "total_steps": 1730, "loss": 0.7618, "learning_rate": 4.82682714661219e-06, "epoch": 1.255740072202166, "percentage": 62.83, "elapsed_time": "11:09:39", "remaining_time": "6:36:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1088, "total_steps": 1730, "loss": 0.7906, "learning_rate": 4.822871243155085e-06, "epoch": 1.2568953068592057, "percentage": 62.89, "elapsed_time": "11:10:13", "remaining_time": "6:35:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1089, "total_steps": 1730, "loss": 0.7871, "learning_rate": 4.818872323527097e-06, "epoch": 1.2580505415162455, "percentage": 62.95, "elapsed_time": "11:10:47", "remaining_time": "6:34:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1090, "total_steps": 1730, "loss": 0.763, "learning_rate": 4.814830461790327e-06, "epoch": 1.2592057761732853, "percentage": 63.01, "elapsed_time": "11:11:20", "remaining_time": "6:34:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1091, "total_steps": 1730, "loss": 0.7744, "learning_rate": 4.810745732802186e-06, "epoch": 1.260361010830325, "percentage": 63.06, "elapsed_time": "11:11:54", "remaining_time": "6:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1092, "total_steps": 1730, "loss": 0.7901, "learning_rate": 4.806618212214009e-06, "epoch": 1.2615162454873645, "percentage": 63.12, "elapsed_time": "11:12:29", "remaining_time": "6:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1093, "total_steps": 1730, "loss": 0.797, "learning_rate": 4.802447976469658e-06, "epoch": 1.2626714801444043, "percentage": 63.18, "elapsed_time": "11:13:03", "remaining_time": "6:32:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1094, "total_steps": 1730, "loss": 0.7956, "learning_rate": 4.7982351028040966e-06, "epoch": 1.2638267148014442, "percentage": 63.24, "elapsed_time": "11:13:37", "remaining_time": "6:31:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1095, "total_steps": 1730, "loss": 0.7785, "learning_rate": 4.79397966924197e-06, "epoch": 1.2649819494584837, "percentage": 63.29, "elapsed_time": "11:14:11", "remaining_time": "6:30:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1096, "total_steps": 1730, "loss": 0.7882, "learning_rate": 4.789681754596152e-06, "epoch": 1.2661371841155233, "percentage": 63.35, "elapsed_time": "11:14:45", "remaining_time": "6:30:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1097, "total_steps": 1730, "loss": 0.7716, "learning_rate": 4.785341438466289e-06, "epoch": 1.2672924187725632, "percentage": 63.41, "elapsed_time": "11:15:18", "remaining_time": "6:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1098, "total_steps": 1730, "loss": 0.7702, "learning_rate": 4.7809588012373255e-06, "epoch": 1.268447653429603, "percentage": 63.47, "elapsed_time": "11:15:52", "remaining_time": "6:29:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1099, "total_steps": 1730, "loss": 0.7734, "learning_rate": 4.776533924078018e-06, "epoch": 1.2696028880866426, "percentage": 63.53, "elapsed_time": "11:16:26", "remaining_time": "6:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1100, "total_steps": 1730, "loss": 0.7894, "learning_rate": 4.772066888939423e-06, "epoch": 1.2707581227436824, "percentage": 63.58, "elapsed_time": "11:17:00", "remaining_time": "6:27:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1101, "total_steps": 1730, "loss": 0.7658, "learning_rate": 4.767557778553389e-06, "epoch": 1.271913357400722, "percentage": 63.64, "elapsed_time": "11:17:34", "remaining_time": "6:27:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1102, "total_steps": 1730, "loss": 0.775, "learning_rate": 4.763006676431021e-06, "epoch": 1.2730685920577618, "percentage": 63.7, "elapsed_time": "11:18:09", "remaining_time": "6:26:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1103, "total_steps": 1730, "loss": 0.7823, "learning_rate": 4.75841366686113e-06, "epoch": 1.2742238267148014, "percentage": 63.76, "elapsed_time": "11:18:42", "remaining_time": "6:25:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1104, "total_steps": 1730, "loss": 0.7607, "learning_rate": 4.753778834908678e-06, "epoch": 1.2753790613718412, "percentage": 63.82, "elapsed_time": "11:19:16", "remaining_time": "6:25:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1105, "total_steps": 1730, "loss": 0.7739, "learning_rate": 4.749102266413195e-06, "epoch": 1.2765342960288808, "percentage": 63.87, "elapsed_time": "11:19:50", "remaining_time": "6:24:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1106, "total_steps": 1730, "loss": 0.7914, "learning_rate": 4.744384047987202e-06, "epoch": 1.2776895306859206, "percentage": 63.93, "elapsed_time": "11:20:23", "remaining_time": "6:23:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1107, "total_steps": 1730, "loss": 0.754, "learning_rate": 4.739624267014589e-06, "epoch": 1.2788447653429602, "percentage": 63.99, "elapsed_time": "11:20:57", "remaining_time": "6:23:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1108, "total_steps": 1730, "loss": 0.7964, "learning_rate": 4.734823011649013e-06, "epoch": 1.28, "percentage": 64.05, "elapsed_time": "11:21:31", "remaining_time": "6:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1109, "total_steps": 1730, "loss": 0.7831, "learning_rate": 4.7299803708122565e-06, "epoch": 1.2811552346570396, "percentage": 64.1, "elapsed_time": "11:22:05", "remaining_time": "6:21:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1110, "total_steps": 1730, "loss": 0.7651, "learning_rate": 4.725096434192583e-06, "epoch": 1.2823104693140794, "percentage": 64.16, "elapsed_time": "11:22:39", "remaining_time": "6:21:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1111, "total_steps": 1730, "loss": 0.7776, "learning_rate": 4.720171292243076e-06, "epoch": 1.2834657039711193, "percentage": 64.22, "elapsed_time": "11:23:13", "remaining_time": "6:20:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1112, "total_steps": 1730, "loss": 0.7804, "learning_rate": 4.7152050361799626e-06, "epoch": 1.2846209386281588, "percentage": 64.28, "elapsed_time": "11:23:46", "remaining_time": "6:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1113, "total_steps": 1730, "loss": 0.798, "learning_rate": 4.710197757980923e-06, "epoch": 1.2857761732851984, "percentage": 64.34, "elapsed_time": "11:24:20", "remaining_time": "6:19:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1114, "total_steps": 1730, "loss": 0.7717, "learning_rate": 4.7051495503833955e-06, "epoch": 1.2869314079422383, "percentage": 64.39, "elapsed_time": "11:24:54", "remaining_time": "6:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1115, "total_steps": 1730, "loss": 0.7494, "learning_rate": 4.700060506882846e-06, "epoch": 1.288086642599278, "percentage": 64.45, "elapsed_time": "11:25:28", "remaining_time": "6:18:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1116, "total_steps": 1730, "loss": 0.7955, "learning_rate": 4.694930721731046e-06, "epoch": 1.2892418772563177, "percentage": 64.51, "elapsed_time": "11:26:02", "remaining_time": "6:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1117, "total_steps": 1730, "loss": 0.7752, "learning_rate": 4.689760289934322e-06, "epoch": 1.2903971119133573, "percentage": 64.57, "elapsed_time": "11:26:36", "remaining_time": "6:16:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1118, "total_steps": 1730, "loss": 0.7631, "learning_rate": 4.684549307251799e-06, "epoch": 1.291552346570397, "percentage": 64.62, "elapsed_time": "11:27:11", "remaining_time": "6:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1119, "total_steps": 1730, "loss": 0.7844, "learning_rate": 4.679297870193628e-06, "epoch": 1.292707581227437, "percentage": 64.68, "elapsed_time": "11:27:44", "remaining_time": "6:15:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1120, "total_steps": 1730, "loss": 0.74, "learning_rate": 4.6740060760191905e-06, "epoch": 1.2938628158844765, "percentage": 64.74, "elapsed_time": "11:28:19", "remaining_time": "6:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1121, "total_steps": 1730, "loss": 0.7923, "learning_rate": 4.668674022735311e-06, "epoch": 1.2950180505415163, "percentage": 64.8, "elapsed_time": "11:28:53", "remaining_time": "6:14:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1122, "total_steps": 1730, "loss": 0.7899, "learning_rate": 4.663301809094425e-06, "epoch": 1.296173285198556, "percentage": 64.86, "elapsed_time": "11:29:27", "remaining_time": "6:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1123, "total_steps": 1730, "loss": 0.7831, "learning_rate": 4.657889534592767e-06, "epoch": 1.2973285198555957, "percentage": 64.91, "elapsed_time": "11:30:00", "remaining_time": "6:12:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1124, "total_steps": 1730, "loss": 0.7728, "learning_rate": 4.652437299468514e-06, "epoch": 1.2984837545126353, "percentage": 64.97, "elapsed_time": "11:30:35", "remaining_time": "6:12:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1125, "total_steps": 1730, "loss": 0.7736, "learning_rate": 4.646945204699939e-06, "epoch": 1.2996389891696751, "percentage": 65.03, "elapsed_time": "11:31:08", "remaining_time": "6:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1126, "total_steps": 1730, "loss": 0.7738, "learning_rate": 4.641413352003534e-06, "epoch": 1.3007942238267147, "percentage": 65.09, "elapsed_time": "11:31:42", "remaining_time": "6:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1127, "total_steps": 1730, "loss": 0.7766, "learning_rate": 4.63584184383213e-06, "epoch": 1.3019494584837545, "percentage": 65.14, "elapsed_time": "11:32:17", "remaining_time": "6:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1128, "total_steps": 1730, "loss": 0.7939, "learning_rate": 4.630230783372998e-06, "epoch": 1.3031046931407944, "percentage": 65.2, "elapsed_time": "11:32:50", "remaining_time": "6:09:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1129, "total_steps": 1730, "loss": 0.7701, "learning_rate": 4.624580274545938e-06, "epoch": 1.304259927797834, "percentage": 65.26, "elapsed_time": "11:33:24", "remaining_time": "6:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1130, "total_steps": 1730, "loss": 0.7979, "learning_rate": 4.618890422001355e-06, "epoch": 1.3054151624548735, "percentage": 65.32, "elapsed_time": "11:33:58", "remaining_time": "6:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1131, "total_steps": 1730, "loss": 0.7473, "learning_rate": 4.61316133111832e-06, "epoch": 1.3065703971119134, "percentage": 65.38, "elapsed_time": "11:34:32", "remaining_time": "6:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1132, "total_steps": 1730, "loss": 0.7663, "learning_rate": 4.607393108002618e-06, "epoch": 1.3077256317689532, "percentage": 65.43, "elapsed_time": "11:35:06", "remaining_time": "6:07:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1133, "total_steps": 1730, "loss": 0.7811, "learning_rate": 4.601585859484786e-06, "epoch": 1.3088808664259928, "percentage": 65.49, "elapsed_time": "11:35:39", "remaining_time": "6:06:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1134, "total_steps": 1730, "loss": 0.7836, "learning_rate": 4.595739693118132e-06, "epoch": 1.3100361010830324, "percentage": 65.55, "elapsed_time": "11:36:13", "remaining_time": "6:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1135, "total_steps": 1730, "loss": 0.7708, "learning_rate": 4.5898547171767375e-06, "epoch": 1.3111913357400722, "percentage": 65.61, "elapsed_time": "11:36:47", "remaining_time": "6:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1136, "total_steps": 1730, "loss": 0.772, "learning_rate": 4.583931040653466e-06, "epoch": 1.312346570397112, "percentage": 65.66, "elapsed_time": "11:37:21", "remaining_time": "6:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1137, "total_steps": 1730, "loss": 0.783, "learning_rate": 4.5779687732579285e-06, "epoch": 1.3135018050541516, "percentage": 65.72, "elapsed_time": "11:37:55", "remaining_time": "6:03:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1138, "total_steps": 1730, "loss": 0.7736, "learning_rate": 4.571968025414466e-06, "epoch": 1.3146570397111914, "percentage": 65.78, "elapsed_time": "11:38:28", "remaining_time": "6:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1139, "total_steps": 1730, "loss": 0.7823, "learning_rate": 4.565928908260093e-06, "epoch": 1.315812274368231, "percentage": 65.84, "elapsed_time": "11:39:02", "remaining_time": "6:02:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1140, "total_steps": 1730, "loss": 0.7966, "learning_rate": 4.559851533642446e-06, "epoch": 1.3169675090252708, "percentage": 65.9, "elapsed_time": "11:39:36", "remaining_time": "6:02:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1141, "total_steps": 1730, "loss": 0.8043, "learning_rate": 4.55373601411771e-06, "epoch": 1.3181227436823104, "percentage": 65.95, "elapsed_time": "11:40:10", "remaining_time": "6:01:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1142, "total_steps": 1730, "loss": 0.7903, "learning_rate": 4.547582462948533e-06, "epoch": 1.3192779783393502, "percentage": 66.01, "elapsed_time": "11:40:44", "remaining_time": "6:00:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1143, "total_steps": 1730, "loss": 0.7834, "learning_rate": 4.541390994101928e-06, "epoch": 1.3204332129963898, "percentage": 66.07, "elapsed_time": "11:41:18", "remaining_time": "6:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1144, "total_steps": 1730, "loss": 0.7774, "learning_rate": 4.535161722247168e-06, "epoch": 1.3215884476534296, "percentage": 66.13, "elapsed_time": "11:41:51", "remaining_time": "5:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1145, "total_steps": 1730, "loss": 0.7909, "learning_rate": 4.528894762753651e-06, "epoch": 1.3227436823104692, "percentage": 66.18, "elapsed_time": "11:42:25", "remaining_time": "5:58:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1146, "total_steps": 1730, "loss": 0.7885, "learning_rate": 4.522590231688775e-06, "epoch": 1.323898916967509, "percentage": 66.24, "elapsed_time": "11:43:00", "remaining_time": "5:58:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1147, "total_steps": 1730, "loss": 0.7924, "learning_rate": 4.516248245815782e-06, "epoch": 1.3250541516245486, "percentage": 66.3, "elapsed_time": "11:43:34", "remaining_time": "5:57:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1148, "total_steps": 1730, "loss": 0.7845, "learning_rate": 4.509868922591595e-06, "epoch": 1.3262093862815885, "percentage": 66.36, "elapsed_time": "11:44:07", "remaining_time": "5:56:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1149, "total_steps": 1730, "loss": 0.7983, "learning_rate": 4.503452380164648e-06, "epoch": 1.3273646209386283, "percentage": 66.42, "elapsed_time": "11:44:41", "remaining_time": "5:56:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1150, "total_steps": 1730, "loss": 0.7561, "learning_rate": 4.496998737372691e-06, "epoch": 1.3285198555956679, "percentage": 66.47, "elapsed_time": "11:45:15", "remaining_time": "5:55:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1151, "total_steps": 1730, "loss": 0.7753, "learning_rate": 4.490508113740594e-06, "epoch": 1.3296750902527075, "percentage": 66.53, "elapsed_time": "11:45:49", "remaining_time": "5:55:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1152, "total_steps": 1730, "loss": 0.769, "learning_rate": 4.483980629478131e-06, "epoch": 1.3308303249097473, "percentage": 66.59, "elapsed_time": "11:46:23", "remaining_time": "5:54:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1153, "total_steps": 1730, "loss": 0.7879, "learning_rate": 4.477416405477754e-06, "epoch": 1.331985559566787, "percentage": 66.65, "elapsed_time": "11:46:58", "remaining_time": "5:53:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1154, "total_steps": 1730, "loss": 0.7795, "learning_rate": 4.470815563312356e-06, "epoch": 1.3331407942238267, "percentage": 66.71, "elapsed_time": "11:47:32", "remaining_time": "5:53:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1155, "total_steps": 1730, "loss": 0.7577, "learning_rate": 4.464178225233016e-06, "epoch": 1.3342960288808663, "percentage": 66.76, "elapsed_time": "11:48:06", "remaining_time": "5:52:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1156, "total_steps": 1730, "loss": 0.7617, "learning_rate": 4.457504514166738e-06, "epoch": 1.335451263537906, "percentage": 66.82, "elapsed_time": "11:48:39", "remaining_time": "5:51:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1157, "total_steps": 1730, "loss": 0.7924, "learning_rate": 4.4507945537141714e-06, "epoch": 1.336606498194946, "percentage": 66.88, "elapsed_time": "11:49:14", "remaining_time": "5:51:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1158, "total_steps": 1730, "loss": 0.7756, "learning_rate": 4.444048468147324e-06, "epoch": 1.3377617328519855, "percentage": 66.94, "elapsed_time": "11:49:47", "remaining_time": "5:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1159, "total_steps": 1730, "loss": 0.785, "learning_rate": 4.4372663824072595e-06, "epoch": 1.3389169675090253, "percentage": 66.99, "elapsed_time": "11:50:21", "remaining_time": "5:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1160, "total_steps": 1730, "loss": 0.7914, "learning_rate": 4.430448422101786e-06, "epoch": 1.340072202166065, "percentage": 67.05, "elapsed_time": "11:50:56", "remaining_time": "5:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1161, "total_steps": 1730, "loss": 0.7948, "learning_rate": 4.423594713503124e-06, "epoch": 1.3412274368231047, "percentage": 67.11, "elapsed_time": "11:51:30", "remaining_time": "5:48:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1162, "total_steps": 1730, "loss": 0.7571, "learning_rate": 4.416705383545574e-06, "epoch": 1.3423826714801443, "percentage": 67.17, "elapsed_time": "11:52:04", "remaining_time": "5:48:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1163, "total_steps": 1730, "loss": 0.7544, "learning_rate": 4.409780559823159e-06, "epoch": 1.3435379061371842, "percentage": 67.23, "elapsed_time": "11:52:38", "remaining_time": "5:47:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1164, "total_steps": 1730, "loss": 0.7928, "learning_rate": 4.402820370587272e-06, "epoch": 1.3446931407942238, "percentage": 67.28, "elapsed_time": "11:53:12", "remaining_time": "5:46:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1165, "total_steps": 1730, "loss": 0.7821, "learning_rate": 4.395824944744287e-06, "epoch": 1.3458483754512636, "percentage": 67.34, "elapsed_time": "11:53:46", "remaining_time": "5:46:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1166, "total_steps": 1730, "loss": 0.7563, "learning_rate": 4.388794411853183e-06, "epoch": 1.3470036101083034, "percentage": 67.4, "elapsed_time": "11:54:20", "remaining_time": "5:45:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1167, "total_steps": 1730, "loss": 0.7675, "learning_rate": 4.381728902123138e-06, "epoch": 1.348158844765343, "percentage": 67.46, "elapsed_time": "11:54:54", "remaining_time": "5:44:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1168, "total_steps": 1730, "loss": 0.7839, "learning_rate": 4.374628546411121e-06, "epoch": 1.3493140794223826, "percentage": 67.51, "elapsed_time": "11:55:28", "remaining_time": "5:44:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1169, "total_steps": 1730, "loss": 0.7764, "learning_rate": 4.367493476219464e-06, "epoch": 1.3504693140794224, "percentage": 67.57, "elapsed_time": "11:56:02", "remaining_time": "5:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1170, "total_steps": 1730, "loss": 0.7873, "learning_rate": 4.360323823693434e-06, "epoch": 1.3516245487364622, "percentage": 67.63, "elapsed_time": "11:56:35", "remaining_time": "5:42:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1171, "total_steps": 1730, "loss": 0.7719, "learning_rate": 4.353119721618778e-06, "epoch": 1.3527797833935018, "percentage": 67.69, "elapsed_time": "11:57:09", "remaining_time": "5:42:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1172, "total_steps": 1730, "loss": 0.8023, "learning_rate": 4.345881303419266e-06, "epoch": 1.3539350180505414, "percentage": 67.75, "elapsed_time": "11:57:43", "remaining_time": "5:41:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1173, "total_steps": 1730, "loss": 0.7612, "learning_rate": 4.338608703154224e-06, "epoch": 1.3550902527075812, "percentage": 67.8, "elapsed_time": "11:58:17", "remaining_time": "5:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1174, "total_steps": 1730, "loss": 0.7735, "learning_rate": 4.3313020555160445e-06, "epoch": 1.356245487364621, "percentage": 67.86, "elapsed_time": "11:58:51", "remaining_time": "5:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1175, "total_steps": 1730, "loss": 0.7942, "learning_rate": 4.323961495827698e-06, "epoch": 1.3574007220216606, "percentage": 67.92, "elapsed_time": "11:59:25", "remaining_time": "5:39:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1176, "total_steps": 1730, "loss": 0.7675, "learning_rate": 4.316587160040222e-06, "epoch": 1.3585559566787004, "percentage": 67.98, "elapsed_time": "11:59:59", "remaining_time": "5:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1177, "total_steps": 1730, "loss": 0.7586, "learning_rate": 4.309179184730207e-06, "epoch": 1.35971119133574, "percentage": 68.03, "elapsed_time": "12:00:33", "remaining_time": "5:38:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1178, "total_steps": 1730, "loss": 0.7792, "learning_rate": 4.301737707097264e-06, "epoch": 1.3608664259927798, "percentage": 68.09, "elapsed_time": "12:01:07", "remaining_time": "5:37:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1179, "total_steps": 1730, "loss": 0.77, "learning_rate": 4.294262864961486e-06, "epoch": 1.3620216606498194, "percentage": 68.15, "elapsed_time": "12:01:41", "remaining_time": "5:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1180, "total_steps": 1730, "loss": 0.7898, "learning_rate": 4.286754796760892e-06, "epoch": 1.3631768953068593, "percentage": 68.21, "elapsed_time": "12:02:15", "remaining_time": "5:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1181, "total_steps": 1730, "loss": 0.7644, "learning_rate": 4.279213641548867e-06, "epoch": 1.3643321299638989, "percentage": 68.27, "elapsed_time": "12:02:49", "remaining_time": "5:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1182, "total_steps": 1730, "loss": 0.7484, "learning_rate": 4.271639538991584e-06, "epoch": 1.3654873646209387, "percentage": 68.32, "elapsed_time": "12:03:23", "remaining_time": "5:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1183, "total_steps": 1730, "loss": 0.8274, "learning_rate": 4.264032629365418e-06, "epoch": 1.3666425992779783, "percentage": 68.38, "elapsed_time": "12:03:57", "remaining_time": "5:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1184, "total_steps": 1730, "loss": 0.7438, "learning_rate": 4.256393053554351e-06, "epoch": 1.367797833935018, "percentage": 68.44, "elapsed_time": "12:04:31", "remaining_time": "5:34:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1185, "total_steps": 1730, "loss": 0.764, "learning_rate": 4.248720953047355e-06, "epoch": 1.3689530685920577, "percentage": 68.5, "elapsed_time": "12:05:04", "remaining_time": "5:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1186, "total_steps": 1730, "loss": 0.764, "learning_rate": 4.241016469935782e-06, "epoch": 1.3701083032490975, "percentage": 68.55, "elapsed_time": "12:05:38", "remaining_time": "5:32:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1187, "total_steps": 1730, "loss": 0.7729, "learning_rate": 4.233279746910722e-06, "epoch": 1.3712635379061373, "percentage": 68.61, "elapsed_time": "12:06:12", "remaining_time": "5:32:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1188, "total_steps": 1730, "loss": 0.7901, "learning_rate": 4.225510927260369e-06, "epoch": 1.372418772563177, "percentage": 68.67, "elapsed_time": "12:06:46", "remaining_time": "5:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1189, "total_steps": 1730, "loss": 0.8064, "learning_rate": 4.217710154867362e-06, "epoch": 1.3735740072202165, "percentage": 68.73, "elapsed_time": "12:07:20", "remaining_time": "5:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1190, "total_steps": 1730, "loss": 0.7248, "learning_rate": 4.209877574206121e-06, "epoch": 1.3747292418772563, "percentage": 68.79, "elapsed_time": "12:07:54", "remaining_time": "5:30:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1191, "total_steps": 1730, "loss": 0.8044, "learning_rate": 4.2020133303401714e-06, "epoch": 1.3758844765342961, "percentage": 68.84, "elapsed_time": "12:08:27", "remaining_time": "5:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1192, "total_steps": 1730, "loss": 0.771, "learning_rate": 4.1941175689194615e-06, "epoch": 1.3770397111913357, "percentage": 68.9, "elapsed_time": "12:09:01", "remaining_time": "5:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1193, "total_steps": 1730, "loss": 0.7926, "learning_rate": 4.186190436177655e-06, "epoch": 1.3781949458483753, "percentage": 68.96, "elapsed_time": "12:09:35", "remaining_time": "5:28:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1194, "total_steps": 1730, "loss": 0.7658, "learning_rate": 4.178232078929437e-06, "epoch": 1.3793501805054151, "percentage": 69.02, "elapsed_time": "12:10:09", "remaining_time": "5:27:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1195, "total_steps": 1730, "loss": 0.7598, "learning_rate": 4.170242644567781e-06, "epoch": 1.380505415162455, "percentage": 69.08, "elapsed_time": "12:10:43", "remaining_time": "5:27:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1196, "total_steps": 1730, "loss": 0.8047, "learning_rate": 4.162222281061226e-06, "epoch": 1.3816606498194945, "percentage": 69.13, "elapsed_time": "12:11:17", "remaining_time": "5:26:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1197, "total_steps": 1730, "loss": 0.7707, "learning_rate": 4.154171136951136e-06, "epoch": 1.3828158844765344, "percentage": 69.19, "elapsed_time": "12:11:50", "remaining_time": "5:25:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1198, "total_steps": 1730, "loss": 0.7659, "learning_rate": 4.146089361348948e-06, "epoch": 1.383971119133574, "percentage": 69.25, "elapsed_time": "12:12:24", "remaining_time": "5:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1199, "total_steps": 1730, "loss": 0.7898, "learning_rate": 4.137977103933411e-06, "epoch": 1.3851263537906138, "percentage": 69.31, "elapsed_time": "12:12:58", "remaining_time": "5:24:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1200, "total_steps": 1730, "loss": 0.8019, "learning_rate": 4.1298345149478115e-06, "epoch": 1.3862815884476534, "percentage": 69.36, "elapsed_time": "12:13:32", "remaining_time": "5:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1201, "total_steps": 1730, "loss": 0.7749, "learning_rate": 4.121661745197195e-06, "epoch": 1.3874368231046932, "percentage": 69.42, "elapsed_time": "12:14:06", "remaining_time": "5:23:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1202, "total_steps": 1730, "loss": 0.7807, "learning_rate": 4.113458946045569e-06, "epoch": 1.3885920577617328, "percentage": 69.48, "elapsed_time": "12:14:41", "remaining_time": "5:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1203, "total_steps": 1730, "loss": 0.8127, "learning_rate": 4.1052262694131e-06, "epoch": 1.3897472924187726, "percentage": 69.54, "elapsed_time": "12:15:15", "remaining_time": "5:22:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1204, "total_steps": 1730, "loss": 0.7887, "learning_rate": 4.096963867773306e-06, "epoch": 1.3909025270758124, "percentage": 69.6, "elapsed_time": "12:15:48", "remaining_time": "5:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1205, "total_steps": 1730, "loss": 0.7705, "learning_rate": 4.0886718941502215e-06, "epoch": 1.392057761732852, "percentage": 69.65, "elapsed_time": "12:16:21", "remaining_time": "5:20:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1206, "total_steps": 1730, "loss": 0.7655, "learning_rate": 4.080350502115575e-06, "epoch": 1.3932129963898916, "percentage": 69.71, "elapsed_time": "12:16:55", "remaining_time": "5:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1207, "total_steps": 1730, "loss": 0.7839, "learning_rate": 4.071999845785938e-06, "epoch": 1.3943682310469314, "percentage": 69.77, "elapsed_time": "12:17:29", "remaining_time": "5:19:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1208, "total_steps": 1730, "loss": 0.7676, "learning_rate": 4.06362007981987e-06, "epoch": 1.3955234657039712, "percentage": 69.83, "elapsed_time": "12:18:03", "remaining_time": "5:18:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1209, "total_steps": 1730, "loss": 0.7685, "learning_rate": 4.055211359415058e-06, "epoch": 1.3966787003610108, "percentage": 69.88, "elapsed_time": "12:18:36", "remaining_time": "5:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1210, "total_steps": 1730, "loss": 0.7716, "learning_rate": 4.0467738403054425e-06, "epoch": 1.3978339350180504, "percentage": 69.94, "elapsed_time": "12:19:10", "remaining_time": "5:17:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1211, "total_steps": 1730, "loss": 0.8029, "learning_rate": 4.038307678758328e-06, "epoch": 1.3989891696750902, "percentage": 70.0, "elapsed_time": "12:19:44", "remaining_time": "5:17:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1212, "total_steps": 1730, "loss": 0.766, "learning_rate": 4.0298130315714934e-06, "epoch": 1.40014440433213, "percentage": 70.06, "elapsed_time": "12:20:18", "remaining_time": "5:16:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1213, "total_steps": 1730, "loss": 0.7724, "learning_rate": 4.021290056070287e-06, "epoch": 1.4012996389891696, "percentage": 70.12, "elapsed_time": "12:20:52", "remaining_time": "5:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1214, "total_steps": 1730, "loss": 0.7987, "learning_rate": 4.012738910104711e-06, "epoch": 1.4024548736462095, "percentage": 70.17, "elapsed_time": "12:21:26", "remaining_time": "5:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1215, "total_steps": 1730, "loss": 0.7516, "learning_rate": 4.004159752046501e-06, "epoch": 1.403610108303249, "percentage": 70.23, "elapsed_time": "12:21:59", "remaining_time": "5:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1216, "total_steps": 1730, "loss": 0.7778, "learning_rate": 3.99555274078619e-06, "epoch": 1.4047653429602889, "percentage": 70.29, "elapsed_time": "12:22:33", "remaining_time": "5:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1217, "total_steps": 1730, "loss": 0.7689, "learning_rate": 3.986918035730169e-06, "epoch": 1.4059205776173285, "percentage": 70.35, "elapsed_time": "12:23:07", "remaining_time": "5:13:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1218, "total_steps": 1730, "loss": 0.7976, "learning_rate": 3.9782557967977295e-06, "epoch": 1.4070758122743683, "percentage": 70.4, "elapsed_time": "12:23:41", "remaining_time": "5:12:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1219, "total_steps": 1730, "loss": 0.7775, "learning_rate": 3.969566184418109e-06, "epoch": 1.4082310469314079, "percentage": 70.46, "elapsed_time": "12:24:15", "remaining_time": "5:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1220, "total_steps": 1730, "loss": 0.7639, "learning_rate": 3.960849359527515e-06, "epoch": 1.4093862815884477, "percentage": 70.52, "elapsed_time": "12:24:49", "remaining_time": "5:11:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1221, "total_steps": 1730, "loss": 0.7583, "learning_rate": 3.952105483566139e-06, "epoch": 1.4105415162454873, "percentage": 70.58, "elapsed_time": "12:25:22", "remaining_time": "5:10:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1222, "total_steps": 1730, "loss": 0.7936, "learning_rate": 3.94333471847518e-06, "epoch": 1.411696750902527, "percentage": 70.64, "elapsed_time": "12:25:57", "remaining_time": "5:10:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1223, "total_steps": 1730, "loss": 0.761, "learning_rate": 3.934537226693836e-06, "epoch": 1.4128519855595667, "percentage": 70.69, "elapsed_time": "12:26:30", "remaining_time": "5:09:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1224, "total_steps": 1730, "loss": 0.7952, "learning_rate": 3.925713171156295e-06, "epoch": 1.4140072202166065, "percentage": 70.75, "elapsed_time": "12:27:04", "remaining_time": "5:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1225, "total_steps": 1730, "loss": 0.7623, "learning_rate": 3.9168627152887214e-06, "epoch": 1.4151624548736463, "percentage": 70.81, "elapsed_time": "12:27:38", "remaining_time": "5:08:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1226, "total_steps": 1730, "loss": 0.7451, "learning_rate": 3.9079860230062286e-06, "epoch": 1.416317689530686, "percentage": 70.87, "elapsed_time": "12:28:12", "remaining_time": "5:07:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1227, "total_steps": 1730, "loss": 0.7825, "learning_rate": 3.8990832587098396e-06, "epoch": 1.4174729241877255, "percentage": 70.92, "elapsed_time": "12:28:46", "remaining_time": "5:06:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1228, "total_steps": 1730, "loss": 0.7788, "learning_rate": 3.890154587283447e-06, "epoch": 1.4186281588447653, "percentage": 70.98, "elapsed_time": "12:29:20", "remaining_time": "5:06:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1229, "total_steps": 1730, "loss": 0.7752, "learning_rate": 3.881200174090758e-06, "epoch": 1.4197833935018052, "percentage": 71.04, "elapsed_time": "12:29:55", "remaining_time": "5:05:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1230, "total_steps": 1730, "loss": 0.7834, "learning_rate": 3.8722201849722264e-06, "epoch": 1.4209386281588448, "percentage": 71.1, "elapsed_time": "12:30:28", "remaining_time": "5:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1231, "total_steps": 1730, "loss": 0.7633, "learning_rate": 3.863214786241993e-06, "epoch": 1.4220938628158843, "percentage": 71.16, "elapsed_time": "12:31:01", "remaining_time": "5:04:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1232, "total_steps": 1730, "loss": 0.7901, "learning_rate": 3.85418414468479e-06, "epoch": 1.4232490974729242, "percentage": 71.21, "elapsed_time": "12:31:36", "remaining_time": "5:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1233, "total_steps": 1730, "loss": 0.7579, "learning_rate": 3.845128427552865e-06, "epoch": 1.424404332129964, "percentage": 71.27, "elapsed_time": "12:32:09", "remaining_time": "5:03:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1234, "total_steps": 1730, "loss": 0.7633, "learning_rate": 3.836047802562878e-06, "epoch": 1.4255595667870036, "percentage": 71.33, "elapsed_time": "12:32:43", "remaining_time": "5:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1235, "total_steps": 1730, "loss": 0.7959, "learning_rate": 3.8269424378927925e-06, "epoch": 1.4267148014440434, "percentage": 71.39, "elapsed_time": "12:33:17", "remaining_time": "5:01:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1236, "total_steps": 1730, "loss": 0.782, "learning_rate": 3.81781250217877e-06, "epoch": 1.427870036101083, "percentage": 71.45, "elapsed_time": "12:33:50", "remaining_time": "5:01:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1237, "total_steps": 1730, "loss": 0.7875, "learning_rate": 3.8086581645120347e-06, "epoch": 1.4290252707581228, "percentage": 71.5, "elapsed_time": "12:34:24", "remaining_time": "5:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1238, "total_steps": 1730, "loss": 0.7712, "learning_rate": 3.799479594435751e-06, "epoch": 1.4301805054151624, "percentage": 71.56, "elapsed_time": "12:34:58", "remaining_time": "5:00:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1239, "total_steps": 1730, "loss": 0.8094, "learning_rate": 3.7902769619418783e-06, "epoch": 1.4313357400722022, "percentage": 71.62, "elapsed_time": "12:35:32", "remaining_time": "4:59:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1240, "total_steps": 1730, "loss": 0.7687, "learning_rate": 3.7810504374680274e-06, "epoch": 1.4324909747292418, "percentage": 71.68, "elapsed_time": "12:36:05", "remaining_time": "4:58:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1241, "total_steps": 1730, "loss": 0.7943, "learning_rate": 3.7718001918942982e-06, "epoch": 1.4336462093862816, "percentage": 71.73, "elapsed_time": "12:36:40", "remaining_time": "4:58:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1242, "total_steps": 1730, "loss": 0.7735, "learning_rate": 3.762526396540121e-06, "epoch": 1.4348014440433212, "percentage": 71.79, "elapsed_time": "12:37:13", "remaining_time": "4:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1243, "total_steps": 1730, "loss": 0.7641, "learning_rate": 3.7532292231610774e-06, "epoch": 1.435956678700361, "percentage": 71.85, "elapsed_time": "12:37:46", "remaining_time": "4:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1244, "total_steps": 1730, "loss": 0.7627, "learning_rate": 3.7439088439457257e-06, "epoch": 1.4371119133574006, "percentage": 71.91, "elapsed_time": "12:38:21", "remaining_time": "4:56:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1245, "total_steps": 1730, "loss": 0.7811, "learning_rate": 3.7345654315124035e-06, "epoch": 1.4382671480144404, "percentage": 71.97, "elapsed_time": "12:38:54", "remaining_time": "4:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1246, "total_steps": 1730, "loss": 0.7924, "learning_rate": 3.725199158906041e-06, "epoch": 1.4394223826714803, "percentage": 72.02, "elapsed_time": "12:39:29", "remaining_time": "4:55:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1247, "total_steps": 1730, "loss": 0.7601, "learning_rate": 3.7158101995949486e-06, "epoch": 1.4405776173285199, "percentage": 72.08, "elapsed_time": "12:40:03", "remaining_time": "4:54:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1248, "total_steps": 1730, "loss": 0.7624, "learning_rate": 3.706398727467606e-06, "epoch": 1.4417328519855594, "percentage": 72.14, "elapsed_time": "12:40:36", "remaining_time": "4:53:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1249, "total_steps": 1730, "loss": 0.7867, "learning_rate": 3.696964916829443e-06, "epoch": 1.4428880866425993, "percentage": 72.2, "elapsed_time": "12:41:10", "remaining_time": "4:53:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1250, "total_steps": 1730, "loss": 0.7861, "learning_rate": 3.6875089423996097e-06, "epoch": 1.444043321299639, "percentage": 72.25, "elapsed_time": "12:41:44", "remaining_time": "4:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1251, "total_steps": 1730, "loss": 0.7869, "learning_rate": 3.678030979307741e-06, "epoch": 1.4451985559566787, "percentage": 72.31, "elapsed_time": "12:56:07", "remaining_time": "4:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1252, "total_steps": 1730, "loss": 0.7568, "learning_rate": 3.6685312030907167e-06, "epoch": 1.4463537906137185, "percentage": 72.37, "elapsed_time": "12:56:41", "remaining_time": "4:56:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1253, "total_steps": 1730, "loss": 0.8089, "learning_rate": 3.6590097896894017e-06, "epoch": 1.447509025270758, "percentage": 72.43, "elapsed_time": "12:57:15", "remaining_time": "4:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1254, "total_steps": 1730, "loss": 0.794, "learning_rate": 3.6494669154453978e-06, "epoch": 1.448664259927798, "percentage": 72.49, "elapsed_time": "12:57:48", "remaining_time": "4:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1255, "total_steps": 1730, "loss": 0.7657, "learning_rate": 3.6399027570977703e-06, "epoch": 1.4498194945848375, "percentage": 72.54, "elapsed_time": "12:58:23", "remaining_time": "4:54:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1256, "total_steps": 1730, "loss": 0.7573, "learning_rate": 3.6303174917797783e-06, "epoch": 1.4509747292418773, "percentage": 72.6, "elapsed_time": "12:58:57", "remaining_time": "4:53:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1257, "total_steps": 1730, "loss": 0.7739, "learning_rate": 3.6207112970155915e-06, "epoch": 1.452129963898917, "percentage": 72.66, "elapsed_time": "12:59:31", "remaining_time": "4:53:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1258, "total_steps": 1730, "loss": 0.7612, "learning_rate": 3.611084350717008e-06, "epoch": 1.4532851985559567, "percentage": 72.72, "elapsed_time": "13:00:06", "remaining_time": "4:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1259, "total_steps": 1730, "loss": 0.7892, "learning_rate": 3.60143683118015e-06, "epoch": 1.4544404332129963, "percentage": 72.77, "elapsed_time": "13:00:40", "remaining_time": "4:52:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1260, "total_steps": 1730, "loss": 0.7806, "learning_rate": 3.5917689170821714e-06, "epoch": 1.4555956678700361, "percentage": 72.83, "elapsed_time": "13:01:14", "remaining_time": "4:51:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1261, "total_steps": 1730, "loss": 0.7772, "learning_rate": 3.582080787477941e-06, "epoch": 1.4567509025270757, "percentage": 72.89, "elapsed_time": "13:01:47", "remaining_time": "4:50:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1262, "total_steps": 1730, "loss": 0.7926, "learning_rate": 3.5723726217967315e-06, "epoch": 1.4579061371841155, "percentage": 72.95, "elapsed_time": "13:02:21", "remaining_time": "4:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1263, "total_steps": 1730, "loss": 0.7819, "learning_rate": 3.5626445998388926e-06, "epoch": 1.4590613718411554, "percentage": 73.01, "elapsed_time": "13:02:54", "remaining_time": "4:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1264, "total_steps": 1730, "loss": 0.7845, "learning_rate": 3.552896901772525e-06, "epoch": 1.460216606498195, "percentage": 73.06, "elapsed_time": "13:03:29", "remaining_time": "4:48:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1265, "total_steps": 1730, "loss": 0.7979, "learning_rate": 3.543129708130139e-06, "epoch": 1.4613718411552346, "percentage": 73.12, "elapsed_time": "13:04:03", "remaining_time": "4:48:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1266, "total_steps": 1730, "loss": 0.7869, "learning_rate": 3.533343199805315e-06, "epoch": 1.4625270758122744, "percentage": 73.18, "elapsed_time": "13:04:36", "remaining_time": "4:47:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1267, "total_steps": 1730, "loss": 0.7765, "learning_rate": 3.52353755804935e-06, "epoch": 1.4636823104693142, "percentage": 73.24, "elapsed_time": "13:05:10", "remaining_time": "4:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1268, "total_steps": 1730, "loss": 0.7606, "learning_rate": 3.5137129644679035e-06, "epoch": 1.4648375451263538, "percentage": 73.29, "elapsed_time": "13:05:44", "remaining_time": "4:46:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1269, "total_steps": 1730, "loss": 0.7624, "learning_rate": 3.5038696010176316e-06, "epoch": 1.4659927797833934, "percentage": 73.35, "elapsed_time": "13:06:18", "remaining_time": "4:45:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1270, "total_steps": 1730, "loss": 0.7704, "learning_rate": 3.4940076500028193e-06, "epoch": 1.4671480144404332, "percentage": 73.41, "elapsed_time": "13:06:51", "remaining_time": "4:45:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1271, "total_steps": 1730, "loss": 0.7799, "learning_rate": 3.484127294072003e-06, "epoch": 1.468303249097473, "percentage": 73.47, "elapsed_time": "13:07:25", "remaining_time": "4:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1272, "total_steps": 1730, "loss": 0.7859, "learning_rate": 3.474228716214588e-06, "epoch": 1.4694584837545126, "percentage": 73.53, "elapsed_time": "13:07:59", "remaining_time": "4:43:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1273, "total_steps": 1730, "loss": 0.7553, "learning_rate": 3.464312099757457e-06, "epoch": 1.4706137184115524, "percentage": 73.58, "elapsed_time": "13:08:33", "remaining_time": "4:43:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1274, "total_steps": 1730, "loss": 0.7869, "learning_rate": 3.4543776283615815e-06, "epoch": 1.471768953068592, "percentage": 73.64, "elapsed_time": "13:09:10", "remaining_time": "4:42:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1275, "total_steps": 1730, "loss": 0.7734, "learning_rate": 3.444425486018611e-06, "epoch": 1.4729241877256318, "percentage": 73.7, "elapsed_time": "13:09:44", "remaining_time": "4:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1276, "total_steps": 1730, "loss": 0.7714, "learning_rate": 3.434455857047475e-06, "epoch": 1.4740794223826714, "percentage": 73.76, "elapsed_time": "13:10:19", "remaining_time": "4:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1277, "total_steps": 1730, "loss": 0.7912, "learning_rate": 3.424468926090961e-06, "epoch": 1.4752346570397112, "percentage": 73.82, "elapsed_time": "13:10:53", "remaining_time": "4:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1278, "total_steps": 1730, "loss": 0.7725, "learning_rate": 3.4144648781122987e-06, "epoch": 1.4763898916967508, "percentage": 73.87, "elapsed_time": "13:11:27", "remaining_time": "4:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1279, "total_steps": 1730, "loss": 0.7548, "learning_rate": 3.404443898391737e-06, "epoch": 1.4775451263537906, "percentage": 73.93, "elapsed_time": "13:12:00", "remaining_time": "4:39:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1280, "total_steps": 1730, "loss": 0.7882, "learning_rate": 3.3944061725231055e-06, "epoch": 1.4787003610108302, "percentage": 73.99, "elapsed_time": "13:12:34", "remaining_time": "4:38:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1281, "total_steps": 1730, "loss": 0.7617, "learning_rate": 3.3843518864103857e-06, "epoch": 1.47985559566787, "percentage": 74.05, "elapsed_time": "13:13:09", "remaining_time": "4:38:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1282, "total_steps": 1730, "loss": 0.7798, "learning_rate": 3.374281226264259e-06, "epoch": 1.4810108303249097, "percentage": 74.1, "elapsed_time": "13:13:42", "remaining_time": "4:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1283, "total_steps": 1730, "loss": 0.7647, "learning_rate": 3.364194378598666e-06, "epoch": 1.4821660649819495, "percentage": 74.16, "elapsed_time": "13:14:16", "remaining_time": "4:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1284, "total_steps": 1730, "loss": 0.777, "learning_rate": 3.3540915302273476e-06, "epoch": 1.4833212996389893, "percentage": 74.22, "elapsed_time": "13:14:50", "remaining_time": "4:36:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1285, "total_steps": 1730, "loss": 0.7704, "learning_rate": 3.343972868260385e-06, "epoch": 1.4844765342960289, "percentage": 74.28, "elapsed_time": "13:15:24", "remaining_time": "4:35:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1286, "total_steps": 1730, "loss": 0.7465, "learning_rate": 3.333838580100737e-06, "epoch": 1.4856317689530685, "percentage": 74.34, "elapsed_time": "13:15:57", "remaining_time": "4:34:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1287, "total_steps": 1730, "loss": 0.798, "learning_rate": 3.32368885344077e-06, "epoch": 1.4867870036101083, "percentage": 74.39, "elapsed_time": "13:16:31", "remaining_time": "4:34:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1288, "total_steps": 1730, "loss": 0.7946, "learning_rate": 3.3135238762587723e-06, "epoch": 1.487942238267148, "percentage": 74.45, "elapsed_time": "13:17:05", "remaining_time": "4:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1289, "total_steps": 1730, "loss": 0.7762, "learning_rate": 3.3033438368154886e-06, "epoch": 1.4890974729241877, "percentage": 74.51, "elapsed_time": "13:17:39", "remaining_time": "4:32:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1290, "total_steps": 1730, "loss": 0.7977, "learning_rate": 3.2931489236506183e-06, "epoch": 1.4902527075812273, "percentage": 74.57, "elapsed_time": "13:18:14", "remaining_time": "4:32:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1291, "total_steps": 1730, "loss": 0.7634, "learning_rate": 3.282939325579333e-06, "epoch": 1.4914079422382671, "percentage": 74.62, "elapsed_time": "13:18:48", "remaining_time": "4:31:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1292, "total_steps": 1730, "loss": 0.7917, "learning_rate": 3.272715231688775e-06, "epoch": 1.492563176895307, "percentage": 74.68, "elapsed_time": "13:19:22", "remaining_time": "4:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1293, "total_steps": 1730, "loss": 0.7507, "learning_rate": 3.2624768313345594e-06, "epoch": 1.4937184115523465, "percentage": 74.74, "elapsed_time": "13:19:56", "remaining_time": "4:30:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1294, "total_steps": 1730, "loss": 0.7751, "learning_rate": 3.25222431413726e-06, "epoch": 1.4948736462093863, "percentage": 74.8, "elapsed_time": "13:20:30", "remaining_time": "4:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1295, "total_steps": 1730, "loss": 0.7697, "learning_rate": 3.241957869978907e-06, "epoch": 1.496028880866426, "percentage": 74.86, "elapsed_time": "13:21:05", "remaining_time": "4:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1296, "total_steps": 1730, "loss": 0.8087, "learning_rate": 3.2316776889994627e-06, "epoch": 1.4971841155234658, "percentage": 74.91, "elapsed_time": "13:21:39", "remaining_time": "4:28:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1297, "total_steps": 1730, "loss": 0.7511, "learning_rate": 3.221383961593303e-06, "epoch": 1.4983393501805053, "percentage": 74.97, "elapsed_time": "13:22:13", "remaining_time": "4:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1298, "total_steps": 1730, "loss": 0.7741, "learning_rate": 3.2110768784056884e-06, "epoch": 1.4994945848375452, "percentage": 75.03, "elapsed_time": "13:22:47", "remaining_time": "4:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1299, "total_steps": 1730, "loss": 0.7631, "learning_rate": 3.2007566303292416e-06, "epoch": 1.5006498194945848, "percentage": 75.09, "elapsed_time": "13:23:20", "remaining_time": "4:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1300, "total_steps": 1730, "loss": 0.7574, "learning_rate": 3.1904234085003976e-06, "epoch": 1.5018050541516246, "percentage": 75.14, "elapsed_time": "13:23:53", "remaining_time": "4:25:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1301, "total_steps": 1730, "loss": 0.8047, "learning_rate": 3.180077404295881e-06, "epoch": 1.5029602888086644, "percentage": 75.2, "elapsed_time": "13:24:27", "remaining_time": "4:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1302, "total_steps": 1730, "loss": 0.7663, "learning_rate": 3.1697188093291454e-06, "epoch": 1.504115523465704, "percentage": 75.26, "elapsed_time": "13:25:01", "remaining_time": "4:24:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1303, "total_steps": 1730, "loss": 0.8022, "learning_rate": 3.1593478154468364e-06, "epoch": 1.5052707581227436, "percentage": 75.32, "elapsed_time": "13:25:36", "remaining_time": "4:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1304, "total_steps": 1730, "loss": 0.779, "learning_rate": 3.148964614725232e-06, "epoch": 1.5064259927797834, "percentage": 75.38, "elapsed_time": "13:26:09", "remaining_time": "4:23:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1305, "total_steps": 1730, "loss": 0.7833, "learning_rate": 3.138569399466689e-06, "epoch": 1.5075812274368232, "percentage": 75.43, "elapsed_time": "13:26:43", "remaining_time": "4:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1306, "total_steps": 1730, "loss": 0.7753, "learning_rate": 3.128162362196077e-06, "epoch": 1.5087364620938628, "percentage": 75.49, "elapsed_time": "13:27:17", "remaining_time": "4:22:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1307, "total_steps": 1730, "loss": 0.7648, "learning_rate": 3.117743695657219e-06, "epoch": 1.5098916967509024, "percentage": 75.55, "elapsed_time": "13:27:51", "remaining_time": "4:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1308, "total_steps": 1730, "loss": 0.7819, "learning_rate": 3.107313592809315e-06, "epoch": 1.5110469314079422, "percentage": 75.61, "elapsed_time": "13:28:25", "remaining_time": "4:20:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1309, "total_steps": 1730, "loss": 0.7831, "learning_rate": 3.0968722468233743e-06, "epoch": 1.512202166064982, "percentage": 75.66, "elapsed_time": "13:28:59", "remaining_time": "4:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1310, "total_steps": 1730, "loss": 0.7874, "learning_rate": 3.086419851078632e-06, "epoch": 1.5133574007220216, "percentage": 75.72, "elapsed_time": "13:29:32", "remaining_time": "4:19:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1311, "total_steps": 1730, "loss": 0.7687, "learning_rate": 3.0759565991589733e-06, "epoch": 1.5145126353790612, "percentage": 75.78, "elapsed_time": "13:30:06", "remaining_time": "4:18:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1312, "total_steps": 1730, "loss": 0.7722, "learning_rate": 3.0654826848493436e-06, "epoch": 1.515667870036101, "percentage": 75.84, "elapsed_time": "13:30:40", "remaining_time": "4:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1313, "total_steps": 1730, "loss": 0.7731, "learning_rate": 3.0549983021321634e-06, "epoch": 1.5168231046931409, "percentage": 75.9, "elapsed_time": "13:31:14", "remaining_time": "4:17:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1314, "total_steps": 1730, "loss": 0.7773, "learning_rate": 3.044503645183731e-06, "epoch": 1.5179783393501805, "percentage": 75.95, "elapsed_time": "13:31:48", "remaining_time": "4:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1315, "total_steps": 1730, "loss": 0.7911, "learning_rate": 3.0339989083706306e-06, "epoch": 1.5191335740072203, "percentage": 76.01, "elapsed_time": "13:32:21", "remaining_time": "4:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1316, "total_steps": 1730, "loss": 0.7383, "learning_rate": 3.0234842862461307e-06, "epoch": 1.5202888086642599, "percentage": 76.07, "elapsed_time": "13:32:56", "remaining_time": "4:15:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1317, "total_steps": 1730, "loss": 0.766, "learning_rate": 3.0129599735465816e-06, "epoch": 1.5214440433212997, "percentage": 76.13, "elapsed_time": "13:33:30", "remaining_time": "4:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1318, "total_steps": 1730, "loss": 0.7661, "learning_rate": 3.0024261651878056e-06, "epoch": 1.5225992779783395, "percentage": 76.18, "elapsed_time": "13:34:03", "remaining_time": "4:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1319, "total_steps": 1730, "loss": 0.785, "learning_rate": 2.9918830562614927e-06, "epoch": 1.523754512635379, "percentage": 76.24, "elapsed_time": "13:34:37", "remaining_time": "4:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1320, "total_steps": 1730, "loss": 0.7814, "learning_rate": 2.9813308420315825e-06, "epoch": 1.5249097472924187, "percentage": 76.3, "elapsed_time": "13:35:11", "remaining_time": "4:13:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1321, "total_steps": 1730, "loss": 0.7875, "learning_rate": 2.9707697179306505e-06, "epoch": 1.5260649819494585, "percentage": 76.36, "elapsed_time": "13:35:45", "remaining_time": "4:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1322, "total_steps": 1730, "loss": 0.7683, "learning_rate": 2.9601998795562865e-06, "epoch": 1.5272202166064983, "percentage": 76.42, "elapsed_time": "13:36:18", "remaining_time": "4:11:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1323, "total_steps": 1730, "loss": 0.7671, "learning_rate": 2.9496215226674747e-06, "epoch": 1.528375451263538, "percentage": 76.47, "elapsed_time": "13:36:52", "remaining_time": "4:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1324, "total_steps": 1730, "loss": 0.7705, "learning_rate": 2.9390348431809656e-06, "epoch": 1.5295306859205775, "percentage": 76.53, "elapsed_time": "13:37:26", "remaining_time": "4:10:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1325, "total_steps": 1730, "loss": 0.7771, "learning_rate": 2.9284400371676486e-06, "epoch": 1.5306859205776173, "percentage": 76.59, "elapsed_time": "13:38:00", "remaining_time": "4:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1326, "total_steps": 1730, "loss": 0.7683, "learning_rate": 2.917837300848923e-06, "epoch": 1.5318411552346571, "percentage": 76.65, "elapsed_time": "13:38:34", "remaining_time": "4:09:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1327, "total_steps": 1730, "loss": 0.789, "learning_rate": 2.9072268305930578e-06, "epoch": 1.5329963898916967, "percentage": 76.71, "elapsed_time": "13:39:08", "remaining_time": "4:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1328, "total_steps": 1730, "loss": 0.7699, "learning_rate": 2.896608822911561e-06, "epoch": 1.5341516245487363, "percentage": 76.76, "elapsed_time": "13:39:41", "remaining_time": "4:08:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1329, "total_steps": 1730, "loss": 0.773, "learning_rate": 2.8859834744555377e-06, "epoch": 1.5353068592057761, "percentage": 76.82, "elapsed_time": "13:40:15", "remaining_time": "4:07:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1330, "total_steps": 1730, "loss": 0.791, "learning_rate": 2.8753509820120464e-06, "epoch": 1.536462093862816, "percentage": 76.88, "elapsed_time": "13:40:49", "remaining_time": "4:06:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1331, "total_steps": 1730, "loss": 0.7643, "learning_rate": 2.864711542500457e-06, "epoch": 1.5376173285198556, "percentage": 76.94, "elapsed_time": "13:41:23", "remaining_time": "4:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1332, "total_steps": 1730, "loss": 0.7813, "learning_rate": 2.8540653529688033e-06, "epoch": 1.5387725631768951, "percentage": 76.99, "elapsed_time": "13:41:57", "remaining_time": "4:05:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1333, "total_steps": 1730, "loss": 0.7905, "learning_rate": 2.8434126105901333e-06, "epoch": 1.539927797833935, "percentage": 77.05, "elapsed_time": "13:42:31", "remaining_time": "4:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1334, "total_steps": 1730, "loss": 0.771, "learning_rate": 2.8327535126588563e-06, "epoch": 1.5410830324909748, "percentage": 77.11, "elapsed_time": "13:43:04", "remaining_time": "4:04:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1335, "total_steps": 1730, "loss": 0.792, "learning_rate": 2.8220882565870893e-06, "epoch": 1.5422382671480146, "percentage": 77.17, "elapsed_time": "13:43:38", "remaining_time": "4:03:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1336, "total_steps": 1730, "loss": 0.7674, "learning_rate": 2.811417039901001e-06, "epoch": 1.5433935018050542, "percentage": 77.23, "elapsed_time": "13:44:12", "remaining_time": "4:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1337, "total_steps": 1730, "loss": 0.7745, "learning_rate": 2.800740060237157e-06, "epoch": 1.5445487364620938, "percentage": 77.28, "elapsed_time": "13:44:46", "remaining_time": "4:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1338, "total_steps": 1730, "loss": 0.7645, "learning_rate": 2.7900575153388525e-06, "epoch": 1.5457039711191336, "percentage": 77.34, "elapsed_time": "13:45:19", "remaining_time": "4:01:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1339, "total_steps": 1730, "loss": 0.8149, "learning_rate": 2.779369603052456e-06, "epoch": 1.5468592057761734, "percentage": 77.4, "elapsed_time": "13:45:54", "remaining_time": "4:01:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1340, "total_steps": 1730, "loss": 0.7552, "learning_rate": 2.768676521323742e-06, "epoch": 1.548014440433213, "percentage": 77.46, "elapsed_time": "13:46:27", "remaining_time": "4:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1341, "total_steps": 1730, "loss": 0.7712, "learning_rate": 2.757978468194226e-06, "epoch": 1.5491696750902526, "percentage": 77.51, "elapsed_time": "13:47:01", "remaining_time": "3:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1342, "total_steps": 1730, "loss": 0.7511, "learning_rate": 2.747275641797496e-06, "epoch": 1.5503249097472924, "percentage": 77.57, "elapsed_time": "13:47:35", "remaining_time": "3:59:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1343, "total_steps": 1730, "loss": 0.7659, "learning_rate": 2.736568240355544e-06, "epoch": 1.5514801444043322, "percentage": 77.63, "elapsed_time": "13:48:09", "remaining_time": "3:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1344, "total_steps": 1730, "loss": 0.7547, "learning_rate": 2.725856462175095e-06, "epoch": 1.5526353790613718, "percentage": 77.69, "elapsed_time": "13:48:42", "remaining_time": "3:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1345, "total_steps": 1730, "loss": 0.7996, "learning_rate": 2.715140505643932e-06, "epoch": 1.5537906137184114, "percentage": 77.75, "elapsed_time": "13:49:16", "remaining_time": "3:57:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1346, "total_steps": 1730, "loss": 0.7641, "learning_rate": 2.704420569227224e-06, "epoch": 1.5549458483754512, "percentage": 77.8, "elapsed_time": "13:49:50", "remaining_time": "3:56:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1347, "total_steps": 1730, "loss": 0.7466, "learning_rate": 2.6936968514638495e-06, "epoch": 1.556101083032491, "percentage": 77.86, "elapsed_time": "13:50:24", "remaining_time": "3:56:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1348, "total_steps": 1730, "loss": 0.7826, "learning_rate": 2.68296955096272e-06, "epoch": 1.5572563176895307, "percentage": 77.92, "elapsed_time": "13:50:58", "remaining_time": "3:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1349, "total_steps": 1730, "loss": 0.789, "learning_rate": 2.672238866399099e-06, "epoch": 1.5584115523465703, "percentage": 77.98, "elapsed_time": "13:51:32", "remaining_time": "3:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1350, "total_steps": 1730, "loss": 0.784, "learning_rate": 2.6615049965109296e-06, "epoch": 1.55956678700361, "percentage": 78.03, "elapsed_time": "13:52:06", "remaining_time": "3:54:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1351, "total_steps": 1730, "loss": 0.7934, "learning_rate": 2.6507681400951414e-06, "epoch": 1.5607220216606499, "percentage": 78.09, "elapsed_time": "13:52:40", "remaining_time": "3:53:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1352, "total_steps": 1730, "loss": 0.7554, "learning_rate": 2.640028496003984e-06, "epoch": 1.5618772563176895, "percentage": 78.15, "elapsed_time": "13:53:14", "remaining_time": "3:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1353, "total_steps": 1730, "loss": 0.7652, "learning_rate": 2.629286263141329e-06, "epoch": 1.5630324909747293, "percentage": 78.21, "elapsed_time": "13:53:48", "remaining_time": "3:52:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1354, "total_steps": 1730, "loss": 0.7515, "learning_rate": 2.6185416404589985e-06, "epoch": 1.5641877256317689, "percentage": 78.27, "elapsed_time": "13:54:22", "remaining_time": "3:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1355, "total_steps": 1730, "loss": 0.7839, "learning_rate": 2.607794826953075e-06, "epoch": 1.5653429602888087, "percentage": 78.32, "elapsed_time": "13:54:56", "remaining_time": "3:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1356, "total_steps": 1730, "loss": 0.773, "learning_rate": 2.5970460216602133e-06, "epoch": 1.5664981949458485, "percentage": 78.38, "elapsed_time": "13:55:29", "remaining_time": "3:50:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1357, "total_steps": 1730, "loss": 0.7641, "learning_rate": 2.5862954236539587e-06, "epoch": 1.5676534296028881, "percentage": 78.44, "elapsed_time": "13:56:03", "remaining_time": "3:49:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1358, "total_steps": 1730, "loss": 0.7869, "learning_rate": 2.5755432320410594e-06, "epoch": 1.5688086642599277, "percentage": 78.5, "elapsed_time": "13:56:37", "remaining_time": "3:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1359, "total_steps": 1730, "loss": 0.7873, "learning_rate": 2.5647896459577757e-06, "epoch": 1.5699638989169675, "percentage": 78.55, "elapsed_time": "13:57:12", "remaining_time": "3:48:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1360, "total_steps": 1730, "loss": 0.7805, "learning_rate": 2.5540348645661965e-06, "epoch": 1.5711191335740073, "percentage": 78.61, "elapsed_time": "13:57:46", "remaining_time": "3:47:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1361, "total_steps": 1730, "loss": 0.791, "learning_rate": 2.5432790870505487e-06, "epoch": 1.572274368231047, "percentage": 78.67, "elapsed_time": "13:58:19", "remaining_time": "3:47:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1362, "total_steps": 1730, "loss": 0.7814, "learning_rate": 2.5325225126135045e-06, "epoch": 1.5734296028880865, "percentage": 78.73, "elapsed_time": "13:58:53", "remaining_time": "3:46:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1363, "total_steps": 1730, "loss": 0.8046, "learning_rate": 2.521765340472499e-06, "epoch": 1.5745848375451263, "percentage": 78.79, "elapsed_time": "13:59:27", "remaining_time": "3:46:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1364, "total_steps": 1730, "loss": 0.757, "learning_rate": 2.5110077698560364e-06, "epoch": 1.5757400722021662, "percentage": 78.84, "elapsed_time": "14:00:01", "remaining_time": "3:45:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1365, "total_steps": 1730, "loss": 0.7729, "learning_rate": 2.5002500000000003e-06, "epoch": 1.5768953068592058, "percentage": 78.9, "elapsed_time": "14:00:35", "remaining_time": "3:44:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1366, "total_steps": 1730, "loss": 0.7825, "learning_rate": 2.4894922301439643e-06, "epoch": 1.5780505415162454, "percentage": 78.96, "elapsed_time": "14:01:09", "remaining_time": "3:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1367, "total_steps": 1730, "loss": 0.7783, "learning_rate": 2.478734659527501e-06, "epoch": 1.5792057761732852, "percentage": 79.02, "elapsed_time": "14:01:43", "remaining_time": "3:43:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1368, "total_steps": 1730, "loss": 0.7617, "learning_rate": 2.467977487386497e-06, "epoch": 1.580361010830325, "percentage": 79.08, "elapsed_time": "14:02:17", "remaining_time": "3:42:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1369, "total_steps": 1730, "loss": 0.7494, "learning_rate": 2.4572209129494524e-06, "epoch": 1.5815162454873646, "percentage": 79.13, "elapsed_time": "14:02:51", "remaining_time": "3:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1370, "total_steps": 1730, "loss": 0.8013, "learning_rate": 2.4464651354338037e-06, "epoch": 1.5826714801444042, "percentage": 79.19, "elapsed_time": "14:03:25", "remaining_time": "3:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1371, "total_steps": 1730, "loss": 0.7706, "learning_rate": 2.435710354042225e-06, "epoch": 1.583826714801444, "percentage": 79.25, "elapsed_time": "14:03:58", "remaining_time": "3:40:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1372, "total_steps": 1730, "loss": 0.8006, "learning_rate": 2.4249567679589417e-06, "epoch": 1.5849819494584838, "percentage": 79.31, "elapsed_time": "14:04:32", "remaining_time": "3:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1373, "total_steps": 1730, "loss": 0.7609, "learning_rate": 2.4142045763460415e-06, "epoch": 1.5861371841155236, "percentage": 79.36, "elapsed_time": "14:05:06", "remaining_time": "3:39:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1374, "total_steps": 1730, "loss": 0.8048, "learning_rate": 2.403453978339787e-06, "epoch": 1.5872924187725632, "percentage": 79.42, "elapsed_time": "14:05:40", "remaining_time": "3:39:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1375, "total_steps": 1730, "loss": 0.7731, "learning_rate": 2.392705173046925e-06, "epoch": 1.5884476534296028, "percentage": 79.48, "elapsed_time": "14:06:14", "remaining_time": "3:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1376, "total_steps": 1730, "loss": 0.7858, "learning_rate": 2.3819583595410013e-06, "epoch": 1.5896028880866426, "percentage": 79.54, "elapsed_time": "14:06:48", "remaining_time": "3:37:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1377, "total_steps": 1730, "loss": 0.7438, "learning_rate": 2.3712137368586717e-06, "epoch": 1.5907581227436824, "percentage": 79.6, "elapsed_time": "14:07:22", "remaining_time": "3:37:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1378, "total_steps": 1730, "loss": 0.7835, "learning_rate": 2.3604715039960173e-06, "epoch": 1.591913357400722, "percentage": 79.65, "elapsed_time": "14:07:56", "remaining_time": "3:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1379, "total_steps": 1730, "loss": 0.7716, "learning_rate": 2.3497318599048592e-06, "epoch": 1.5930685920577616, "percentage": 79.71, "elapsed_time": "14:08:30", "remaining_time": "3:35:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1380, "total_steps": 1730, "loss": 0.7556, "learning_rate": 2.338995003489072e-06, "epoch": 1.5942238267148015, "percentage": 79.77, "elapsed_time": "14:09:04", "remaining_time": "3:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1381, "total_steps": 1730, "loss": 0.7708, "learning_rate": 2.328261133600902e-06, "epoch": 1.5953790613718413, "percentage": 79.83, "elapsed_time": "14:09:38", "remaining_time": "3:34:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1382, "total_steps": 1730, "loss": 0.7837, "learning_rate": 2.317530449037281e-06, "epoch": 1.5965342960288809, "percentage": 79.88, "elapsed_time": "14:10:12", "remaining_time": "3:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1383, "total_steps": 1730, "loss": 0.7575, "learning_rate": 2.3068031485361516e-06, "epoch": 1.5976895306859205, "percentage": 79.94, "elapsed_time": "14:10:46", "remaining_time": "3:33:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1384, "total_steps": 1730, "loss": 0.8002, "learning_rate": 2.296079430772777e-06, "epoch": 1.5988447653429603, "percentage": 80.0, "elapsed_time": "14:11:20", "remaining_time": "3:32:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1385, "total_steps": 1730, "loss": 0.8076, "learning_rate": 2.285359494356068e-06, "epoch": 1.6, "percentage": 80.06, "elapsed_time": "14:11:54", "remaining_time": "3:32:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1386, "total_steps": 1730, "loss": 0.7601, "learning_rate": 2.274643537824905e-06, "epoch": 1.6011552346570397, "percentage": 80.12, "elapsed_time": "14:12:28", "remaining_time": "3:31:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1387, "total_steps": 1730, "loss": 0.7777, "learning_rate": 2.263931759644456e-06, "epoch": 1.6023104693140793, "percentage": 80.17, "elapsed_time": "14:13:02", "remaining_time": "3:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1388, "total_steps": 1730, "loss": 0.7779, "learning_rate": 2.2532243582025048e-06, "epoch": 1.603465703971119, "percentage": 80.23, "elapsed_time": "14:13:35", "remaining_time": "3:30:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1389, "total_steps": 1730, "loss": 0.7623, "learning_rate": 2.242521531805775e-06, "epoch": 1.604620938628159, "percentage": 80.29, "elapsed_time": "14:14:09", "remaining_time": "3:29:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1390, "total_steps": 1730, "loss": 0.769, "learning_rate": 2.2318234786762586e-06, "epoch": 1.6057761732851985, "percentage": 80.35, "elapsed_time": "14:14:44", "remaining_time": "3:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1391, "total_steps": 1730, "loss": 0.8051, "learning_rate": 2.2211303969475444e-06, "epoch": 1.6069314079422383, "percentage": 80.4, "elapsed_time": "14:15:18", "remaining_time": "3:28:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1392, "total_steps": 1730, "loss": 0.8117, "learning_rate": 2.210442484661148e-06, "epoch": 1.608086642599278, "percentage": 80.46, "elapsed_time": "14:15:53", "remaining_time": "3:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1393, "total_steps": 1730, "loss": 0.7768, "learning_rate": 2.199759939762843e-06, "epoch": 1.6092418772563177, "percentage": 80.52, "elapsed_time": "14:16:27", "remaining_time": "3:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1394, "total_steps": 1730, "loss": 0.7575, "learning_rate": 2.1890829600989995e-06, "epoch": 1.6103971119133575, "percentage": 80.58, "elapsed_time": "14:17:01", "remaining_time": "3:26:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1395, "total_steps": 1730, "loss": 0.7599, "learning_rate": 2.1784117434129113e-06, "epoch": 1.6115523465703971, "percentage": 80.64, "elapsed_time": "14:17:35", "remaining_time": "3:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1396, "total_steps": 1730, "loss": 0.7661, "learning_rate": 2.167746487341144e-06, "epoch": 1.6127075812274367, "percentage": 80.69, "elapsed_time": "14:18:08", "remaining_time": "3:25:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1397, "total_steps": 1730, "loss": 0.7698, "learning_rate": 2.157087389409867e-06, "epoch": 1.6138628158844766, "percentage": 80.75, "elapsed_time": "14:18:43", "remaining_time": "3:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1398, "total_steps": 1730, "loss": 0.7695, "learning_rate": 2.1464346470311965e-06, "epoch": 1.6150180505415164, "percentage": 80.81, "elapsed_time": "14:19:17", "remaining_time": "3:24:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1399, "total_steps": 1730, "loss": 0.7622, "learning_rate": 2.135788457499544e-06, "epoch": 1.616173285198556, "percentage": 80.87, "elapsed_time": "14:19:50", "remaining_time": "3:23:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1400, "total_steps": 1730, "loss": 0.7639, "learning_rate": 2.1251490179879547e-06, "epoch": 1.6173285198555956, "percentage": 80.92, "elapsed_time": "14:20:24", "remaining_time": "3:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1401, "total_steps": 1730, "loss": 0.7893, "learning_rate": 2.1145165255444643e-06, "epoch": 1.6184837545126354, "percentage": 80.98, "elapsed_time": "14:20:58", "remaining_time": "3:22:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1402, "total_steps": 1730, "loss": 0.7936, "learning_rate": 2.1038911770884395e-06, "epoch": 1.6196389891696752, "percentage": 81.04, "elapsed_time": "14:21:31", "remaining_time": "3:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1403, "total_steps": 1730, "loss": 0.7506, "learning_rate": 2.0932731694069438e-06, "epoch": 1.6207942238267148, "percentage": 81.1, "elapsed_time": "14:22:06", "remaining_time": "3:20:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1404, "total_steps": 1730, "loss": 0.7623, "learning_rate": 2.0826626991510775e-06, "epoch": 1.6219494584837544, "percentage": 81.16, "elapsed_time": "14:22:41", "remaining_time": "3:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1405, "total_steps": 1730, "loss": 0.7444, "learning_rate": 2.072059962832352e-06, "epoch": 1.6231046931407942, "percentage": 81.21, "elapsed_time": "14:23:14", "remaining_time": "3:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1406, "total_steps": 1730, "loss": 0.7869, "learning_rate": 2.0614651568190354e-06, "epoch": 1.624259927797834, "percentage": 81.27, "elapsed_time": "14:23:48", "remaining_time": "3:19:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1407, "total_steps": 1730, "loss": 0.8075, "learning_rate": 2.050878477332526e-06, "epoch": 1.6254151624548736, "percentage": 81.33, "elapsed_time": "14:24:22", "remaining_time": "3:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1408, "total_steps": 1730, "loss": 0.7647, "learning_rate": 2.040300120443714e-06, "epoch": 1.6265703971119132, "percentage": 81.39, "elapsed_time": "14:24:56", "remaining_time": "3:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1409, "total_steps": 1730, "loss": 0.7594, "learning_rate": 2.02973028206935e-06, "epoch": 1.627725631768953, "percentage": 81.45, "elapsed_time": "14:25:30", "remaining_time": "3:17:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1410, "total_steps": 1730, "loss": 0.7664, "learning_rate": 2.019169157968418e-06, "epoch": 1.6288808664259928, "percentage": 81.5, "elapsed_time": "14:26:03", "remaining_time": "3:16:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1411, "total_steps": 1730, "loss": 0.7637, "learning_rate": 2.008616943738508e-06, "epoch": 1.6300361010830327, "percentage": 81.56, "elapsed_time": "14:26:36", "remaining_time": "3:15:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1412, "total_steps": 1730, "loss": 0.7674, "learning_rate": 1.9980738348121955e-06, "epoch": 1.6311913357400722, "percentage": 81.62, "elapsed_time": "14:27:10", "remaining_time": "3:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1413, "total_steps": 1730, "loss": 0.7703, "learning_rate": 1.9875400264534194e-06, "epoch": 1.6323465703971118, "percentage": 81.68, "elapsed_time": "14:27:44", "remaining_time": "3:14:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1414, "total_steps": 1730, "loss": 0.7825, "learning_rate": 1.97701571375387e-06, "epoch": 1.6335018050541517, "percentage": 81.73, "elapsed_time": "14:28:18", "remaining_time": "3:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1415, "total_steps": 1730, "loss": 0.7875, "learning_rate": 1.9665010916293704e-06, "epoch": 1.6346570397111915, "percentage": 81.79, "elapsed_time": "14:28:51", "remaining_time": "3:13:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1416, "total_steps": 1730, "loss": 0.7745, "learning_rate": 1.95599635481627e-06, "epoch": 1.635812274368231, "percentage": 81.85, "elapsed_time": "14:29:25", "remaining_time": "3:12:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1417, "total_steps": 1730, "loss": 0.7825, "learning_rate": 1.9455016978678377e-06, "epoch": 1.6369675090252707, "percentage": 81.91, "elapsed_time": "14:29:59", "remaining_time": "3:12:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1418, "total_steps": 1730, "loss": 0.7654, "learning_rate": 1.935017315150656e-06, "epoch": 1.6381227436823105, "percentage": 81.97, "elapsed_time": "14:30:33", "remaining_time": "3:11:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1419, "total_steps": 1730, "loss": 0.7513, "learning_rate": 1.9245434008410273e-06, "epoch": 1.6392779783393503, "percentage": 82.02, "elapsed_time": "14:31:07", "remaining_time": "3:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1420, "total_steps": 1730, "loss": 0.7756, "learning_rate": 1.914080148921368e-06, "epoch": 1.6404332129963899, "percentage": 82.08, "elapsed_time": "14:31:41", "remaining_time": "3:10:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1421, "total_steps": 1730, "loss": 0.7702, "learning_rate": 1.903627753176627e-06, "epoch": 1.6415884476534295, "percentage": 82.14, "elapsed_time": "14:32:15", "remaining_time": "3:09:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1422, "total_steps": 1730, "loss": 0.7727, "learning_rate": 1.893186407190685e-06, "epoch": 1.6427436823104693, "percentage": 82.2, "elapsed_time": "14:32:49", "remaining_time": "3:09:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1423, "total_steps": 1730, "loss": 0.7856, "learning_rate": 1.8827563043427818e-06, "epoch": 1.6438989169675091, "percentage": 82.25, "elapsed_time": "14:33:24", "remaining_time": "3:08:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1424, "total_steps": 1730, "loss": 0.775, "learning_rate": 1.8723376378039229e-06, "epoch": 1.6450541516245487, "percentage": 82.31, "elapsed_time": "14:33:57", "remaining_time": "3:07:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1425, "total_steps": 1730, "loss": 0.7464, "learning_rate": 1.8619306005333118e-06, "epoch": 1.6462093862815883, "percentage": 82.37, "elapsed_time": "14:34:31", "remaining_time": "3:07:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1426, "total_steps": 1730, "loss": 0.7944, "learning_rate": 1.851535385274768e-06, "epoch": 1.6473646209386281, "percentage": 82.43, "elapsed_time": "14:35:05", "remaining_time": "3:06:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1427, "total_steps": 1730, "loss": 0.7646, "learning_rate": 1.8411521845531638e-06, "epoch": 1.648519855595668, "percentage": 82.49, "elapsed_time": "14:35:38", "remaining_time": "3:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1428, "total_steps": 1730, "loss": 0.7802, "learning_rate": 1.8307811906708552e-06, "epoch": 1.6496750902527075, "percentage": 82.54, "elapsed_time": "14:36:12", "remaining_time": "3:05:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1429, "total_steps": 1730, "loss": 0.7686, "learning_rate": 1.8204225957041197e-06, "epoch": 1.6508303249097471, "percentage": 82.6, "elapsed_time": "14:36:45", "remaining_time": "3:04:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1430, "total_steps": 1730, "loss": 0.79, "learning_rate": 1.8100765914996026e-06, "epoch": 1.651985559566787, "percentage": 82.66, "elapsed_time": "14:37:20", "remaining_time": "3:04:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1431, "total_steps": 1730, "loss": 0.766, "learning_rate": 1.7997433696707597e-06, "epoch": 1.6531407942238268, "percentage": 82.72, "elapsed_time": "14:37:53", "remaining_time": "3:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1432, "total_steps": 1730, "loss": 0.7718, "learning_rate": 1.789423121594312e-06, "epoch": 1.6542960288808666, "percentage": 82.77, "elapsed_time": "14:38:27", "remaining_time": "3:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1433, "total_steps": 1730, "loss": 0.7813, "learning_rate": 1.779116038406698e-06, "epoch": 1.6554512635379062, "percentage": 82.83, "elapsed_time": "14:39:00", "remaining_time": "3:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1434, "total_steps": 1730, "loss": 0.7772, "learning_rate": 1.768822311000538e-06, "epoch": 1.6566064981949458, "percentage": 82.89, "elapsed_time": "14:39:34", "remaining_time": "3:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1435, "total_steps": 1730, "loss": 0.7958, "learning_rate": 1.7585421300210932e-06, "epoch": 1.6577617328519856, "percentage": 82.95, "elapsed_time": "14:40:08", "remaining_time": "3:00:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1436, "total_steps": 1730, "loss": 0.774, "learning_rate": 1.7482756858627406e-06, "epoch": 1.6589169675090254, "percentage": 83.01, "elapsed_time": "14:40:42", "remaining_time": "3:00:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1437, "total_steps": 1730, "loss": 0.7763, "learning_rate": 1.7380231686654419e-06, "epoch": 1.660072202166065, "percentage": 83.06, "elapsed_time": "14:41:16", "remaining_time": "2:59:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1438, "total_steps": 1730, "loss": 0.7602, "learning_rate": 1.7277847683112251e-06, "epoch": 1.6612274368231046, "percentage": 83.12, "elapsed_time": "14:41:50", "remaining_time": "2:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1439, "total_steps": 1730, "loss": 0.7772, "learning_rate": 1.7175606744206683e-06, "epoch": 1.6623826714801444, "percentage": 83.18, "elapsed_time": "14:42:24", "remaining_time": "2:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1440, "total_steps": 1730, "loss": 0.7776, "learning_rate": 1.707351076349382e-06, "epoch": 1.6635379061371842, "percentage": 83.24, "elapsed_time": "14:42:58", "remaining_time": "2:57:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1441, "total_steps": 1730, "loss": 0.769, "learning_rate": 1.697156163184512e-06, "epoch": 1.6646931407942238, "percentage": 83.29, "elapsed_time": "14:43:31", "remaining_time": "2:57:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1442, "total_steps": 1730, "loss": 0.7614, "learning_rate": 1.6869761237412275e-06, "epoch": 1.6658483754512634, "percentage": 83.35, "elapsed_time": "14:44:06", "remaining_time": "2:56:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1443, "total_steps": 1730, "loss": 0.7828, "learning_rate": 1.6768111465592312e-06, "epoch": 1.6670036101083032, "percentage": 83.41, "elapsed_time": "14:44:40", "remaining_time": "2:55:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1444, "total_steps": 1730, "loss": 0.7847, "learning_rate": 1.6666614198992625e-06, "epoch": 1.668158844765343, "percentage": 83.47, "elapsed_time": "14:45:14", "remaining_time": "2:55:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1445, "total_steps": 1730, "loss": 0.7757, "learning_rate": 1.6565271317396156e-06, "epoch": 1.6693140794223826, "percentage": 83.53, "elapsed_time": "14:45:48", "remaining_time": "2:54:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1446, "total_steps": 1730, "loss": 0.756, "learning_rate": 1.6464084697726532e-06, "epoch": 1.6704693140794222, "percentage": 83.58, "elapsed_time": "14:46:22", "remaining_time": "2:54:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1447, "total_steps": 1730, "loss": 0.7701, "learning_rate": 1.636305621401335e-06, "epoch": 1.671624548736462, "percentage": 83.64, "elapsed_time": "14:46:56", "remaining_time": "2:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1448, "total_steps": 1730, "loss": 0.8012, "learning_rate": 1.626218773735742e-06, "epoch": 1.6727797833935019, "percentage": 83.7, "elapsed_time": "14:47:29", "remaining_time": "2:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1449, "total_steps": 1730, "loss": 0.7796, "learning_rate": 1.6161481135896154e-06, "epoch": 1.6739350180505417, "percentage": 83.76, "elapsed_time": "14:48:03", "remaining_time": "2:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1450, "total_steps": 1730, "loss": 0.7584, "learning_rate": 1.606093827476895e-06, "epoch": 1.6750902527075813, "percentage": 83.82, "elapsed_time": "14:48:37", "remaining_time": "2:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1451, "total_steps": 1730, "loss": 0.7812, "learning_rate": 1.5960561016082638e-06, "epoch": 1.6762454873646209, "percentage": 83.87, "elapsed_time": "14:49:11", "remaining_time": "2:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1452, "total_steps": 1730, "loss": 0.7642, "learning_rate": 1.5860351218877021e-06, "epoch": 1.6774007220216607, "percentage": 83.93, "elapsed_time": "14:49:45", "remaining_time": "2:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1453, "total_steps": 1730, "loss": 0.7838, "learning_rate": 1.5760310739090402e-06, "epoch": 1.6785559566787005, "percentage": 83.99, "elapsed_time": "14:50:19", "remaining_time": "2:49:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1454, "total_steps": 1730, "loss": 0.7713, "learning_rate": 1.5660441429525258e-06, "epoch": 1.67971119133574, "percentage": 84.05, "elapsed_time": "14:50:53", "remaining_time": "2:49:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1455, "total_steps": 1730, "loss": 0.8022, "learning_rate": 1.556074513981389e-06, "epoch": 1.6808664259927797, "percentage": 84.1, "elapsed_time": "14:51:27", "remaining_time": "2:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1456, "total_steps": 1730, "loss": 0.7794, "learning_rate": 1.5461223716384196e-06, "epoch": 1.6820216606498195, "percentage": 84.16, "elapsed_time": "14:52:01", "remaining_time": "2:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1457, "total_steps": 1730, "loss": 0.8067, "learning_rate": 1.5361879002425432e-06, "epoch": 1.6831768953068593, "percentage": 84.22, "elapsed_time": "14:52:35", "remaining_time": "2:47:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1458, "total_steps": 1730, "loss": 0.7497, "learning_rate": 1.5262712837854139e-06, "epoch": 1.684332129963899, "percentage": 84.28, "elapsed_time": "14:53:09", "remaining_time": "2:46:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1459, "total_steps": 1730, "loss": 0.7645, "learning_rate": 1.5163727059279972e-06, "epoch": 1.6854873646209385, "percentage": 84.34, "elapsed_time": "14:53:43", "remaining_time": "2:46:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1460, "total_steps": 1730, "loss": 0.7698, "learning_rate": 1.506492349997181e-06, "epoch": 1.6866425992779783, "percentage": 84.39, "elapsed_time": "14:54:17", "remaining_time": "2:45:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1461, "total_steps": 1730, "loss": 0.7541, "learning_rate": 1.4966303989823688e-06, "epoch": 1.6877978339350181, "percentage": 84.45, "elapsed_time": "14:54:52", "remaining_time": "2:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1462, "total_steps": 1730, "loss": 0.7611, "learning_rate": 1.4867870355320972e-06, "epoch": 1.6889530685920577, "percentage": 84.51, "elapsed_time": "14:55:26", "remaining_time": "2:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1463, "total_steps": 1730, "loss": 0.7598, "learning_rate": 1.4769624419506507e-06, "epoch": 1.6901083032490973, "percentage": 84.57, "elapsed_time": "14:56:00", "remaining_time": "2:43:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1464, "total_steps": 1730, "loss": 0.7863, "learning_rate": 1.4671568001946851e-06, "epoch": 1.6912635379061371, "percentage": 84.62, "elapsed_time": "14:56:34", "remaining_time": "2:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1465, "total_steps": 1730, "loss": 0.7955, "learning_rate": 1.4573702918698615e-06, "epoch": 1.692418772563177, "percentage": 84.68, "elapsed_time": "14:57:08", "remaining_time": "2:42:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1466, "total_steps": 1730, "loss": 0.7666, "learning_rate": 1.4476030982274746e-06, "epoch": 1.6935740072202166, "percentage": 84.74, "elapsed_time": "14:57:42", "remaining_time": "2:41:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1467, "total_steps": 1730, "loss": 0.747, "learning_rate": 1.4378554001611087e-06, "epoch": 1.6947292418772562, "percentage": 84.8, "elapsed_time": "14:58:16", "remaining_time": "2:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1468, "total_steps": 1730, "loss": 0.7914, "learning_rate": 1.4281273782032696e-06, "epoch": 1.695884476534296, "percentage": 84.86, "elapsed_time": "14:58:50", "remaining_time": "2:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1469, "total_steps": 1730, "loss": 0.7879, "learning_rate": 1.41841921252206e-06, "epoch": 1.6970397111913358, "percentage": 84.91, "elapsed_time": "14:59:24", "remaining_time": "2:39:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1470, "total_steps": 1730, "loss": 0.7707, "learning_rate": 1.4087310829178295e-06, "epoch": 1.6981949458483756, "percentage": 84.97, "elapsed_time": "14:59:57", "remaining_time": "2:39:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1471, "total_steps": 1730, "loss": 0.7753, "learning_rate": 1.3990631688198505e-06, "epoch": 1.6993501805054152, "percentage": 85.03, "elapsed_time": "15:00:32", "remaining_time": "2:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1472, "total_steps": 1730, "loss": 0.7579, "learning_rate": 1.3894156492829932e-06, "epoch": 1.7005054151624548, "percentage": 85.09, "elapsed_time": "15:01:06", "remaining_time": "2:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1473, "total_steps": 1730, "loss": 0.7512, "learning_rate": 1.3797887029844083e-06, "epoch": 1.7016606498194946, "percentage": 85.14, "elapsed_time": "15:01:40", "remaining_time": "2:37:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1474, "total_steps": 1730, "loss": 0.772, "learning_rate": 1.3701825082202227e-06, "epoch": 1.7028158844765344, "percentage": 85.2, "elapsed_time": "15:02:14", "remaining_time": "2:36:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1475, "total_steps": 1730, "loss": 0.766, "learning_rate": 1.3605972429022308e-06, "epoch": 1.703971119133574, "percentage": 85.26, "elapsed_time": "15:02:48", "remaining_time": "2:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1476, "total_steps": 1730, "loss": 0.7638, "learning_rate": 1.3510330845546029e-06, "epoch": 1.7051263537906136, "percentage": 85.32, "elapsed_time": "15:03:23", "remaining_time": "2:35:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1477, "total_steps": 1730, "loss": 0.7572, "learning_rate": 1.3414902103105984e-06, "epoch": 1.7062815884476534, "percentage": 85.38, "elapsed_time": "15:03:56", "remaining_time": "2:34:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1478, "total_steps": 1730, "loss": 0.7763, "learning_rate": 1.3319687969092844e-06, "epoch": 1.7074368231046932, "percentage": 85.43, "elapsed_time": "15:04:31", "remaining_time": "2:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1479, "total_steps": 1730, "loss": 0.7859, "learning_rate": 1.3224690206922594e-06, "epoch": 1.7085920577617328, "percentage": 85.49, "elapsed_time": "15:05:05", "remaining_time": "2:33:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1480, "total_steps": 1730, "loss": 0.76, "learning_rate": 1.3129910576003918e-06, "epoch": 1.7097472924187724, "percentage": 85.55, "elapsed_time": "15:05:39", "remaining_time": "2:32:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1481, "total_steps": 1730, "loss": 0.7541, "learning_rate": 1.3035350831705581e-06, "epoch": 1.7109025270758123, "percentage": 85.61, "elapsed_time": "15:06:13", "remaining_time": "2:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1482, "total_steps": 1730, "loss": 0.7794, "learning_rate": 1.2941012725323943e-06, "epoch": 1.712057761732852, "percentage": 85.66, "elapsed_time": "15:06:47", "remaining_time": "2:31:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1483, "total_steps": 1730, "loss": 0.789, "learning_rate": 1.2846898004050527e-06, "epoch": 1.7132129963898917, "percentage": 85.72, "elapsed_time": "15:07:21", "remaining_time": "2:31:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1484, "total_steps": 1730, "loss": 0.7704, "learning_rate": 1.2753008410939593e-06, "epoch": 1.7143682310469313, "percentage": 85.78, "elapsed_time": "15:07:55", "remaining_time": "2:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1485, "total_steps": 1730, "loss": 0.7751, "learning_rate": 1.2659345684875971e-06, "epoch": 1.715523465703971, "percentage": 85.84, "elapsed_time": "15:08:29", "remaining_time": "2:29:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1486, "total_steps": 1730, "loss": 0.7721, "learning_rate": 1.2565911560542752e-06, "epoch": 1.716678700361011, "percentage": 85.9, "elapsed_time": "15:09:03", "remaining_time": "2:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1487, "total_steps": 1730, "loss": 0.7638, "learning_rate": 1.2472707768389226e-06, "epoch": 1.7178339350180507, "percentage": 85.95, "elapsed_time": "15:09:37", "remaining_time": "2:28:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1488, "total_steps": 1730, "loss": 0.7898, "learning_rate": 1.2379736034598793e-06, "epoch": 1.7189891696750903, "percentage": 86.01, "elapsed_time": "15:10:10", "remaining_time": "2:28:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1489, "total_steps": 1730, "loss": 0.757, "learning_rate": 1.2286998081057024e-06, "epoch": 1.72014440433213, "percentage": 86.07, "elapsed_time": "15:10:45", "remaining_time": "2:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1490, "total_steps": 1730, "loss": 0.7756, "learning_rate": 1.219449562531973e-06, "epoch": 1.7212996389891697, "percentage": 86.13, "elapsed_time": "15:11:19", "remaining_time": "2:26:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1491, "total_steps": 1730, "loss": 0.7851, "learning_rate": 1.2102230380581221e-06, "epoch": 1.7224548736462095, "percentage": 86.18, "elapsed_time": "15:11:52", "remaining_time": "2:26:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1492, "total_steps": 1730, "loss": 0.7786, "learning_rate": 1.2010204055642504e-06, "epoch": 1.7236101083032491, "percentage": 86.24, "elapsed_time": "15:12:27", "remaining_time": "2:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1493, "total_steps": 1730, "loss": 0.7918, "learning_rate": 1.1918418354879655e-06, "epoch": 1.7247653429602887, "percentage": 86.3, "elapsed_time": "15:13:00", "remaining_time": "2:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1494, "total_steps": 1730, "loss": 0.7797, "learning_rate": 1.1826874978212304e-06, "epoch": 1.7259205776173285, "percentage": 86.36, "elapsed_time": "15:13:34", "remaining_time": "2:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1495, "total_steps": 1730, "loss": 0.7622, "learning_rate": 1.1735575621072076e-06, "epoch": 1.7270758122743683, "percentage": 86.42, "elapsed_time": "15:14:08", "remaining_time": "2:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1496, "total_steps": 1730, "loss": 0.7538, "learning_rate": 1.1644521974371236e-06, "epoch": 1.728231046931408, "percentage": 86.47, "elapsed_time": "15:14:41", "remaining_time": "2:23:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1497, "total_steps": 1730, "loss": 0.7567, "learning_rate": 1.1553715724471356e-06, "epoch": 1.7293862815884475, "percentage": 86.53, "elapsed_time": "15:15:15", "remaining_time": "2:22:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1498, "total_steps": 1730, "loss": 0.763, "learning_rate": 1.146315855315211e-06, "epoch": 1.7305415162454874, "percentage": 86.59, "elapsed_time": "15:15:48", "remaining_time": "2:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1499, "total_steps": 1730, "loss": 0.7519, "learning_rate": 1.1372852137580082e-06, "epoch": 1.7316967509025272, "percentage": 86.65, "elapsed_time": "15:16:22", "remaining_time": "2:21:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 1730, "loss": 0.7704, "learning_rate": 1.1282798150277738e-06, "epoch": 1.7328519855595668, "percentage": 86.71, "elapsed_time": "15:16:56", "remaining_time": "2:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1501, "total_steps": 1730, "loss": 0.8001, "learning_rate": 1.1192998259092428e-06, "epoch": 1.7340072202166064, "percentage": 86.76, "elapsed_time": "15:32:32", "remaining_time": "2:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1502, "total_steps": 1730, "loss": 0.7725, "learning_rate": 1.1103454127165526e-06, "epoch": 1.7351624548736462, "percentage": 86.82, "elapsed_time": "15:33:06", "remaining_time": "2:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1503, "total_steps": 1730, "loss": 0.7227, "learning_rate": 1.1014167412901609e-06, "epoch": 1.736317689530686, "percentage": 86.88, "elapsed_time": "15:33:40", "remaining_time": "2:21:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1504, "total_steps": 1730, "loss": 0.7852, "learning_rate": 1.092513976993772e-06, "epoch": 1.7374729241877256, "percentage": 86.94, "elapsed_time": "15:34:14", "remaining_time": "2:20:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1505, "total_steps": 1730, "loss": 0.7648, "learning_rate": 1.083637284711279e-06, "epoch": 1.7386281588447652, "percentage": 86.99, "elapsed_time": "15:34:49", "remaining_time": "2:19:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1506, "total_steps": 1730, "loss": 0.741, "learning_rate": 1.074786828843705e-06, "epoch": 1.739783393501805, "percentage": 87.05, "elapsed_time": "15:35:23", "remaining_time": "2:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1507, "total_steps": 1730, "loss": 0.7355, "learning_rate": 1.0659627733061643e-06, "epoch": 1.7409386281588448, "percentage": 87.11, "elapsed_time": "15:35:58", "remaining_time": "2:18:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1508, "total_steps": 1730, "loss": 0.8, "learning_rate": 1.0571652815248199e-06, "epoch": 1.7420938628158846, "percentage": 87.17, "elapsed_time": "15:36:32", "remaining_time": "2:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1509, "total_steps": 1730, "loss": 0.7701, "learning_rate": 1.0483945164338617e-06, "epoch": 1.7432490974729242, "percentage": 87.23, "elapsed_time": "15:37:06", "remaining_time": "2:17:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1510, "total_steps": 1730, "loss": 0.7831, "learning_rate": 1.039650640472486e-06, "epoch": 1.7444043321299638, "percentage": 87.28, "elapsed_time": "15:37:40", "remaining_time": "2:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1511, "total_steps": 1730, "loss": 0.7896, "learning_rate": 1.0309338155818906e-06, "epoch": 1.7455595667870036, "percentage": 87.34, "elapsed_time": "15:38:13", "remaining_time": "2:15:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1512, "total_steps": 1730, "loss": 0.7806, "learning_rate": 1.0222442032022705e-06, "epoch": 1.7467148014440435, "percentage": 87.4, "elapsed_time": "15:38:47", "remaining_time": "2:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1513, "total_steps": 1730, "loss": 0.7844, "learning_rate": 1.0135819642698318e-06, "epoch": 1.747870036101083, "percentage": 87.46, "elapsed_time": "15:39:21", "remaining_time": "2:14:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1514, "total_steps": 1730, "loss": 0.7766, "learning_rate": 1.0049472592138105e-06, "epoch": 1.7490252707581226, "percentage": 87.51, "elapsed_time": "15:39:56", "remaining_time": "2:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1515, "total_steps": 1730, "loss": 0.7813, "learning_rate": 9.963402479535004e-07, "epoch": 1.7501805054151625, "percentage": 87.57, "elapsed_time": "15:40:30", "remaining_time": "2:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1516, "total_steps": 1730, "loss": 0.79, "learning_rate": 9.877610898952902e-07, "epoch": 1.7513357400722023, "percentage": 87.63, "elapsed_time": "15:41:04", "remaining_time": "2:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1517, "total_steps": 1730, "loss": 0.7875, "learning_rate": 9.792099439297134e-07, "epoch": 1.7524909747292419, "percentage": 87.69, "elapsed_time": "15:41:38", "remaining_time": "2:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1518, "total_steps": 1730, "loss": 0.7605, "learning_rate": 9.706869684285066e-07, "epoch": 1.7536462093862815, "percentage": 87.75, "elapsed_time": "15:42:13", "remaining_time": "2:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1519, "total_steps": 1730, "loss": 0.7778, "learning_rate": 9.621923212416713e-07, "epoch": 1.7548014440433213, "percentage": 87.8, "elapsed_time": "15:42:46", "remaining_time": "2:10:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1520, "total_steps": 1730, "loss": 0.7881, "learning_rate": 9.53726159694558e-07, "epoch": 1.755956678700361, "percentage": 87.86, "elapsed_time": "15:43:20", "remaining_time": "2:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1521, "total_steps": 1730, "loss": 0.7725, "learning_rate": 9.452886405849418e-07, "epoch": 1.7571119133574007, "percentage": 87.92, "elapsed_time": "15:43:54", "remaining_time": "2:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1522, "total_steps": 1730, "loss": 0.771, "learning_rate": 9.36879920180131e-07, "epoch": 1.7582671480144403, "percentage": 87.98, "elapsed_time": "15:44:29", "remaining_time": "2:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1523, "total_steps": 1730, "loss": 0.7624, "learning_rate": 9.285001542140625e-07, "epoch": 1.75942238267148, "percentage": 88.03, "elapsed_time": "15:45:08", "remaining_time": "2:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1524, "total_steps": 1730, "loss": 0.7763, "learning_rate": 9.201494978844251e-07, "epoch": 1.76057761732852, "percentage": 88.09, "elapsed_time": "15:45:41", "remaining_time": "2:07:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1525, "total_steps": 1730, "loss": 0.7634, "learning_rate": 9.118281058497792e-07, "epoch": 1.7617328519855595, "percentage": 88.15, "elapsed_time": "15:46:16", "remaining_time": "2:07:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1526, "total_steps": 1730, "loss": 0.7501, "learning_rate": 9.03536132226695e-07, "epoch": 1.7628880866425993, "percentage": 88.21, "elapsed_time": "15:46:51", "remaining_time": "2:06:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1527, "total_steps": 1730, "loss": 0.802, "learning_rate": 8.952737305869002e-07, "epoch": 1.764043321299639, "percentage": 88.27, "elapsed_time": "15:47:27", "remaining_time": "2:05:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1528, "total_steps": 1730, "loss": 0.7846, "learning_rate": 8.870410539544322e-07, "epoch": 1.7651985559566787, "percentage": 88.32, "elapsed_time": "15:48:02", "remaining_time": "2:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1529, "total_steps": 1730, "loss": 0.7551, "learning_rate": 8.788382548028056e-07, "epoch": 1.7663537906137186, "percentage": 88.38, "elapsed_time": "15:48:35", "remaining_time": "2:04:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1530, "total_steps": 1730, "loss": 0.7736, "learning_rate": 8.706654850521883e-07, "epoch": 1.7675090252707581, "percentage": 88.44, "elapsed_time": "15:49:09", "remaining_time": "2:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1531, "total_steps": 1730, "loss": 0.7632, "learning_rate": 8.625228960665893e-07, "epoch": 1.7686642599277977, "percentage": 88.5, "elapsed_time": "15:49:43", "remaining_time": "2:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1532, "total_steps": 1730, "loss": 0.7514, "learning_rate": 8.544106386510526e-07, "epoch": 1.7698194945848376, "percentage": 88.55, "elapsed_time": "15:50:16", "remaining_time": "2:02:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1533, "total_steps": 1730, "loss": 0.7741, "learning_rate": 8.463288630488653e-07, "epoch": 1.7709747292418774, "percentage": 88.61, "elapsed_time": "15:50:51", "remaining_time": "2:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1534, "total_steps": 1730, "loss": 0.7721, "learning_rate": 8.382777189387751e-07, "epoch": 1.772129963898917, "percentage": 88.67, "elapsed_time": "15:51:25", "remaining_time": "2:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1535, "total_steps": 1730, "loss": 0.7507, "learning_rate": 8.302573554322192e-07, "epoch": 1.7732851985559566, "percentage": 88.73, "elapsed_time": "15:52:00", "remaining_time": "2:00:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1536, "total_steps": 1730, "loss": 0.7993, "learning_rate": 8.222679210705636e-07, "epoch": 1.7744404332129964, "percentage": 88.79, "elapsed_time": "15:52:33", "remaining_time": "2:00:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1537, "total_steps": 1730, "loss": 0.7536, "learning_rate": 8.143095638223446e-07, "epoch": 1.7755956678700362, "percentage": 88.84, "elapsed_time": "15:53:07", "remaining_time": "1:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1538, "total_steps": 1730, "loss": 0.7552, "learning_rate": 8.063824310805396e-07, "epoch": 1.7767509025270758, "percentage": 88.9, "elapsed_time": "15:53:40", "remaining_time": "1:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1539, "total_steps": 1730, "loss": 0.7845, "learning_rate": 7.984866696598284e-07, "epoch": 1.7779061371841154, "percentage": 88.96, "elapsed_time": "15:54:14", "remaining_time": "1:58:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1540, "total_steps": 1730, "loss": 0.7674, "learning_rate": 7.906224257938796e-07, "epoch": 1.7790613718411552, "percentage": 89.02, "elapsed_time": "15:54:48", "remaining_time": "1:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1541, "total_steps": 1730, "loss": 0.7637, "learning_rate": 7.827898451326386e-07, "epoch": 1.780216606498195, "percentage": 89.08, "elapsed_time": "15:55:21", "remaining_time": "1:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1542, "total_steps": 1730, "loss": 0.7754, "learning_rate": 7.749890727396312e-07, "epoch": 1.7813718411552346, "percentage": 89.13, "elapsed_time": "15:55:55", "remaining_time": "1:56:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1543, "total_steps": 1730, "loss": 0.7751, "learning_rate": 7.672202530892778e-07, "epoch": 1.7825270758122742, "percentage": 89.19, "elapsed_time": "15:56:29", "remaining_time": "1:55:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1544, "total_steps": 1730, "loss": 0.7955, "learning_rate": 7.594835300642188e-07, "epoch": 1.783682310469314, "percentage": 89.25, "elapsed_time": "15:57:02", "remaining_time": "1:55:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1545, "total_steps": 1730, "loss": 0.7713, "learning_rate": 7.517790469526456e-07, "epoch": 1.7848375451263538, "percentage": 89.31, "elapsed_time": "15:57:36", "remaining_time": "1:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1546, "total_steps": 1730, "loss": 0.7888, "learning_rate": 7.441069464456497e-07, "epoch": 1.7859927797833937, "percentage": 89.36, "elapsed_time": "15:58:10", "remaining_time": "1:54:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1547, "total_steps": 1730, "loss": 0.7548, "learning_rate": 7.364673706345822e-07, "epoch": 1.7871480144404333, "percentage": 89.42, "elapsed_time": "15:58:44", "remaining_time": "1:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1548, "total_steps": 1730, "loss": 0.7645, "learning_rate": 7.288604610084172e-07, "epoch": 1.7883032490974728, "percentage": 89.48, "elapsed_time": "15:59:17", "remaining_time": "1:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1549, "total_steps": 1730, "loss": 0.7565, "learning_rate": 7.212863584511341e-07, "epoch": 1.7894584837545127, "percentage": 89.54, "elapsed_time": "15:59:51", "remaining_time": "1:52:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1550, "total_steps": 1730, "loss": 0.7646, "learning_rate": 7.137452032391084e-07, "epoch": 1.7906137184115525, "percentage": 89.6, "elapsed_time": "16:00:25", "remaining_time": "1:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1551, "total_steps": 1730, "loss": 0.7667, "learning_rate": 7.062371350385143e-07, "epoch": 1.791768953068592, "percentage": 89.65, "elapsed_time": "16:00:59", "remaining_time": "1:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1552, "total_steps": 1730, "loss": 0.7848, "learning_rate": 6.987622929027362e-07, "epoch": 1.7929241877256317, "percentage": 89.71, "elapsed_time": "16:01:33", "remaining_time": "1:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1553, "total_steps": 1730, "loss": 0.7667, "learning_rate": 6.913208152697935e-07, "epoch": 1.7940794223826715, "percentage": 89.77, "elapsed_time": "16:02:07", "remaining_time": "1:49:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1554, "total_steps": 1730, "loss": 0.7742, "learning_rate": 6.839128399597784e-07, "epoch": 1.7952346570397113, "percentage": 89.83, "elapsed_time": "16:02:41", "remaining_time": "1:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1555, "total_steps": 1730, "loss": 0.7783, "learning_rate": 6.765385041723024e-07, "epoch": 1.796389891696751, "percentage": 89.88, "elapsed_time": "16:03:15", "remaining_time": "1:48:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1556, "total_steps": 1730, "loss": 0.7737, "learning_rate": 6.691979444839561e-07, "epoch": 1.7975451263537905, "percentage": 89.94, "elapsed_time": "16:03:49", "remaining_time": "1:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1557, "total_steps": 1730, "loss": 0.7767, "learning_rate": 6.618912968457771e-07, "epoch": 1.7987003610108303, "percentage": 90.0, "elapsed_time": "16:04:23", "remaining_time": "1:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1558, "total_steps": 1730, "loss": 0.7607, "learning_rate": 6.546186965807347e-07, "epoch": 1.7998555956678701, "percentage": 90.06, "elapsed_time": "16:04:57", "remaining_time": "1:46:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1559, "total_steps": 1730, "loss": 0.8028, "learning_rate": 6.473802783812225e-07, "epoch": 1.8010108303249097, "percentage": 90.12, "elapsed_time": "16:05:31", "remaining_time": "1:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1560, "total_steps": 1730, "loss": 0.7452, "learning_rate": 6.401761763065661e-07, "epoch": 1.8021660649819493, "percentage": 90.17, "elapsed_time": "16:06:04", "remaining_time": "1:45:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1561, "total_steps": 1730, "loss": 0.7879, "learning_rate": 6.330065237805361e-07, "epoch": 1.8033212996389891, "percentage": 90.23, "elapsed_time": "16:06:38", "remaining_time": "1:44:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1562, "total_steps": 1730, "loss": 0.7687, "learning_rate": 6.258714535888803e-07, "epoch": 1.804476534296029, "percentage": 90.29, "elapsed_time": "16:07:12", "remaining_time": "1:44:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1563, "total_steps": 1730, "loss": 0.7622, "learning_rate": 6.187710978768624e-07, "epoch": 1.8056317689530685, "percentage": 90.35, "elapsed_time": "16:07:46", "remaining_time": "1:43:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1564, "total_steps": 1730, "loss": 0.7863, "learning_rate": 6.117055881468175e-07, "epoch": 1.8067870036101084, "percentage": 90.4, "elapsed_time": "16:08:21", "remaining_time": "1:42:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1565, "total_steps": 1730, "loss": 0.7887, "learning_rate": 6.046750552557139e-07, "epoch": 1.807942238267148, "percentage": 90.46, "elapsed_time": "16:08:54", "remaining_time": "1:42:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1566, "total_steps": 1730, "loss": 0.7687, "learning_rate": 5.976796294127286e-07, "epoch": 1.8090974729241878, "percentage": 90.52, "elapsed_time": "16:09:28", "remaining_time": "1:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1567, "total_steps": 1730, "loss": 0.7705, "learning_rate": 5.907194401768411e-07, "epoch": 1.8102527075812276, "percentage": 90.58, "elapsed_time": "16:10:01", "remaining_time": "1:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1568, "total_steps": 1730, "loss": 0.805, "learning_rate": 5.837946164544276e-07, "epoch": 1.8114079422382672, "percentage": 90.64, "elapsed_time": "16:10:35", "remaining_time": "1:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1569, "total_steps": 1730, "loss": 0.7699, "learning_rate": 5.769052864968768e-07, "epoch": 1.8125631768953068, "percentage": 90.69, "elapsed_time": "16:11:09", "remaining_time": "1:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1570, "total_steps": 1730, "loss": 0.7506, "learning_rate": 5.700515778982142e-07, "epoch": 1.8137184115523466, "percentage": 90.75, "elapsed_time": "16:11:43", "remaining_time": "1:39:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1571, "total_steps": 1730, "loss": 0.7663, "learning_rate": 5.632336175927404e-07, "epoch": 1.8148736462093864, "percentage": 90.81, "elapsed_time": "16:12:17", "remaining_time": "1:38:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1572, "total_steps": 1730, "loss": 0.7555, "learning_rate": 5.564515318526759e-07, "epoch": 1.816028880866426, "percentage": 90.87, "elapsed_time": "16:12:51", "remaining_time": "1:37:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1573, "total_steps": 1730, "loss": 0.7856, "learning_rate": 5.497054462858296e-07, "epoch": 1.8171841155234656, "percentage": 90.92, "elapsed_time": "16:13:25", "remaining_time": "1:37:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1574, "total_steps": 1730, "loss": 0.7755, "learning_rate": 5.429954858332623e-07, "epoch": 1.8183393501805054, "percentage": 90.98, "elapsed_time": "16:13:58", "remaining_time": "1:36:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1575, "total_steps": 1730, "loss": 0.7871, "learning_rate": 5.363217747669843e-07, "epoch": 1.8194945848375452, "percentage": 91.04, "elapsed_time": "16:14:33", "remaining_time": "1:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1576, "total_steps": 1730, "loss": 0.7499, "learning_rate": 5.296844366876441e-07, "epoch": 1.8206498194945848, "percentage": 91.1, "elapsed_time": "16:15:06", "remaining_time": "1:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1577, "total_steps": 1730, "loss": 0.7941, "learning_rate": 5.230835945222463e-07, "epoch": 1.8218050541516244, "percentage": 91.16, "elapsed_time": "16:15:40", "remaining_time": "1:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1578, "total_steps": 1730, "loss": 0.7719, "learning_rate": 5.165193705218699e-07, "epoch": 1.8229602888086642, "percentage": 91.21, "elapsed_time": "16:16:14", "remaining_time": "1:34:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1579, "total_steps": 1730, "loss": 0.7815, "learning_rate": 5.099918862594065e-07, "epoch": 1.824115523465704, "percentage": 91.27, "elapsed_time": "16:16:48", "remaining_time": "1:33:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1580, "total_steps": 1730, "loss": 0.7538, "learning_rate": 5.035012626273094e-07, "epoch": 1.8252707581227436, "percentage": 91.33, "elapsed_time": "16:17:22", "remaining_time": "1:32:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1581, "total_steps": 1730, "loss": 0.764, "learning_rate": 4.970476198353524e-07, "epoch": 1.8264259927797832, "percentage": 91.39, "elapsed_time": "16:17:55", "remaining_time": "1:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1582, "total_steps": 1730, "loss": 0.787, "learning_rate": 4.906310774084055e-07, "epoch": 1.827581227436823, "percentage": 91.45, "elapsed_time": "16:18:29", "remaining_time": "1:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1583, "total_steps": 1730, "loss": 0.7527, "learning_rate": 4.842517541842186e-07, "epoch": 1.8287364620938629, "percentage": 91.5, "elapsed_time": "16:19:03", "remaining_time": "1:30:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1584, "total_steps": 1730, "loss": 0.7639, "learning_rate": 4.779097683112254e-07, "epoch": 1.8298916967509027, "percentage": 91.56, "elapsed_time": "16:19:37", "remaining_time": "1:30:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1585, "total_steps": 1730, "loss": 0.7676, "learning_rate": 4.7160523724634964e-07, "epoch": 1.8310469314079423, "percentage": 91.62, "elapsed_time": "16:20:11", "remaining_time": "1:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1586, "total_steps": 1730, "loss": 0.7805, "learning_rate": 4.653382777528332e-07, "epoch": 1.8322021660649819, "percentage": 91.68, "elapsed_time": "16:20:45", "remaining_time": "1:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1587, "total_steps": 1730, "loss": 0.7578, "learning_rate": 4.5910900589807164e-07, "epoch": 1.8333574007220217, "percentage": 91.73, "elapsed_time": "16:21:19", "remaining_time": "1:28:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1588, "total_steps": 1730, "loss": 0.7816, "learning_rate": 4.5291753705146685e-07, "epoch": 1.8345126353790615, "percentage": 91.79, "elapsed_time": "16:21:54", "remaining_time": "1:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1589, "total_steps": 1730, "loss": 0.7712, "learning_rate": 4.4676398588229044e-07, "epoch": 1.835667870036101, "percentage": 91.85, "elapsed_time": "16:22:28", "remaining_time": "1:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1590, "total_steps": 1730, "loss": 0.7673, "learning_rate": 4.40648466357554e-07, "epoch": 1.8368231046931407, "percentage": 91.91, "elapsed_time": "16:23:02", "remaining_time": "1:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1591, "total_steps": 1730, "loss": 0.7627, "learning_rate": 4.3457109173990736e-07, "epoch": 1.8379783393501805, "percentage": 91.97, "elapsed_time": "16:23:36", "remaining_time": "1:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1592, "total_steps": 1730, "loss": 0.7758, "learning_rate": 4.285319745855341e-07, "epoch": 1.8391335740072203, "percentage": 92.02, "elapsed_time": "16:24:11", "remaining_time": "1:25:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1593, "total_steps": 1730, "loss": 0.7763, "learning_rate": 4.2253122674207165e-07, "epoch": 1.84028880866426, "percentage": 92.08, "elapsed_time": "16:24:45", "remaining_time": "1:24:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1594, "total_steps": 1730, "loss": 0.7873, "learning_rate": 4.165689593465352e-07, "epoch": 1.8414440433212995, "percentage": 92.14, "elapsed_time": "16:25:19", "remaining_time": "1:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1595, "total_steps": 1730, "loss": 0.7517, "learning_rate": 4.1064528282326263e-07, "epoch": 1.8425992779783393, "percentage": 92.2, "elapsed_time": "16:25:52", "remaining_time": "1:23:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1596, "total_steps": 1730, "loss": 0.7715, "learning_rate": 4.047603068818685e-07, "epoch": 1.8437545126353792, "percentage": 92.25, "elapsed_time": "16:26:26", "remaining_time": "1:22:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1597, "total_steps": 1730, "loss": 0.7697, "learning_rate": 3.9891414051521345e-07, "epoch": 1.8449097472924187, "percentage": 92.31, "elapsed_time": "16:27:00", "remaining_time": "1:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1598, "total_steps": 1730, "loss": 0.7651, "learning_rate": 3.93106891997382e-07, "epoch": 1.8460649819494583, "percentage": 92.37, "elapsed_time": "16:27:34", "remaining_time": "1:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1599, "total_steps": 1730, "loss": 0.7862, "learning_rate": 3.8733866888168026e-07, "epoch": 1.8472202166064982, "percentage": 92.43, "elapsed_time": "16:28:08", "remaining_time": "1:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1600, "total_steps": 1730, "loss": 0.7704, "learning_rate": 3.816095779986455e-07, "epoch": 1.848375451263538, "percentage": 92.49, "elapsed_time": "16:28:42", "remaining_time": "1:20:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1601, "total_steps": 1730, "loss": 0.7712, "learning_rate": 3.759197254540624e-07, "epoch": 1.8495306859205776, "percentage": 92.54, "elapsed_time": "16:29:16", "remaining_time": "1:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1602, "total_steps": 1730, "loss": 0.7918, "learning_rate": 3.702692166270027e-07, "epoch": 1.8506859205776174, "percentage": 92.6, "elapsed_time": "16:29:50", "remaining_time": "1:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1603, "total_steps": 1730, "loss": 0.7888, "learning_rate": 3.6465815616787e-07, "epoch": 1.851841155234657, "percentage": 92.66, "elapsed_time": "16:30:24", "remaining_time": "1:18:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1604, "total_steps": 1730, "loss": 0.747, "learning_rate": 3.590866479964664e-07, "epoch": 1.8529963898916968, "percentage": 92.72, "elapsed_time": "16:30:57", "remaining_time": "1:17:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1605, "total_steps": 1730, "loss": 0.7872, "learning_rate": 3.535547953000618e-07, "epoch": 1.8541516245487366, "percentage": 92.77, "elapsed_time": "16:31:31", "remaining_time": "1:17:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1606, "total_steps": 1730, "loss": 0.7748, "learning_rate": 3.4806270053148703e-07, "epoch": 1.8553068592057762, "percentage": 92.83, "elapsed_time": "16:32:06", "remaining_time": "1:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1607, "total_steps": 1730, "loss": 0.7576, "learning_rate": 3.4261046540723424e-07, "epoch": 1.8564620938628158, "percentage": 92.89, "elapsed_time": "16:32:40", "remaining_time": "1:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1608, "total_steps": 1730, "loss": 0.7577, "learning_rate": 3.371981909055759e-07, "epoch": 1.8576173285198556, "percentage": 92.95, "elapsed_time": "16:33:14", "remaining_time": "1:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1609, "total_steps": 1730, "loss": 0.7442, "learning_rate": 3.318259772646901e-07, "epoch": 1.8587725631768954, "percentage": 93.01, "elapsed_time": "16:33:48", "remaining_time": "1:14:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1610, "total_steps": 1730, "loss": 0.7589, "learning_rate": 3.264939239808092e-07, "epoch": 1.859927797833935, "percentage": 93.06, "elapsed_time": "16:34:21", "remaining_time": "1:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1611, "total_steps": 1730, "loss": 0.768, "learning_rate": 3.2120212980637286e-07, "epoch": 1.8610830324909746, "percentage": 93.12, "elapsed_time": "16:34:55", "remaining_time": "1:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1612, "total_steps": 1730, "loss": 0.7603, "learning_rate": 3.1595069274820076e-07, "epoch": 1.8622382671480144, "percentage": 93.18, "elapsed_time": "16:35:28", "remaining_time": "1:12:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1613, "total_steps": 1730, "loss": 0.7814, "learning_rate": 3.1073971006567867e-07, "epoch": 1.8633935018050543, "percentage": 93.24, "elapsed_time": "16:36:03", "remaining_time": "1:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1614, "total_steps": 1730, "loss": 0.7667, "learning_rate": 3.055692782689551e-07, "epoch": 1.8645487364620938, "percentage": 93.29, "elapsed_time": "16:36:36", "remaining_time": "1:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1615, "total_steps": 1730, "loss": 0.7826, "learning_rate": 3.0043949311715463e-07, "epoch": 1.8657039711191334, "percentage": 93.35, "elapsed_time": "16:37:09", "remaining_time": "1:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1616, "total_steps": 1730, "loss": 0.7678, "learning_rate": 2.953504496166049e-07, "epoch": 1.8668592057761733, "percentage": 93.41, "elapsed_time": "16:37:43", "remaining_time": "1:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1617, "total_steps": 1730, "loss": 0.7751, "learning_rate": 2.903022420190769e-07, "epoch": 1.868014440433213, "percentage": 93.47, "elapsed_time": "16:38:17", "remaining_time": "1:09:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1618, "total_steps": 1730, "loss": 0.7799, "learning_rate": 2.8529496382003895e-07, "epoch": 1.8691696750902527, "percentage": 93.53, "elapsed_time": "16:38:51", "remaining_time": "1:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1619, "total_steps": 1730, "loss": 0.7723, "learning_rate": 2.8032870775692436e-07, "epoch": 1.8703249097472923, "percentage": 93.58, "elapsed_time": "16:39:25", "remaining_time": "1:08:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1620, "total_steps": 1730, "loss": 0.7635, "learning_rate": 2.75403565807417e-07, "epoch": 1.871480144404332, "percentage": 93.64, "elapsed_time": "16:39:58", "remaining_time": "1:07:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1621, "total_steps": 1730, "loss": 0.7605, "learning_rate": 2.705196291877439e-07, "epoch": 1.872635379061372, "percentage": 93.7, "elapsed_time": "16:40:32", "remaining_time": "1:07:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1622, "total_steps": 1730, "loss": 0.7815, "learning_rate": 2.6567698835098765e-07, "epoch": 1.8737906137184117, "percentage": 93.76, "elapsed_time": "16:41:06", "remaining_time": "1:06:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1623, "total_steps": 1730, "loss": 0.759, "learning_rate": 2.608757329854116e-07, "epoch": 1.8749458483754513, "percentage": 93.82, "elapsed_time": "16:41:40", "remaining_time": "1:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1624, "total_steps": 1730, "loss": 0.7847, "learning_rate": 2.561159520127993e-07, "epoch": 1.876101083032491, "percentage": 93.87, "elapsed_time": "16:42:13", "remaining_time": "1:05:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1625, "total_steps": 1730, "loss": 0.7734, "learning_rate": 2.5139773358680497e-07, "epoch": 1.8772563176895307, "percentage": 93.93, "elapsed_time": "16:42:47", "remaining_time": "1:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1626, "total_steps": 1730, "loss": 0.7627, "learning_rate": 2.467211650913235e-07, "epoch": 1.8784115523465705, "percentage": 93.99, "elapsed_time": "16:43:21", "remaining_time": "1:04:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1627, "total_steps": 1730, "loss": 0.8107, "learning_rate": 2.4208633313887026e-07, "epoch": 1.8795667870036101, "percentage": 94.05, "elapsed_time": "16:43:55", "remaining_time": "1:03:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1628, "total_steps": 1730, "loss": 0.7739, "learning_rate": 2.3749332356897935e-07, "epoch": 1.8807220216606497, "percentage": 94.1, "elapsed_time": "16:44:28", "remaining_time": "1:02:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1629, "total_steps": 1730, "loss": 0.778, "learning_rate": 2.3294222144661086e-07, "epoch": 1.8818772563176895, "percentage": 94.16, "elapsed_time": "16:45:03", "remaining_time": "1:02:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1630, "total_steps": 1730, "loss": 0.7772, "learning_rate": 2.2843311106057757e-07, "epoch": 1.8830324909747294, "percentage": 94.22, "elapsed_time": "16:45:36", "remaining_time": "1:01:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1631, "total_steps": 1730, "loss": 0.7631, "learning_rate": 2.2396607592198304e-07, "epoch": 1.884187725631769, "percentage": 94.28, "elapsed_time": "16:46:10", "remaining_time": "1:01:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1632, "total_steps": 1730, "loss": 0.7966, "learning_rate": 2.1954119876267445e-07, "epoch": 1.8853429602888085, "percentage": 94.34, "elapsed_time": "16:46:44", "remaining_time": "1:00:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1633, "total_steps": 1730, "loss": 0.7685, "learning_rate": 2.1515856153371186e-07, "epoch": 1.8864981949458484, "percentage": 94.39, "elapsed_time": "16:47:18", "remaining_time": "0:59:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1634, "total_steps": 1730, "loss": 0.7807, "learning_rate": 2.108182454038492e-07, "epoch": 1.8876534296028882, "percentage": 94.45, "elapsed_time": "16:47:52", "remaining_time": "0:59:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1635, "total_steps": 1730, "loss": 0.7761, "learning_rate": 2.065203307580309e-07, "epoch": 1.8888086642599278, "percentage": 94.51, "elapsed_time": "16:48:27", "remaining_time": "0:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1636, "total_steps": 1730, "loss": 0.7619, "learning_rate": 2.0226489719590362e-07, "epoch": 1.8899638989169674, "percentage": 94.57, "elapsed_time": "16:49:00", "remaining_time": "0:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1637, "total_steps": 1730, "loss": 0.7587, "learning_rate": 1.9805202353034296e-07, "epoch": 1.8911191335740072, "percentage": 94.62, "elapsed_time": "16:49:34", "remaining_time": "0:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1638, "total_steps": 1730, "loss": 0.7739, "learning_rate": 1.9388178778599145e-07, "epoch": 1.892274368231047, "percentage": 94.68, "elapsed_time": "16:50:08", "remaining_time": "0:56:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1639, "total_steps": 1730, "loss": 0.7671, "learning_rate": 1.8975426719781569e-07, "epoch": 1.8934296028880866, "percentage": 94.74, "elapsed_time": "16:50:42", "remaining_time": "0:56:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1640, "total_steps": 1730, "loss": 0.7873, "learning_rate": 1.85669538209674e-07, "epoch": 1.8945848375451262, "percentage": 94.8, "elapsed_time": "16:51:15", "remaining_time": "0:55:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1641, "total_steps": 1730, "loss": 0.7698, "learning_rate": 1.816276764729035e-07, "epoch": 1.895740072202166, "percentage": 94.86, "elapsed_time": "16:51:49", "remaining_time": "0:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1642, "total_steps": 1730, "loss": 0.7851, "learning_rate": 1.7762875684491536e-07, "epoch": 1.8968953068592058, "percentage": 94.91, "elapsed_time": "16:52:23", "remaining_time": "0:54:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1643, "total_steps": 1730, "loss": 0.7699, "learning_rate": 1.7367285338781114e-07, "epoch": 1.8980505415162456, "percentage": 94.97, "elapsed_time": "16:52:57", "remaining_time": "0:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1644, "total_steps": 1730, "loss": 0.7768, "learning_rate": 1.6976003936701042e-07, "epoch": 1.8992057761732852, "percentage": 95.03, "elapsed_time": "16:53:31", "remaining_time": "0:53:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1645, "total_steps": 1730, "loss": 0.7931, "learning_rate": 1.6589038724989278e-07, "epoch": 1.9003610108303248, "percentage": 95.09, "elapsed_time": "16:54:05", "remaining_time": "0:52:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1646, "total_steps": 1730, "loss": 0.7533, "learning_rate": 1.6206396870445796e-07, "epoch": 1.9015162454873646, "percentage": 95.14, "elapsed_time": "16:54:38", "remaining_time": "0:51:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1647, "total_steps": 1730, "loss": 0.7875, "learning_rate": 1.582808545979954e-07, "epoch": 1.9026714801444045, "percentage": 95.2, "elapsed_time": "16:55:12", "remaining_time": "0:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1648, "total_steps": 1730, "loss": 0.7561, "learning_rate": 1.5454111499577497e-07, "epoch": 1.903826714801444, "percentage": 95.26, "elapsed_time": "16:55:46", "remaining_time": "0:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1649, "total_steps": 1730, "loss": 0.7695, "learning_rate": 1.5084481915974666e-07, "epoch": 1.9049819494584836, "percentage": 95.32, "elapsed_time": "16:56:20", "remaining_time": "0:49:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1650, "total_steps": 1730, "loss": 0.7765, "learning_rate": 1.471920355472605e-07, "epoch": 1.9061371841155235, "percentage": 95.38, "elapsed_time": "16:56:54", "remaining_time": "0:49:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1651, "total_steps": 1730, "loss": 0.8193, "learning_rate": 1.4358283180979607e-07, "epoch": 1.9072924187725633, "percentage": 95.43, "elapsed_time": "16:57:28", "remaining_time": "0:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1652, "total_steps": 1730, "loss": 0.8001, "learning_rate": 1.4001727479171022e-07, "epoch": 1.9084476534296029, "percentage": 95.49, "elapsed_time": "16:58:02", "remaining_time": "0:48:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1653, "total_steps": 1730, "loss": 0.7714, "learning_rate": 1.3649543052900035e-07, "epoch": 1.9096028880866425, "percentage": 95.55, "elapsed_time": "16:58:36", "remaining_time": "0:47:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1654, "total_steps": 1730, "loss": 0.7906, "learning_rate": 1.3301736424808105e-07, "epoch": 1.9107581227436823, "percentage": 95.61, "elapsed_time": "16:59:10", "remaining_time": "0:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1655, "total_steps": 1730, "loss": 0.7643, "learning_rate": 1.295831403645745e-07, "epoch": 1.911913357400722, "percentage": 95.66, "elapsed_time": "16:59:45", "remaining_time": "0:46:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1656, "total_steps": 1730, "loss": 0.8194, "learning_rate": 1.2619282248211896e-07, "epoch": 1.9130685920577617, "percentage": 95.72, "elapsed_time": "17:00:18", "remaining_time": "0:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1657, "total_steps": 1730, "loss": 0.753, "learning_rate": 1.2284647339118997e-07, "epoch": 1.9142238267148013, "percentage": 95.78, "elapsed_time": "17:00:52", "remaining_time": "0:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1658, "total_steps": 1730, "loss": 0.7659, "learning_rate": 1.1954415506793914e-07, "epoch": 1.915379061371841, "percentage": 95.84, "elapsed_time": "17:01:26", "remaining_time": "0:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1659, "total_steps": 1730, "loss": 0.7673, "learning_rate": 1.1628592867304393e-07, "epoch": 1.916534296028881, "percentage": 95.9, "elapsed_time": "17:02:00", "remaining_time": "0:43:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1660, "total_steps": 1730, "loss": 0.7703, "learning_rate": 1.1307185455057616e-07, "epoch": 1.9176895306859207, "percentage": 95.95, "elapsed_time": "17:02:35", "remaining_time": "0:43:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1661, "total_steps": 1730, "loss": 0.7839, "learning_rate": 1.0990199222688366e-07, "epoch": 1.9188447653429603, "percentage": 96.01, "elapsed_time": "17:03:09", "remaining_time": "0:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1662, "total_steps": 1730, "loss": 0.7723, "learning_rate": 1.0677640040949089e-07, "epoch": 1.92, "percentage": 96.07, "elapsed_time": "17:03:43", "remaining_time": "0:41:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1663, "total_steps": 1730, "loss": 0.7699, "learning_rate": 1.0369513698600607e-07, "epoch": 1.9211552346570397, "percentage": 96.13, "elapsed_time": "17:04:18", "remaining_time": "0:41:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1664, "total_steps": 1730, "loss": 0.7736, "learning_rate": 1.0065825902305331e-07, "epoch": 1.9223104693140796, "percentage": 96.18, "elapsed_time": "17:04:51", "remaining_time": "0:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1665, "total_steps": 1730, "loss": 0.7661, "learning_rate": 9.766582276521622e-08, "epoch": 1.9234657039711192, "percentage": 96.24, "elapsed_time": "17:05:25", "remaining_time": "0:40:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1666, "total_steps": 1730, "loss": 0.7723, "learning_rate": 9.471788363399199e-08, "epoch": 1.9246209386281588, "percentage": 96.3, "elapsed_time": "17:05:59", "remaining_time": "0:39:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1667, "total_steps": 1730, "loss": 0.7702, "learning_rate": 9.181449622676956e-08, "epoch": 1.9257761732851986, "percentage": 96.36, "elapsed_time": "17:06:32", "remaining_time": "0:38:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1668, "total_steps": 1730, "loss": 0.7538, "learning_rate": 8.8955714315814e-08, "epoch": 1.9269314079422384, "percentage": 96.42, "elapsed_time": "17:07:06", "remaining_time": "0:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1669, "total_steps": 1730, "loss": 0.7792, "learning_rate": 8.614159084727651e-08, "epoch": 1.928086642599278, "percentage": 96.47, "elapsed_time": "17:07:40", "remaining_time": "0:37:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1670, "total_steps": 1730, "loss": 0.7423, "learning_rate": 8.337217794020758e-08, "epoch": 1.9292418772563176, "percentage": 96.53, "elapsed_time": "17:08:14", "remaining_time": "0:36:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1671, "total_steps": 1730, "loss": 0.7549, "learning_rate": 8.064752688559553e-08, "epoch": 1.9303971119133574, "percentage": 96.59, "elapsed_time": "17:08:48", "remaining_time": "0:36:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1672, "total_steps": 1730, "loss": 0.7845, "learning_rate": 7.796768814541562e-08, "epoch": 1.9315523465703972, "percentage": 96.65, "elapsed_time": "17:09:22", "remaining_time": "0:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1673, "total_steps": 1730, "loss": 0.7706, "learning_rate": 7.533271135169531e-08, "epoch": 1.9327075812274368, "percentage": 96.71, "elapsed_time": "17:09:56", "remaining_time": "0:35:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1674, "total_steps": 1730, "loss": 0.7794, "learning_rate": 7.274264530559488e-08, "epoch": 1.9338628158844764, "percentage": 96.76, "elapsed_time": "17:10:30", "remaining_time": "0:34:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1675, "total_steps": 1730, "loss": 0.7515, "learning_rate": 7.019753797650377e-08, "epoch": 1.9350180505415162, "percentage": 96.82, "elapsed_time": "17:11:03", "remaining_time": "0:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1676, "total_steps": 1730, "loss": 0.7852, "learning_rate": 6.769743650115355e-08, "epoch": 1.936173285198556, "percentage": 96.88, "elapsed_time": "17:11:38", "remaining_time": "0:33:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1677, "total_steps": 1730, "loss": 0.7451, "learning_rate": 6.524238718274186e-08, "epoch": 1.9373285198555956, "percentage": 96.94, "elapsed_time": "17:12:11", "remaining_time": "0:32:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1678, "total_steps": 1730, "loss": 0.7679, "learning_rate": 6.283243549007756e-08, "epoch": 1.9384837545126352, "percentage": 96.99, "elapsed_time": "17:12:45", "remaining_time": "0:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1679, "total_steps": 1730, "loss": 0.7619, "learning_rate": 6.046762605673734e-08, "epoch": 1.939638989169675, "percentage": 97.05, "elapsed_time": "17:13:19", "remaining_time": "0:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1680, "total_steps": 1730, "loss": 0.7792, "learning_rate": 5.814800268024005e-08, "epoch": 1.9407942238267148, "percentage": 97.11, "elapsed_time": "17:13:53", "remaining_time": "0:30:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1681, "total_steps": 1730, "loss": 0.7648, "learning_rate": 5.58736083212344e-08, "epoch": 1.9419494584837547, "percentage": 97.17, "elapsed_time": "17:14:27", "remaining_time": "0:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1682, "total_steps": 1730, "loss": 0.7907, "learning_rate": 5.364448510270387e-08, "epoch": 1.9431046931407943, "percentage": 97.23, "elapsed_time": "17:15:01", "remaining_time": "0:29:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1683, "total_steps": 1730, "loss": 0.7737, "learning_rate": 5.146067430918623e-08, "epoch": 1.9442599277978339, "percentage": 97.28, "elapsed_time": "17:15:34", "remaining_time": "0:28:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1684, "total_steps": 1730, "loss": 0.7746, "learning_rate": 4.932221638601039e-08, "epoch": 1.9454151624548737, "percentage": 97.34, "elapsed_time": "17:16:08", "remaining_time": "0:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1685, "total_steps": 1730, "loss": 0.7547, "learning_rate": 4.722915093854457e-08, "epoch": 1.9465703971119135, "percentage": 97.4, "elapsed_time": "17:16:42", "remaining_time": "0:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1686, "total_steps": 1730, "loss": 0.7786, "learning_rate": 4.518151673146557e-08, "epoch": 1.947725631768953, "percentage": 97.46, "elapsed_time": "17:17:16", "remaining_time": "0:27:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1687, "total_steps": 1730, "loss": 0.7785, "learning_rate": 4.3179351688039386e-08, "epoch": 1.9488808664259927, "percentage": 97.51, "elapsed_time": "17:17:51", "remaining_time": "0:26:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1688, "total_steps": 1730, "loss": 0.7665, "learning_rate": 4.122269288941911e-08, "epoch": 1.9500361010830325, "percentage": 97.57, "elapsed_time": "17:18:25", "remaining_time": "0:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1689, "total_steps": 1730, "loss": 0.7539, "learning_rate": 3.931157657395747e-08, "epoch": 1.9511913357400723, "percentage": 97.63, "elapsed_time": "17:18:58", "remaining_time": "0:25:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1690, "total_steps": 1730, "loss": 0.7962, "learning_rate": 3.744603813653741e-08, "epoch": 1.952346570397112, "percentage": 97.69, "elapsed_time": "17:19:32", "remaining_time": "0:24:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1691, "total_steps": 1730, "loss": 0.7373, "learning_rate": 3.562611212791524e-08, "epoch": 1.9535018050541515, "percentage": 97.75, "elapsed_time": "17:20:06", "remaining_time": "0:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1692, "total_steps": 1730, "loss": 0.7971, "learning_rate": 3.3851832254080314e-08, "epoch": 1.9546570397111913, "percentage": 97.8, "elapsed_time": "17:20:40", "remaining_time": "0:23:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1693, "total_steps": 1730, "loss": 0.746, "learning_rate": 3.212323137563259e-08, "epoch": 1.9558122743682311, "percentage": 97.86, "elapsed_time": "17:21:14", "remaining_time": "0:22:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1694, "total_steps": 1730, "loss": 0.7903, "learning_rate": 3.044034150717202e-08, "epoch": 1.9569675090252707, "percentage": 97.92, "elapsed_time": "17:21:48", "remaining_time": "0:22:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1695, "total_steps": 1730, "loss": 0.7752, "learning_rate": 2.880319381670718e-08, "epoch": 1.9581227436823103, "percentage": 97.98, "elapsed_time": "17:22:21", "remaining_time": "0:21:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1696, "total_steps": 1730, "loss": 0.7453, "learning_rate": 2.721181862507687e-08, "epoch": 1.9592779783393501, "percentage": 98.03, "elapsed_time": "17:22:55", "remaining_time": "0:20:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1697, "total_steps": 1730, "loss": 0.7601, "learning_rate": 2.566624540538925e-08, "epoch": 1.96043321299639, "percentage": 98.09, "elapsed_time": "17:23:29", "remaining_time": "0:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1698, "total_steps": 1730, "loss": 0.7577, "learning_rate": 2.4166502782475928e-08, "epoch": 1.9615884476534298, "percentage": 98.15, "elapsed_time": "17:24:03", "remaining_time": "0:19:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1699, "total_steps": 1730, "loss": 0.7723, "learning_rate": 2.2712618532361902e-08, "epoch": 1.9627436823104694, "percentage": 98.21, "elapsed_time": "17:24:37", "remaining_time": "0:19:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1700, "total_steps": 1730, "loss": 0.7896, "learning_rate": 2.130461958174988e-08, "epoch": 1.963898916967509, "percentage": 98.27, "elapsed_time": "17:25:11", "remaining_time": "0:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1701, "total_steps": 1730, "loss": 0.7587, "learning_rate": 1.9942532007523544e-08, "epoch": 1.9650541516245488, "percentage": 98.32, "elapsed_time": "17:25:44", "remaining_time": "0:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1702, "total_steps": 1730, "loss": 0.7714, "learning_rate": 1.8626381036264058e-08, "epoch": 1.9662093862815886, "percentage": 98.38, "elapsed_time": "17:26:18", "remaining_time": "0:17:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1703, "total_steps": 1730, "loss": 0.7937, "learning_rate": 1.735619104378108e-08, "epoch": 1.9673646209386282, "percentage": 98.44, "elapsed_time": "17:26:53", "remaining_time": "0:16:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1704, "total_steps": 1730, "loss": 0.761, "learning_rate": 1.6131985554663975e-08, "epoch": 1.9685198555956678, "percentage": 98.5, "elapsed_time": "17:27:27", "remaining_time": "0:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1705, "total_steps": 1730, "loss": 0.7742, "learning_rate": 1.4953787241843607e-08, "epoch": 1.9696750902527076, "percentage": 98.55, "elapsed_time": "17:28:00", "remaining_time": "0:15:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1706, "total_steps": 1730, "loss": 0.7489, "learning_rate": 1.382161792617522e-08, "epoch": 1.9708303249097474, "percentage": 98.61, "elapsed_time": "17:28:34", "remaining_time": "0:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1707, "total_steps": 1730, "loss": 0.7927, "learning_rate": 1.273549857603129e-08, "epoch": 1.971985559566787, "percentage": 98.67, "elapsed_time": "17:29:07", "remaining_time": "0:14:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1708, "total_steps": 1730, "loss": 0.7603, "learning_rate": 1.16954493069155e-08, "epoch": 1.9731407942238266, "percentage": 98.73, "elapsed_time": "17:29:40", "remaining_time": "0:13:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1709, "total_steps": 1730, "loss": 0.7886, "learning_rate": 1.0701489381089175e-08, "epoch": 1.9742960288808664, "percentage": 98.79, "elapsed_time": "17:30:13", "remaining_time": "0:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1710, "total_steps": 1730, "loss": 0.7837, "learning_rate": 9.753637207214111e-09, "epoch": 1.9754512635379062, "percentage": 98.84, "elapsed_time": "17:30:47", "remaining_time": "0:12:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1711, "total_steps": 1730, "loss": 0.7449, "learning_rate": 8.85191034001343e-09, "epoch": 1.9766064981949458, "percentage": 98.9, "elapsed_time": "17:31:20", "remaining_time": "0:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1712, "total_steps": 1730, "loss": 0.7825, "learning_rate": 7.996325479943542e-09, "epoch": 1.9777617328519854, "percentage": 98.96, "elapsed_time": "17:31:54", "remaining_time": "0:11:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1713, "total_steps": 1730, "loss": 0.7702, "learning_rate": 7.186898472888319e-09, "epoch": 1.9789169675090252, "percentage": 99.02, "elapsed_time": "17:32:27", "remaining_time": "0:10:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1714, "total_steps": 1730, "loss": 0.7662, "learning_rate": 6.423644309862407e-09, "epoch": 1.980072202166065, "percentage": 99.08, "elapsed_time": "17:33:01", "remaining_time": "0:09:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1715, "total_steps": 1730, "loss": 0.794, "learning_rate": 5.706577126735919e-09, "epoch": 1.9812274368231046, "percentage": 99.13, "elapsed_time": "17:33:35", "remaining_time": "0:09:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1716, "total_steps": 1730, "loss": 0.7874, "learning_rate": 5.035710203971343e-09, "epoch": 1.9823826714801442, "percentage": 99.19, "elapsed_time": "17:34:08", "remaining_time": "0:08:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1717, "total_steps": 1730, "loss": 0.7666, "learning_rate": 4.411055966378209e-09, "epoch": 1.983537906137184, "percentage": 99.25, "elapsed_time": "17:34:42", "remaining_time": "0:07:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1718, "total_steps": 1730, "loss": 0.7824, "learning_rate": 3.832625982882452e-09, "epoch": 1.9846931407942239, "percentage": 99.31, "elapsed_time": "17:35:16", "remaining_time": "0:07:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1719, "total_steps": 1730, "loss": 0.7451, "learning_rate": 3.300430966312174e-09, "epoch": 1.9858483754512637, "percentage": 99.36, "elapsed_time": "17:35:50", "remaining_time": "0:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1720, "total_steps": 1730, "loss": 0.7673, "learning_rate": 2.8144807732005904e-09, "epoch": 1.9870036101083033, "percentage": 99.42, "elapsed_time": "17:36:24", "remaining_time": "0:06:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1721, "total_steps": 1730, "loss": 0.7823, "learning_rate": 2.374784403601199e-09, "epoch": 1.9881588447653429, "percentage": 99.48, "elapsed_time": "17:36:58", "remaining_time": "0:05:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1722, "total_steps": 1730, "loss": 0.7676, "learning_rate": 1.9813500009229292e-09, "epoch": 1.9893140794223827, "percentage": 99.54, "elapsed_time": "17:37:31", "remaining_time": "0:04:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1723, "total_steps": 1730, "loss": 0.7937, "learning_rate": 1.634184851778611e-09, "epoch": 1.9904693140794225, "percentage": 99.6, "elapsed_time": "17:38:05", "remaining_time": "0:04:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1724, "total_steps": 1730, "loss": 0.7666, "learning_rate": 1.3332953858495395e-09, "epoch": 1.991624548736462, "percentage": 99.65, "elapsed_time": "17:38:39", "remaining_time": "0:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1725, "total_steps": 1730, "loss": 0.7796, "learning_rate": 1.0786871757678059e-09, "epoch": 1.9927797833935017, "percentage": 99.71, "elapsed_time": "17:39:13", "remaining_time": "0:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1726, "total_steps": 1730, "loss": 0.738, "learning_rate": 8.703649370116684e-10, "epoch": 1.9939350180505415, "percentage": 99.77, "elapsed_time": "17:39:46", "remaining_time": "0:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1727, "total_steps": 1730, "loss": 0.7633, "learning_rate": 7.083325278189627e-10, "epoch": 1.9950902527075813, "percentage": 99.83, "elapsed_time": "17:40:20", "remaining_time": "0:01:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1728, "total_steps": 1730, "loss": 0.769, "learning_rate": 5.925929491152231e-10, "epoch": 1.996245487364621, "percentage": 99.88, "elapsed_time": "17:40:54", "remaining_time": "0:01:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1729, "total_steps": 1730, "loss": 0.7676, "learning_rate": 5.231483444587321e-10, "epoch": 1.9974007220216605, "percentage": 99.94, "elapsed_time": "17:41:27", "remaining_time": "0:00:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1730, "total_steps": 1730, "loss": 0.7958, "learning_rate": 5e-10, "epoch": 1.9985559566787003, "percentage": 100.0, "elapsed_time": "17:42:01", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1730, "total_steps": 1730, "epoch": 1.9985559566787003, "percentage": 100.0, "elapsed_time": "17:55:34", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}