{"current_steps": 1, "total_steps": 1424, "loss": 0.6911, "accuracy": 0.125, "learning_rate": 0.0, "epoch": 0.000702000702000702, "percentage": 0.07, "elapsed_time": "0:00:06", "remaining_time": "2:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2, "total_steps": 1424, "loss": 0.6857, "accuracy": 0.625, "learning_rate": 5.017166594399687e-06, "epoch": 0.001404001404001404, "percentage": 0.14, "elapsed_time": "0:00:12", "remaining_time": "2:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3, "total_steps": 1424, "loss": 0.6806, "accuracy": 0.5, "learning_rate": 7.952020911994375e-06, "epoch": 0.002106002106002106, "percentage": 0.21, "elapsed_time": "0:00:18", "remaining_time": "2:27:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4, "total_steps": 1424, "loss": 0.6914, "accuracy": 0.625, "learning_rate": 1.0034333188799373e-05, "epoch": 0.002808002808002808, "percentage": 0.28, "elapsed_time": "0:00:22", "remaining_time": "2:15:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5, "total_steps": 1424, "loss": 0.6849, "accuracy": 0.625, "learning_rate": 1.164950007226698e-05, "epoch": 0.00351000351000351, "percentage": 0.35, "elapsed_time": "0:00:27", "remaining_time": "2:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6, "total_steps": 1424, "loss": 0.6928, "accuracy": 0.25, "learning_rate": 1.2969187506394062e-05, "epoch": 0.004212004212004212, "percentage": 0.42, "elapsed_time": "0:00:31", "remaining_time": "2:03:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7, "total_steps": 1424, "loss": 0.6741, "accuracy": 0.375, "learning_rate": 1.4084967333570947e-05, "epoch": 0.004914004914004914, "percentage": 0.49, "elapsed_time": "0:00:35", "remaining_time": "1:59:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8, "total_steps": 1424, "loss": 0.6724, "accuracy": 0.625, "learning_rate": 1.505149978319906e-05, "epoch": 0.005616005616005616, "percentage": 0.56, "elapsed_time": "0:00:39", "remaining_time": "1:57:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9, "total_steps": 1424, "loss": 0.6699, "accuracy": 0.375, "learning_rate": 1.590404182398875e-05, "epoch": 0.006318006318006318, "percentage": 0.63, "elapsed_time": "0:00:43", "remaining_time": "1:54:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10, "total_steps": 1424, "loss": 0.655, "accuracy": 0.5, "learning_rate": 1.666666666666667e-05, "epoch": 0.00702000702000702, "percentage": 0.7, "elapsed_time": "0:00:47", "remaining_time": "1:53:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11, "total_steps": 1424, "loss": 0.6514, "accuracy": 0.75, "learning_rate": 1.7356544752637084e-05, "epoch": 0.007722007722007722, "percentage": 0.77, "elapsed_time": "0:00:52", "remaining_time": "1:51:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12, "total_steps": 1424, "loss": 0.6501, "accuracy": 0.75, "learning_rate": 1.7986354100793748e-05, "epoch": 0.008424008424008424, "percentage": 0.84, "elapsed_time": "0:00:56", "remaining_time": "1:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13, "total_steps": 1424, "loss": 0.6277, "accuracy": 0.75, "learning_rate": 1.8565722538447282e-05, "epoch": 0.009126009126009126, "percentage": 0.91, "elapsed_time": "0:01:00", "remaining_time": "1:49:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14, "total_steps": 1424, "loss": 0.609, "accuracy": 1.0, "learning_rate": 1.9102133927970633e-05, "epoch": 0.009828009828009828, "percentage": 0.98, "elapsed_time": "0:01:04", "remaining_time": "1:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15, "total_steps": 1424, "loss": 0.596, "accuracy": 0.5, "learning_rate": 1.9601520984261358e-05, "epoch": 0.01053001053001053, "percentage": 1.05, "elapsed_time": "0:01:08", "remaining_time": "1:47:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16, "total_steps": 1424, "loss": 0.5662, "accuracy": 0.875, "learning_rate": 2.0068666377598747e-05, "epoch": 0.011232011232011231, "percentage": 1.12, "elapsed_time": "0:01:12", "remaining_time": "1:46:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17, "total_steps": 1424, "loss": 0.5483, "accuracy": 0.75, "learning_rate": 2.0507482022971233e-05, "epoch": 0.011934011934011933, "percentage": 1.19, "elapsed_time": "0:01:16", "remaining_time": "1:46:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18, "total_steps": 1424, "loss": 0.5408, "accuracy": 0.875, "learning_rate": 2.0921208418388435e-05, "epoch": 0.012636012636012635, "percentage": 1.26, "elapsed_time": "0:01:21", "remaining_time": "1:45:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19, "total_steps": 1424, "loss": 0.5102, "accuracy": 0.75, "learning_rate": 2.1312560015880482e-05, "epoch": 0.013338013338013339, "percentage": 1.33, "elapsed_time": "0:01:25", "remaining_time": "1:45:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 1424, "loss": 0.4495, "accuracy": 0.875, "learning_rate": 2.1683833261066357e-05, "epoch": 0.01404001404001404, "percentage": 1.4, "elapsed_time": "0:01:29", "remaining_time": "1:44:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21, "total_steps": 1424, "loss": 0.427, "accuracy": 1.0, "learning_rate": 2.2036988245565324e-05, "epoch": 0.014742014742014743, "percentage": 1.47, "elapsed_time": "0:01:33", "remaining_time": "1:44:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22, "total_steps": 1424, "loss": 0.3929, "accuracy": 0.875, "learning_rate": 2.2373711347036773e-05, "epoch": 0.015444015444015444, "percentage": 1.54, "elapsed_time": "0:01:37", "remaining_time": "1:43:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23, "total_steps": 1424, "loss": 0.3416, "accuracy": 1.0, "learning_rate": 2.269546393362655e-05, "epoch": 0.016146016146016146, "percentage": 1.62, "elapsed_time": "0:01:41", "remaining_time": "1:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24, "total_steps": 1424, "loss": 0.3121, "accuracy": 0.875, "learning_rate": 2.3003520695193437e-05, "epoch": 0.016848016848016848, "percentage": 1.69, "elapsed_time": "0:01:46", "remaining_time": "1:43:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25, "total_steps": 1424, "loss": 0.2714, "accuracy": 0.875, "learning_rate": 2.329900014453396e-05, "epoch": 0.01755001755001755, "percentage": 1.76, "elapsed_time": "0:01:50", "remaining_time": "1:42:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 26, "total_steps": 1424, "loss": 0.2044, "accuracy": 1.0, "learning_rate": 2.3582889132846968e-05, "epoch": 0.018252018252018252, "percentage": 1.83, "elapsed_time": "0:01:54", "remaining_time": "1:42:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 27, "total_steps": 1424, "loss": 0.2197, "accuracy": 1.0, "learning_rate": 2.3856062735983123e-05, "epoch": 0.018954018954018954, "percentage": 1.9, "elapsed_time": "0:01:58", "remaining_time": "1:42:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 28, "total_steps": 1424, "loss": 0.1908, "accuracy": 1.0, "learning_rate": 2.4119300522370322e-05, "epoch": 0.019656019656019656, "percentage": 1.97, "elapsed_time": "0:02:02", "remaining_time": "1:42:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 29, "total_steps": 1424, "loss": 0.1762, "accuracy": 1.0, "learning_rate": 2.4373299964982603e-05, "epoch": 0.020358020358020357, "percentage": 2.04, "elapsed_time": "0:02:06", "remaining_time": "1:41:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 1424, "loss": 0.1351, "accuracy": 1.0, "learning_rate": 2.4618687578661044e-05, "epoch": 0.02106002106002106, "percentage": 2.11, "elapsed_time": "0:02:11", "remaining_time": "1:41:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 31, "total_steps": 1424, "loss": 0.0867, "accuracy": 1.0, "learning_rate": 2.4856028230571212e-05, "epoch": 0.02176202176202176, "percentage": 2.18, "elapsed_time": "0:02:15", "remaining_time": "1:41:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 32, "total_steps": 1424, "loss": 0.0924, "accuracy": 0.875, "learning_rate": 2.5085832971998436e-05, "epoch": 0.022464022464022463, "percentage": 2.25, "elapsed_time": "0:02:19", "remaining_time": "1:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 33, "total_steps": 1424, "loss": 0.086, "accuracy": 0.75, "learning_rate": 2.530856566463146e-05, "epoch": 0.023166023166023165, "percentage": 2.32, "elapsed_time": "0:02:23", "remaining_time": "1:40:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 34, "total_steps": 1424, "loss": 0.1606, "accuracy": 0.75, "learning_rate": 2.552464861737092e-05, "epoch": 0.023868023868023867, "percentage": 2.39, "elapsed_time": "0:02:27", "remaining_time": "1:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 35, "total_steps": 1424, "loss": 0.12, "accuracy": 1.0, "learning_rate": 2.5734467405837933e-05, "epoch": 0.02457002457002457, "percentage": 2.46, "elapsed_time": "0:02:31", "remaining_time": "1:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 36, "total_steps": 1424, "loss": 0.1591, "accuracy": 1.0, "learning_rate": 2.5938375012788124e-05, "epoch": 0.02527202527202527, "percentage": 2.53, "elapsed_time": "0:02:36", "remaining_time": "1:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 37, "total_steps": 1424, "loss": 0.0715, "accuracy": 1.0, "learning_rate": 2.6136695401116585e-05, "epoch": 0.025974025974025976, "percentage": 2.6, "elapsed_time": "0:02:40", "remaining_time": "1:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 38, "total_steps": 1424, "loss": 0.1467, "accuracy": 1.0, "learning_rate": 2.6329726610280168e-05, "epoch": 0.026676026676026678, "percentage": 2.67, "elapsed_time": "0:02:44", "remaining_time": "1:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 39, "total_steps": 1424, "loss": 0.156, "accuracy": 1.0, "learning_rate": 2.651774345044166e-05, "epoch": 0.02737802737802738, "percentage": 2.74, "elapsed_time": "0:02:48", "remaining_time": "1:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 1424, "loss": 0.0559, "accuracy": 1.0, "learning_rate": 2.6700999855466042e-05, "epoch": 0.02808002808002808, "percentage": 2.81, "elapsed_time": "0:02:52", "remaining_time": "1:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 41, "total_steps": 1424, "loss": 0.0647, "accuracy": 1.0, "learning_rate": 2.687973094532893e-05, "epoch": 0.028782028782028783, "percentage": 2.88, "elapsed_time": "0:02:56", "remaining_time": "1:39:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 42, "total_steps": 1424, "loss": 0.1587, "accuracy": 0.875, "learning_rate": 2.7054154839965013e-05, "epoch": 0.029484029484029485, "percentage": 2.95, "elapsed_time": "0:03:00", "remaining_time": "1:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 43, "total_steps": 1424, "loss": 0.0855, "accuracy": 0.875, "learning_rate": 2.722447425965978e-05, "epoch": 0.030186030186030187, "percentage": 3.02, "elapsed_time": "0:03:05", "remaining_time": "1:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 44, "total_steps": 1424, "loss": 0.0926, "accuracy": 1.0, "learning_rate": 2.739087794143646e-05, "epoch": 0.03088803088803089, "percentage": 3.09, "elapsed_time": "0:03:09", "remaining_time": "1:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 45, "total_steps": 1424, "loss": 0.1445, "accuracy": 0.875, "learning_rate": 2.755354189625573e-05, "epoch": 0.03159003159003159, "percentage": 3.16, "elapsed_time": "0:03:13", "remaining_time": "1:38:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 46, "total_steps": 1424, "loss": 0.1697, "accuracy": 1.0, "learning_rate": 2.771263052802624e-05, "epoch": 0.03229203229203229, "percentage": 3.23, "elapsed_time": "0:03:17", "remaining_time": "1:38:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 47, "total_steps": 1424, "loss": 0.1109, "accuracy": 1.0, "learning_rate": 2.7868297632261957e-05, "epoch": 0.032994032994032994, "percentage": 3.3, "elapsed_time": "0:03:21", "remaining_time": "1:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 48, "total_steps": 1424, "loss": 0.0943, "accuracy": 0.625, "learning_rate": 2.8020687289593123e-05, "epoch": 0.033696033696033696, "percentage": 3.37, "elapsed_time": "0:03:25", "remaining_time": "1:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 49, "total_steps": 1424, "loss": 0.0948, "accuracy": 0.875, "learning_rate": 2.8169934667141895e-05, "epoch": 0.0343980343980344, "percentage": 3.44, "elapsed_time": "0:03:30", "remaining_time": "1:38:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 1424, "loss": 0.0689, "accuracy": 1.0, "learning_rate": 2.8316166738933646e-05, "epoch": 0.0351000351000351, "percentage": 3.51, "elapsed_time": "0:03:34", "remaining_time": "1:38:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 51, "total_steps": 1424, "loss": 0.0881, "accuracy": 1.0, "learning_rate": 2.845950293496561e-05, "epoch": 0.0358020358020358, "percentage": 3.58, "elapsed_time": "0:03:38", "remaining_time": "1:38:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 52, "total_steps": 1424, "loss": 0.0721, "accuracy": 1.0, "learning_rate": 2.8600055727246657e-05, "epoch": 0.036504036504036504, "percentage": 3.65, "elapsed_time": "0:03:42", "remaining_time": "1:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 53, "total_steps": 1424, "loss": 0.0969, "accuracy": 0.875, "learning_rate": 2.8737931160013153e-05, "epoch": 0.037206037206037205, "percentage": 3.72, "elapsed_time": "0:03:46", "remaining_time": "1:37:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 54, "total_steps": 1424, "loss": 0.103, "accuracy": 0.875, "learning_rate": 2.8873229330382812e-05, "epoch": 0.03790803790803791, "percentage": 3.79, "elapsed_time": "0:03:50", "remaining_time": "1:37:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 55, "total_steps": 1424, "loss": 0.0756, "accuracy": 0.875, "learning_rate": 2.9006044824904066e-05, "epoch": 0.03861003861003861, "percentage": 3.86, "elapsed_time": "0:03:55", "remaining_time": "1:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 56, "total_steps": 1424, "loss": 0.0474, "accuracy": 0.875, "learning_rate": 2.913646711677001e-05, "epoch": 0.03931203931203931, "percentage": 3.93, "elapsed_time": "0:03:59", "remaining_time": "1:37:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 57, "total_steps": 1424, "loss": 0.1579, "accuracy": 1.0, "learning_rate": 2.926458092787486e-05, "epoch": 0.04001404001404001, "percentage": 4.0, "elapsed_time": "0:04:03", "remaining_time": "1:37:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 58, "total_steps": 1424, "loss": 0.0666, "accuracy": 1.0, "learning_rate": 2.939046655938229e-05, "epoch": 0.040716040716040715, "percentage": 4.07, "elapsed_time": "0:04:07", "remaining_time": "1:37:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 59, "total_steps": 1424, "loss": 0.0815, "accuracy": 1.0, "learning_rate": 2.951420019403574e-05, "epoch": 0.04141804141804142, "percentage": 4.14, "elapsed_time": "0:04:11", "remaining_time": "1:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 1424, "loss": 0.0711, "accuracy": 1.0, "learning_rate": 2.963585417306073e-05, "epoch": 0.04212004212004212, "percentage": 4.21, "elapsed_time": "0:04:15", "remaining_time": "1:36:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 61, "total_steps": 1424, "loss": 0.0685, "accuracy": 1.0, "learning_rate": 2.9755497250179453e-05, "epoch": 0.04282204282204282, "percentage": 4.28, "elapsed_time": "0:04:19", "remaining_time": "1:36:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 62, "total_steps": 1424, "loss": 0.0731, "accuracy": 0.875, "learning_rate": 2.98731948249709e-05, "epoch": 0.04352404352404352, "percentage": 4.35, "elapsed_time": "0:04:24", "remaining_time": "1:36:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 63, "total_steps": 1424, "loss": 0.078, "accuracy": 1.0, "learning_rate": 2.9989009157559694e-05, "epoch": 0.044226044226044224, "percentage": 4.42, "elapsed_time": "0:04:28", "remaining_time": "1:36:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 64, "total_steps": 1424, "loss": 0.0793, "accuracy": 1.0, "learning_rate": 3.010299956639812e-05, "epoch": 0.044928044928044926, "percentage": 4.49, "elapsed_time": "0:04:32", "remaining_time": "1:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 65, "total_steps": 1424, "loss": 0.0888, "accuracy": 0.875, "learning_rate": 3.021522261071426e-05, "epoch": 0.04563004563004563, "percentage": 4.56, "elapsed_time": "0:04:36", "remaining_time": "1:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 66, "total_steps": 1424, "loss": 0.1086, "accuracy": 1.0, "learning_rate": 3.0325732259031143e-05, "epoch": 0.04633204633204633, "percentage": 4.63, "elapsed_time": "0:04:40", "remaining_time": "1:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 67, "total_steps": 1424, "loss": 0.0762, "accuracy": 1.0, "learning_rate": 3.043458004501377e-05, "epoch": 0.04703404703404703, "percentage": 4.71, "elapsed_time": "0:04:44", "remaining_time": "1:36:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 68, "total_steps": 1424, "loss": 0.0478, "accuracy": 1.0, "learning_rate": 3.054181521177061e-05, "epoch": 0.04773604773604773, "percentage": 4.78, "elapsed_time": "0:04:48", "remaining_time": "1:36:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 69, "total_steps": 1424, "loss": 0.1407, "accuracy": 0.875, "learning_rate": 3.064748484562093e-05, "epoch": 0.048438048438048435, "percentage": 4.85, "elapsed_time": "0:04:53", "remaining_time": "1:35:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 1424, "loss": 0.0493, "accuracy": 1.0, "learning_rate": 3.0751634000237615e-05, "epoch": 0.04914004914004914, "percentage": 4.92, "elapsed_time": "0:04:57", "remaining_time": "1:35:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 71, "total_steps": 1424, "loss": 0.0668, "accuracy": 0.875, "learning_rate": 3.085430581198459e-05, "epoch": 0.04984204984204984, "percentage": 4.99, "elapsed_time": "0:05:01", "remaining_time": "1:35:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 72, "total_steps": 1424, "loss": 0.0529, "accuracy": 1.0, "learning_rate": 3.095554160718781e-05, "epoch": 0.05054405054405054, "percentage": 5.06, "elapsed_time": "0:05:05", "remaining_time": "1:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 73, "total_steps": 1424, "loss": 0.0454, "accuracy": 1.0, "learning_rate": 3.10553810020076e-05, "epoch": 0.05124605124605124, "percentage": 5.13, "elapsed_time": "0:05:09", "remaining_time": "1:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 74, "total_steps": 1424, "loss": 0.0526, "accuracy": 1.0, "learning_rate": 3.115386199551628e-05, "epoch": 0.05194805194805195, "percentage": 5.2, "elapsed_time": "0:05:13", "remaining_time": "1:35:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 75, "total_steps": 1424, "loss": 0.0667, "accuracy": 0.875, "learning_rate": 3.1251021056528336e-05, "epoch": 0.05265005265005265, "percentage": 5.27, "elapsed_time": "0:05:18", "remaining_time": "1:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 76, "total_steps": 1424, "loss": 0.0922, "accuracy": 0.875, "learning_rate": 3.134689320467986e-05, "epoch": 0.053352053352053355, "percentage": 5.34, "elapsed_time": "0:05:22", "remaining_time": "1:35:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 77, "total_steps": 1424, "loss": 0.058, "accuracy": 1.0, "learning_rate": 3.144151208620804e-05, "epoch": 0.05405405405405406, "percentage": 5.41, "elapsed_time": "0:05:26", "remaining_time": "1:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 78, "total_steps": 1424, "loss": 0.0674, "accuracy": 1.0, "learning_rate": 3.1534910044841344e-05, "epoch": 0.05475605475605476, "percentage": 5.48, "elapsed_time": "0:05:30", "remaining_time": "1:35:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 79, "total_steps": 1424, "loss": 0.066, "accuracy": 1.0, "learning_rate": 3.1627118188174024e-05, "epoch": 0.05545805545805546, "percentage": 5.55, "elapsed_time": "0:05:34", "remaining_time": "1:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 1424, "loss": 0.0668, "accuracy": 1.0, "learning_rate": 3.171816644986573e-05, "epoch": 0.05616005616005616, "percentage": 5.62, "elapsed_time": "0:05:38", "remaining_time": "1:34:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 81, "total_steps": 1424, "loss": 0.0612, "accuracy": 0.875, "learning_rate": 3.18080836479775e-05, "epoch": 0.056862056862056864, "percentage": 5.69, "elapsed_time": "0:05:42", "remaining_time": "1:34:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 82, "total_steps": 1424, "loss": 0.1127, "accuracy": 1.0, "learning_rate": 3.1896897539728616e-05, "epoch": 0.057564057564057566, "percentage": 5.76, "elapsed_time": "0:05:47", "remaining_time": "1:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 83, "total_steps": 1424, "loss": 0.1153, "accuracy": 1.0, "learning_rate": 3.198463487293457e-05, "epoch": 0.05826605826605827, "percentage": 5.83, "elapsed_time": "0:05:51", "remaining_time": "1:34:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 84, "total_steps": 1424, "loss": 0.0785, "accuracy": 1.0, "learning_rate": 3.207132143436469e-05, "epoch": 0.05896805896805897, "percentage": 5.9, "elapsed_time": "0:05:55", "remaining_time": "1:34:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 85, "total_steps": 1424, "loss": 0.0741, "accuracy": 1.0, "learning_rate": 3.215698209523821e-05, "epoch": 0.05967005967005967, "percentage": 5.97, "elapsed_time": "0:05:59", "remaining_time": "1:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 86, "total_steps": 1424, "loss": 0.049, "accuracy": 0.875, "learning_rate": 3.224164085405946e-05, "epoch": 0.060372060372060374, "percentage": 6.04, "elapsed_time": "0:06:03", "remaining_time": "1:34:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 87, "total_steps": 1424, "loss": 0.0748, "accuracy": 1.0, "learning_rate": 3.232532087697698e-05, "epoch": 0.061074061074061076, "percentage": 6.11, "elapsed_time": "0:06:07", "remaining_time": "1:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 88, "total_steps": 1424, "loss": 0.0992, "accuracy": 0.875, "learning_rate": 3.240804453583615e-05, "epoch": 0.06177606177606178, "percentage": 6.18, "elapsed_time": "0:06:11", "remaining_time": "1:34:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 89, "total_steps": 1424, "loss": 0.0715, "accuracy": 1.0, "learning_rate": 3.248983344408188e-05, "epoch": 0.06247806247806248, "percentage": 6.25, "elapsed_time": "0:06:16", "remaining_time": "1:34:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 1424, "loss": 0.072, "accuracy": 1.0, "learning_rate": 3.2570708490655414e-05, "epoch": 0.06318006318006318, "percentage": 6.32, "elapsed_time": "0:06:20", "remaining_time": "1:33:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 91, "total_steps": 1424, "loss": 0.0572, "accuracy": 0.875, "learning_rate": 3.265068987201822e-05, "epoch": 0.06388206388206388, "percentage": 6.39, "elapsed_time": "0:06:24", "remaining_time": "1:33:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 92, "total_steps": 1424, "loss": 0.0539, "accuracy": 1.0, "learning_rate": 3.2729797122425925e-05, "epoch": 0.06458406458406458, "percentage": 6.46, "elapsed_time": "0:06:28", "remaining_time": "1:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 93, "total_steps": 1424, "loss": 0.0492, "accuracy": 1.0, "learning_rate": 3.280804914256559e-05, "epoch": 0.06528606528606529, "percentage": 6.53, "elapsed_time": "0:06:32", "remaining_time": "1:33:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 94, "total_steps": 1424, "loss": 0.0471, "accuracy": 1.0, "learning_rate": 3.288546422666164e-05, "epoch": 0.06598806598806599, "percentage": 6.6, "elapsed_time": "0:06:36", "remaining_time": "1:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 95, "total_steps": 1424, "loss": 0.0804, "accuracy": 1.0, "learning_rate": 3.2962060088147464e-05, "epoch": 0.06669006669006669, "percentage": 6.67, "elapsed_time": "0:06:40", "remaining_time": "1:33:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 96, "total_steps": 1424, "loss": 0.0984, "accuracy": 0.875, "learning_rate": 3.3037853883992805e-05, "epoch": 0.06739206739206739, "percentage": 6.74, "elapsed_time": "0:06:45", "remaining_time": "1:33:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 97, "total_steps": 1424, "loss": 0.0932, "accuracy": 1.0, "learning_rate": 3.3112862237770756e-05, "epoch": 0.0680940680940681, "percentage": 6.81, "elapsed_time": "0:06:49", "remaining_time": "1:33:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 98, "total_steps": 1424, "loss": 0.0402, "accuracy": 1.0, "learning_rate": 3.3187101261541584e-05, "epoch": 0.0687960687960688, "percentage": 6.88, "elapsed_time": "0:06:53", "remaining_time": "1:33:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 99, "total_steps": 1424, "loss": 0.0848, "accuracy": 1.0, "learning_rate": 3.326058657662584e-05, "epoch": 0.0694980694980695, "percentage": 6.95, "elapsed_time": "0:06:57", "remaining_time": "1:33:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 1424, "loss": 0.0698, "accuracy": 1.0, "learning_rate": 3.333333333333334e-05, "epoch": 0.0702000702000702, "percentage": 7.02, "elapsed_time": "0:07:01", "remaining_time": "1:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 101, "total_steps": 1424, "loss": 0.0466, "accuracy": 0.875, "learning_rate": 3.340535622971072e-05, "epoch": 0.0709020709020709, "percentage": 7.09, "elapsed_time": "0:07:12", "remaining_time": "1:34:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 102, "total_steps": 1424, "loss": 0.0792, "accuracy": 1.0, "learning_rate": 3.3476669529365295e-05, "epoch": 0.0716040716040716, "percentage": 7.16, "elapsed_time": "0:07:16", "remaining_time": "1:34:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 103, "total_steps": 1424, "loss": 0.0996, "accuracy": 0.875, "learning_rate": 3.3547287078419544e-05, "epoch": 0.0723060723060723, "percentage": 7.23, "elapsed_time": "0:07:20", "remaining_time": "1:34:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 104, "total_steps": 1424, "loss": 0.064, "accuracy": 1.0, "learning_rate": 3.361722232164634e-05, "epoch": 0.07300807300807301, "percentage": 7.3, "elapsed_time": "0:07:24", "remaining_time": "1:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 105, "total_steps": 1424, "loss": 0.0559, "accuracy": 1.0, "learning_rate": 3.3686488317832306e-05, "epoch": 0.07371007371007371, "percentage": 7.37, "elapsed_time": "0:07:28", "remaining_time": "1:33:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 106, "total_steps": 1424, "loss": 0.0991, "accuracy": 0.875, "learning_rate": 3.375509775441284e-05, "epoch": 0.07441207441207441, "percentage": 7.44, "elapsed_time": "0:07:33", "remaining_time": "1:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 107, "total_steps": 1424, "loss": 0.0599, "accuracy": 1.0, "learning_rate": 3.382306296142016e-05, "epoch": 0.07511407511407511, "percentage": 7.51, "elapsed_time": "0:07:37", "remaining_time": "1:33:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 108, "total_steps": 1424, "loss": 0.061, "accuracy": 1.0, "learning_rate": 3.38903959247825e-05, "epoch": 0.07581607581607581, "percentage": 7.58, "elapsed_time": "0:07:41", "remaining_time": "1:33:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 109, "total_steps": 1424, "loss": 0.109, "accuracy": 1.0, "learning_rate": 3.395710829901039e-05, "epoch": 0.07651807651807652, "percentage": 7.65, "elapsed_time": "0:07:45", "remaining_time": "1:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 1424, "loss": 0.0594, "accuracy": 1.0, "learning_rate": 3.402321141930376e-05, "epoch": 0.07722007722007722, "percentage": 7.72, "elapsed_time": "0:07:49", "remaining_time": "1:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 111, "total_steps": 1424, "loss": 0.0531, "accuracy": 1.0, "learning_rate": 3.4088716313110955e-05, "epoch": 0.07792207792207792, "percentage": 7.79, "elapsed_time": "0:07:53", "remaining_time": "1:33:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 112, "total_steps": 1424, "loss": 0.084, "accuracy": 1.0, "learning_rate": 3.415363371116969e-05, "epoch": 0.07862407862407862, "percentage": 7.87, "elapsed_time": "0:07:57", "remaining_time": "1:33:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 113, "total_steps": 1424, "loss": 0.0654, "accuracy": 1.0, "learning_rate": 3.4217974058057e-05, "epoch": 0.07932607932607932, "percentage": 7.94, "elapsed_time": "0:08:02", "remaining_time": "1:33:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 114, "total_steps": 1424, "loss": 0.0653, "accuracy": 1.0, "learning_rate": 3.428174752227455e-05, "epoch": 0.08002808002808003, "percentage": 8.01, "elapsed_time": "0:08:06", "remaining_time": "1:33:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 115, "total_steps": 1424, "loss": 0.0343, "accuracy": 1.0, "learning_rate": 3.434496400589353e-05, "epoch": 0.08073008073008073, "percentage": 8.08, "elapsed_time": "0:08:10", "remaining_time": "1:33:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 116, "total_steps": 1424, "loss": 0.0555, "accuracy": 1.0, "learning_rate": 3.440763315378198e-05, "epoch": 0.08143208143208143, "percentage": 8.15, "elapsed_time": "0:08:14", "remaining_time": "1:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 117, "total_steps": 1424, "loss": 0.0936, "accuracy": 1.0, "learning_rate": 3.446976436243603e-05, "epoch": 0.08213408213408213, "percentage": 8.22, "elapsed_time": "0:08:18", "remaining_time": "1:32:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 118, "total_steps": 1424, "loss": 0.0619, "accuracy": 0.875, "learning_rate": 3.4531366788435425e-05, "epoch": 0.08283608283608283, "percentage": 8.29, "elapsed_time": "0:08:22", "remaining_time": "1:32:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 119, "total_steps": 1424, "loss": 0.0425, "accuracy": 1.0, "learning_rate": 3.459244935654219e-05, "epoch": 0.08353808353808354, "percentage": 8.36, "elapsed_time": "0:08:26", "remaining_time": "1:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 1424, "loss": 0.0454, "accuracy": 1.0, "learning_rate": 3.465302076746041e-05, "epoch": 0.08424008424008424, "percentage": 8.43, "elapsed_time": "0:08:31", "remaining_time": "1:32:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 121, "total_steps": 1424, "loss": 0.0488, "accuracy": 1.0, "learning_rate": 3.471308950527417e-05, "epoch": 0.08494208494208494, "percentage": 8.5, "elapsed_time": "0:08:35", "remaining_time": "1:32:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 122, "total_steps": 1424, "loss": 0.0497, "accuracy": 1.0, "learning_rate": 3.477266384457914e-05, "epoch": 0.08564408564408564, "percentage": 8.57, "elapsed_time": "0:08:39", "remaining_time": "1:32:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 123, "total_steps": 1424, "loss": 0.0691, "accuracy": 1.0, "learning_rate": 3.48317518573233e-05, "epoch": 0.08634608634608634, "percentage": 8.64, "elapsed_time": "0:08:43", "remaining_time": "1:32:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 124, "total_steps": 1424, "loss": 0.0714, "accuracy": 1.0, "learning_rate": 3.489036141937059e-05, "epoch": 0.08704808704808704, "percentage": 8.71, "elapsed_time": "0:08:47", "remaining_time": "1:32:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 125, "total_steps": 1424, "loss": 0.1893, "accuracy": 1.0, "learning_rate": 3.494850021680094e-05, "epoch": 0.08775008775008775, "percentage": 8.78, "elapsed_time": "0:08:51", "remaining_time": "1:32:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 126, "total_steps": 1424, "loss": 0.0909, "accuracy": 1.0, "learning_rate": 3.500617575195938e-05, "epoch": 0.08845208845208845, "percentage": 8.85, "elapsed_time": "0:08:55", "remaining_time": "1:32:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 127, "total_steps": 1424, "loss": 0.0657, "accuracy": 1.0, "learning_rate": 3.5063395349265945e-05, "epoch": 0.08915408915408915, "percentage": 8.92, "elapsed_time": "0:09:00", "remaining_time": "1:31:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 128, "total_steps": 1424, "loss": 0.0617, "accuracy": 0.875, "learning_rate": 3.5120166160797804e-05, "epoch": 0.08985608985608985, "percentage": 8.99, "elapsed_time": "0:09:04", "remaining_time": "1:31:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 129, "total_steps": 1424, "loss": 0.0665, "accuracy": 1.0, "learning_rate": 3.517649517165415e-05, "epoch": 0.09055809055809055, "percentage": 9.06, "elapsed_time": "0:09:08", "remaining_time": "1:31:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 1424, "loss": 0.0689, "accuracy": 1.0, "learning_rate": 3.523238920511395e-05, "epoch": 0.09126009126009126, "percentage": 9.13, "elapsed_time": "0:09:12", "remaining_time": "1:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 131, "total_steps": 1424, "loss": 0.0604, "accuracy": 1.0, "learning_rate": 3.528785492759607e-05, "epoch": 0.09196209196209196, "percentage": 9.2, "elapsed_time": "0:09:16", "remaining_time": "1:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 132, "total_steps": 1424, "loss": 0.0904, "accuracy": 1.0, "learning_rate": 3.5342898853430836e-05, "epoch": 0.09266409266409266, "percentage": 9.27, "elapsed_time": "0:09:20", "remaining_time": "1:31:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 133, "total_steps": 1424, "loss": 0.0528, "accuracy": 1.0, "learning_rate": 3.539752734945143e-05, "epoch": 0.09336609336609336, "percentage": 9.34, "elapsed_time": "0:09:25", "remaining_time": "1:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 134, "total_steps": 1424, "loss": 0.0804, "accuracy": 1.0, "learning_rate": 3.5451746639413466e-05, "epoch": 0.09406809406809406, "percentage": 9.41, "elapsed_time": "0:09:29", "remaining_time": "1:31:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 135, "total_steps": 1424, "loss": 0.0289, "accuracy": 1.0, "learning_rate": 3.550556280825011e-05, "epoch": 0.09477009477009476, "percentage": 9.48, "elapsed_time": "0:09:33", "remaining_time": "1:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 136, "total_steps": 1424, "loss": 0.084, "accuracy": 1.0, "learning_rate": 3.55589818061703e-05, "epoch": 0.09547209547209547, "percentage": 9.55, "elapsed_time": "0:09:37", "remaining_time": "1:31:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 137, "total_steps": 1424, "loss": 0.0673, "accuracy": 0.875, "learning_rate": 3.561200945260678e-05, "epoch": 0.09617409617409617, "percentage": 9.62, "elapsed_time": "0:09:41", "remaining_time": "1:31:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 138, "total_steps": 1424, "loss": 0.018, "accuracy": 1.0, "learning_rate": 3.5664651440020616e-05, "epoch": 0.09687609687609687, "percentage": 9.69, "elapsed_time": "0:09:45", "remaining_time": "1:30:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 139, "total_steps": 1424, "loss": 0.0811, "accuracy": 1.0, "learning_rate": 3.571691333756825e-05, "epoch": 0.09757809757809757, "percentage": 9.76, "elapsed_time": "0:09:50", "remaining_time": "1:30:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 1424, "loss": 0.0586, "accuracy": 1.0, "learning_rate": 3.5768800594637304e-05, "epoch": 0.09828009828009827, "percentage": 9.83, "elapsed_time": "0:09:54", "remaining_time": "1:30:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 141, "total_steps": 1424, "loss": 0.0367, "accuracy": 0.875, "learning_rate": 3.582031854425634e-05, "epoch": 0.09898209898209898, "percentage": 9.9, "elapsed_time": "0:09:58", "remaining_time": "1:30:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 142, "total_steps": 1424, "loss": 0.0557, "accuracy": 1.0, "learning_rate": 3.587147240638428e-05, "epoch": 0.09968409968409968, "percentage": 9.97, "elapsed_time": "0:10:02", "remaining_time": "1:30:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 143, "total_steps": 1424, "loss": 0.0226, "accuracy": 1.0, "learning_rate": 3.5922267291084366e-05, "epoch": 0.10038610038610038, "percentage": 10.04, "elapsed_time": "0:10:06", "remaining_time": "1:30:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 144, "total_steps": 1424, "loss": 0.0904, "accuracy": 1.0, "learning_rate": 3.5972708201587496e-05, "epoch": 0.10108810108810108, "percentage": 10.11, "elapsed_time": "0:10:10", "remaining_time": "1:30:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 145, "total_steps": 1424, "loss": 0.0668, "accuracy": 1.0, "learning_rate": 3.6022800037249585e-05, "epoch": 0.10179010179010178, "percentage": 10.18, "elapsed_time": "0:10:15", "remaining_time": "1:30:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 146, "total_steps": 1424, "loss": 0.0566, "accuracy": 1.0, "learning_rate": 3.607254759640729e-05, "epoch": 0.10249210249210249, "percentage": 10.25, "elapsed_time": "0:10:19", "remaining_time": "1:30:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 147, "total_steps": 1424, "loss": 0.0659, "accuracy": 0.875, "learning_rate": 3.612195557913627e-05, "epoch": 0.10319410319410319, "percentage": 10.32, "elapsed_time": "0:10:23", "remaining_time": "1:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 148, "total_steps": 1424, "loss": 0.0859, "accuracy": 1.0, "learning_rate": 3.6171028589915954e-05, "epoch": 0.1038961038961039, "percentage": 10.39, "elapsed_time": "0:10:27", "remaining_time": "1:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 149, "total_steps": 1424, "loss": 0.0707, "accuracy": 0.875, "learning_rate": 3.6219771140204575e-05, "epoch": 0.1045981045981046, "percentage": 10.46, "elapsed_time": "0:10:31", "remaining_time": "1:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 1424, "loss": 0.0358, "accuracy": 1.0, "learning_rate": 3.626818765092802e-05, "epoch": 0.1053001053001053, "percentage": 10.53, "elapsed_time": "0:10:35", "remaining_time": "1:30:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 151, "total_steps": 1424, "loss": 0.0595, "accuracy": 0.875, "learning_rate": 3.6316282454886157e-05, "epoch": 0.10600210600210601, "percentage": 10.6, "elapsed_time": "0:10:39", "remaining_time": "1:29:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 152, "total_steps": 1424, "loss": 0.1011, "accuracy": 1.0, "learning_rate": 3.636405979907955e-05, "epoch": 0.10670410670410671, "percentage": 10.67, "elapsed_time": "0:10:44", "remaining_time": "1:29:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 153, "total_steps": 1424, "loss": 0.0183, "accuracy": 1.0, "learning_rate": 3.6411523846959985e-05, "epoch": 0.10740610740610741, "percentage": 10.74, "elapsed_time": "0:10:48", "remaining_time": "1:29:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 154, "total_steps": 1424, "loss": 0.0393, "accuracy": 1.0, "learning_rate": 3.645867868060772e-05, "epoch": 0.10810810810810811, "percentage": 10.81, "elapsed_time": "0:10:52", "remaining_time": "1:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 155, "total_steps": 1424, "loss": 0.0529, "accuracy": 1.0, "learning_rate": 3.6505528302838193e-05, "epoch": 0.10881010881010882, "percentage": 10.88, "elapsed_time": "0:10:56", "remaining_time": "1:29:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 156, "total_steps": 1424, "loss": 0.0678, "accuracy": 1.0, "learning_rate": 3.6552076639241027e-05, "epoch": 0.10951210951210952, "percentage": 10.96, "elapsed_time": "0:11:00", "remaining_time": "1:29:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 157, "total_steps": 1424, "loss": 0.0519, "accuracy": 1.0, "learning_rate": 3.65983275401539e-05, "epoch": 0.11021411021411022, "percentage": 11.03, "elapsed_time": "0:11:04", "remaining_time": "1:29:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 158, "total_steps": 1424, "loss": 0.0411, "accuracy": 1.0, "learning_rate": 3.664428478257371e-05, "epoch": 0.11091611091611092, "percentage": 11.1, "elapsed_time": "0:11:09", "remaining_time": "1:29:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 159, "total_steps": 1424, "loss": 0.0542, "accuracy": 1.0, "learning_rate": 3.668995207200753e-05, "epoch": 0.11161811161811162, "percentage": 11.17, "elapsed_time": "0:11:13", "remaining_time": "1:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 1424, "loss": 0.0638, "accuracy": 1.0, "learning_rate": 3.673533304426541e-05, "epoch": 0.11232011232011233, "percentage": 11.24, "elapsed_time": "0:11:17", "remaining_time": "1:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 161, "total_steps": 1424, "loss": 0.073, "accuracy": 1.0, "learning_rate": 3.67804312671975e-05, "epoch": 0.11302211302211303, "percentage": 11.31, "elapsed_time": "0:11:21", "remaining_time": "1:29:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 162, "total_steps": 1424, "loss": 0.0667, "accuracy": 0.875, "learning_rate": 3.682525024237719e-05, "epoch": 0.11372411372411373, "percentage": 11.38, "elapsed_time": "0:11:25", "remaining_time": "1:29:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 163, "total_steps": 1424, "loss": 0.0719, "accuracy": 1.0, "learning_rate": 3.6869793406732636e-05, "epoch": 0.11442611442611443, "percentage": 11.45, "elapsed_time": "0:11:29", "remaining_time": "1:28:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 164, "total_steps": 1424, "loss": 0.1004, "accuracy": 1.0, "learning_rate": 3.69140641341283e-05, "epoch": 0.11512811512811513, "percentage": 11.52, "elapsed_time": "0:11:34", "remaining_time": "1:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 165, "total_steps": 1424, "loss": 0.0488, "accuracy": 1.0, "learning_rate": 3.695806573689844e-05, "epoch": 0.11583011583011583, "percentage": 11.59, "elapsed_time": "0:11:38", "remaining_time": "1:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 166, "total_steps": 1424, "loss": 0.0611, "accuracy": 1.0, "learning_rate": 3.700180146733426e-05, "epoch": 0.11653211653211654, "percentage": 11.66, "elapsed_time": "0:11:42", "remaining_time": "1:28:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 167, "total_steps": 1424, "loss": 0.0272, "accuracy": 1.0, "learning_rate": 3.704527451912639e-05, "epoch": 0.11723411723411724, "percentage": 11.73, "elapsed_time": "0:11:46", "remaining_time": "1:28:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 168, "total_steps": 1424, "loss": 0.0489, "accuracy": 1.0, "learning_rate": 3.708848802876438e-05, "epoch": 0.11793611793611794, "percentage": 11.8, "elapsed_time": "0:11:50", "remaining_time": "1:28:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 169, "total_steps": 1424, "loss": 0.046, "accuracy": 0.875, "learning_rate": 3.7131445076894564e-05, "epoch": 0.11863811863811864, "percentage": 11.87, "elapsed_time": "0:11:54", "remaining_time": "1:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 1424, "loss": 0.0308, "accuracy": 1.0, "learning_rate": 3.717414868963791e-05, "epoch": 0.11934011934011934, "percentage": 11.94, "elapsed_time": "0:11:58", "remaining_time": "1:28:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 171, "total_steps": 1424, "loss": 0.0685, "accuracy": 1.0, "learning_rate": 3.721660183986924e-05, "epoch": 0.12004212004212005, "percentage": 12.01, "elapsed_time": "0:12:03", "remaining_time": "1:28:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 172, "total_steps": 1424, "loss": 0.0165, "accuracy": 1.0, "learning_rate": 3.725880744845915e-05, "epoch": 0.12074412074412075, "percentage": 12.08, "elapsed_time": "0:12:07", "remaining_time": "1:28:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 173, "total_steps": 1424, "loss": 0.0325, "accuracy": 1.0, "learning_rate": 3.730076838547993e-05, "epoch": 0.12144612144612145, "percentage": 12.15, "elapsed_time": "0:12:11", "remaining_time": "1:28:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 174, "total_steps": 1424, "loss": 0.0208, "accuracy": 1.0, "learning_rate": 3.734248747137666e-05, "epoch": 0.12214812214812215, "percentage": 12.22, "elapsed_time": "0:12:15", "remaining_time": "1:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 175, "total_steps": 1424, "loss": 0.044, "accuracy": 1.0, "learning_rate": 3.738396747810492e-05, "epoch": 0.12285012285012285, "percentage": 12.29, "elapsed_time": "0:12:19", "remaining_time": "1:27:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 176, "total_steps": 1424, "loss": 0.0479, "accuracy": 1.0, "learning_rate": 3.7425211130235834e-05, "epoch": 0.12355212355212356, "percentage": 12.36, "elapsed_time": "0:12:23", "remaining_time": "1:27:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 177, "total_steps": 1424, "loss": 0.0268, "accuracy": 1.0, "learning_rate": 3.7466221106030115e-05, "epoch": 0.12425412425412426, "percentage": 12.43, "elapsed_time": "0:12:27", "remaining_time": "1:27:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 178, "total_steps": 1424, "loss": 0.0219, "accuracy": 1.0, "learning_rate": 3.750700003848157e-05, "epoch": 0.12495612495612496, "percentage": 12.5, "elapsed_time": "0:12:31", "remaining_time": "1:27:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 179, "total_steps": 1424, "loss": 0.0241, "accuracy": 1.0, "learning_rate": 3.7547550516331555e-05, "epoch": 0.12565812565812565, "percentage": 12.57, "elapsed_time": "0:12:36", "remaining_time": "1:27:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 1424, "loss": 0.0455, "accuracy": 1.0, "learning_rate": 3.75878750850551e-05, "epoch": 0.12636012636012636, "percentage": 12.64, "elapsed_time": "0:12:40", "remaining_time": "1:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 181, "total_steps": 1424, "loss": 0.0061, "accuracy": 1.0, "learning_rate": 3.7627976247819744e-05, "epoch": 0.12706212706212705, "percentage": 12.71, "elapsed_time": "0:12:44", "remaining_time": "1:27:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 182, "total_steps": 1424, "loss": 0.0298, "accuracy": 1.0, "learning_rate": 3.766785646641792e-05, "epoch": 0.12776412776412777, "percentage": 12.78, "elapsed_time": "0:12:48", "remaining_time": "1:27:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 183, "total_steps": 1424, "loss": 0.0336, "accuracy": 1.0, "learning_rate": 3.770751816217383e-05, "epoch": 0.12846612846612845, "percentage": 12.85, "elapsed_time": "0:12:52", "remaining_time": "1:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 184, "total_steps": 1424, "loss": 0.02, "accuracy": 1.0, "learning_rate": 3.7746963716825615e-05, "epoch": 0.12916812916812917, "percentage": 12.92, "elapsed_time": "0:12:56", "remaining_time": "1:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 185, "total_steps": 1424, "loss": 0.0454, "accuracy": 1.0, "learning_rate": 3.778619547338356e-05, "epoch": 0.12987012987012986, "percentage": 12.99, "elapsed_time": "0:13:01", "remaining_time": "1:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 186, "total_steps": 1424, "loss": 0.0312, "accuracy": 1.0, "learning_rate": 3.782521573696528e-05, "epoch": 0.13057213057213057, "percentage": 13.06, "elapsed_time": "0:13:05", "remaining_time": "1:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 187, "total_steps": 1424, "loss": 0.0042, "accuracy": 1.0, "learning_rate": 3.786402677560832e-05, "epoch": 0.13127413127413126, "percentage": 13.13, "elapsed_time": "0:13:09", "remaining_time": "1:27:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 188, "total_steps": 1424, "loss": 0.0131, "accuracy": 1.0, "learning_rate": 3.790263082106134e-05, "epoch": 0.13197613197613198, "percentage": 13.2, "elapsed_time": "0:13:13", "remaining_time": "1:26:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 189, "total_steps": 1424, "loss": 0.0502, "accuracy": 0.875, "learning_rate": 3.794103006955407e-05, "epoch": 0.13267813267813267, "percentage": 13.27, "elapsed_time": "0:13:17", "remaining_time": "1:26:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 1424, "loss": 0.0151, "accuracy": 1.0, "learning_rate": 3.797922668254715e-05, "epoch": 0.13338013338013338, "percentage": 13.34, "elapsed_time": "0:13:21", "remaining_time": "1:26:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 191, "total_steps": 1424, "loss": 0.01, "accuracy": 1.0, "learning_rate": 3.801722278746213e-05, "epoch": 0.13408213408213407, "percentage": 13.41, "elapsed_time": "0:13:25", "remaining_time": "1:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 192, "total_steps": 1424, "loss": 0.0107, "accuracy": 1.0, "learning_rate": 3.8055020478392495e-05, "epoch": 0.13478413478413478, "percentage": 13.48, "elapsed_time": "0:13:29", "remaining_time": "1:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 193, "total_steps": 1424, "loss": 0.0065, "accuracy": 1.0, "learning_rate": 3.809262181679623e-05, "epoch": 0.13548613548613547, "percentage": 13.55, "elapsed_time": "0:13:34", "remaining_time": "1:26:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 194, "total_steps": 1424, "loss": 0.0089, "accuracy": 1.0, "learning_rate": 3.813002883217044e-05, "epoch": 0.1361881361881362, "percentage": 13.62, "elapsed_time": "0:13:38", "remaining_time": "1:26:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 195, "total_steps": 1424, "loss": 0.0129, "accuracy": 1.0, "learning_rate": 3.816724352270863e-05, "epoch": 0.13689013689013688, "percentage": 13.69, "elapsed_time": "0:13:42", "remaining_time": "1:26:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 196, "total_steps": 1424, "loss": 0.0033, "accuracy": 1.0, "learning_rate": 3.8204267855941266e-05, "epoch": 0.1375921375921376, "percentage": 13.76, "elapsed_time": "0:13:46", "remaining_time": "1:26:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 197, "total_steps": 1424, "loss": 0.026, "accuracy": 1.0, "learning_rate": 3.824110376935989e-05, "epoch": 0.1382941382941383, "percentage": 13.83, "elapsed_time": "0:13:50", "remaining_time": "1:26:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 198, "total_steps": 1424, "loss": 0.0117, "accuracy": 1.0, "learning_rate": 3.827775317102552e-05, "epoch": 0.138996138996139, "percentage": 13.9, "elapsed_time": "0:13:54", "remaining_time": "1:26:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 199, "total_steps": 1424, "loss": 0.0067, "accuracy": 1.0, "learning_rate": 3.831421794016178e-05, "epoch": 0.1396981396981397, "percentage": 13.97, "elapsed_time": "0:13:58", "remaining_time": "1:26:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 1424, "loss": 0.0497, "accuracy": 1.0, "learning_rate": 3.835049992773302e-05, "epoch": 0.1404001404001404, "percentage": 14.04, "elapsed_time": "0:14:03", "remaining_time": "1:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 201, "total_steps": 1424, "loss": 0.0184, "accuracy": 1.0, "learning_rate": 3.838660095700815e-05, "epoch": 0.14110214110214112, "percentage": 14.12, "elapsed_time": "0:14:14", "remaining_time": "1:26:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 202, "total_steps": 1424, "loss": 0.0125, "accuracy": 1.0, "learning_rate": 3.84225228241104e-05, "epoch": 0.1418041418041418, "percentage": 14.19, "elapsed_time": "0:14:18", "remaining_time": "1:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 203, "total_steps": 1424, "loss": 0.0062, "accuracy": 1.0, "learning_rate": 3.8458267298553554e-05, "epoch": 0.14250614250614252, "percentage": 14.26, "elapsed_time": "0:14:22", "remaining_time": "1:26:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 204, "total_steps": 1424, "loss": 0.0452, "accuracy": 1.0, "learning_rate": 3.8493836123764984e-05, "epoch": 0.1432081432081432, "percentage": 14.33, "elapsed_time": "0:14:26", "remaining_time": "1:26:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 205, "total_steps": 1424, "loss": 0.0016, "accuracy": 1.0, "learning_rate": 3.852923101759591e-05, "epoch": 0.14391014391014392, "percentage": 14.4, "elapsed_time": "0:14:30", "remaining_time": "1:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 206, "total_steps": 1424, "loss": 0.0053, "accuracy": 1.0, "learning_rate": 3.856445367281923e-05, "epoch": 0.1446121446121446, "percentage": 14.47, "elapsed_time": "0:14:34", "remaining_time": "1:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 207, "total_steps": 1424, "loss": 0.0074, "accuracy": 1.0, "learning_rate": 3.859950575761529e-05, "epoch": 0.14531414531414533, "percentage": 14.54, "elapsed_time": "0:14:38", "remaining_time": "1:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 208, "total_steps": 1424, "loss": 0.0017, "accuracy": 1.0, "learning_rate": 3.8634388916046025e-05, "epoch": 0.14601614601614601, "percentage": 14.61, "elapsed_time": "0:14:43", "remaining_time": "1:26:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 209, "total_steps": 1424, "loss": 0.0088, "accuracy": 1.0, "learning_rate": 3.866910476851757e-05, "epoch": 0.14671814671814673, "percentage": 14.68, "elapsed_time": "0:14:47", "remaining_time": "1:25:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 1424, "loss": 0.0208, "accuracy": 1.0, "learning_rate": 3.870365491223199e-05, "epoch": 0.14742014742014742, "percentage": 14.75, "elapsed_time": "0:14:51", "remaining_time": "1:25:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 211, "total_steps": 1424, "loss": 0.0032, "accuracy": 1.0, "learning_rate": 3.8738040921628215e-05, "epoch": 0.14812214812214813, "percentage": 14.82, "elapsed_time": "0:14:55", "remaining_time": "1:25:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 212, "total_steps": 1424, "loss": 0.0857, "accuracy": 1.0, "learning_rate": 3.877226434881253e-05, "epoch": 0.14882414882414882, "percentage": 14.89, "elapsed_time": "0:14:59", "remaining_time": "1:25:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 213, "total_steps": 1424, "loss": 0.0269, "accuracy": 1.0, "learning_rate": 3.880632672397897e-05, "epoch": 0.14952614952614954, "percentage": 14.96, "elapsed_time": "0:15:03", "remaining_time": "1:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 214, "total_steps": 1424, "loss": 0.0143, "accuracy": 1.0, "learning_rate": 3.884022955581985e-05, "epoch": 0.15022815022815023, "percentage": 15.03, "elapsed_time": "0:15:07", "remaining_time": "1:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 215, "total_steps": 1424, "loss": 0.0028, "accuracy": 1.0, "learning_rate": 3.887397433192676e-05, "epoch": 0.15093015093015094, "percentage": 15.1, "elapsed_time": "0:15:12", "remaining_time": "1:25:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 216, "total_steps": 1424, "loss": 0.0038, "accuracy": 1.0, "learning_rate": 3.890756251918219e-05, "epoch": 0.15163215163215163, "percentage": 15.17, "elapsed_time": "0:15:16", "remaining_time": "1:25:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 217, "total_steps": 1424, "loss": 0.0056, "accuracy": 1.0, "learning_rate": 3.894099556414216e-05, "epoch": 0.15233415233415235, "percentage": 15.24, "elapsed_time": "0:15:20", "remaining_time": "1:25:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 218, "total_steps": 1424, "loss": 0.001, "accuracy": 1.0, "learning_rate": 3.897427489341009e-05, "epoch": 0.15303615303615303, "percentage": 15.31, "elapsed_time": "0:15:24", "remaining_time": "1:25:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 219, "total_steps": 1424, "loss": 0.0067, "accuracy": 1.0, "learning_rate": 3.900740191400198e-05, "epoch": 0.15373815373815375, "percentage": 15.38, "elapsed_time": "0:15:28", "remaining_time": "1:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 1424, "loss": 0.0227, "accuracy": 1.0, "learning_rate": 3.904037801370344e-05, "epoch": 0.15444015444015444, "percentage": 15.45, "elapsed_time": "0:15:32", "remaining_time": "1:25:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 221, "total_steps": 1424, "loss": 0.0488, "accuracy": 1.0, "learning_rate": 3.9073204561418514e-05, "epoch": 0.15514215514215515, "percentage": 15.52, "elapsed_time": "0:15:37", "remaining_time": "1:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 222, "total_steps": 1424, "loss": 0.0118, "accuracy": 1.0, "learning_rate": 3.9105882907510644e-05, "epoch": 0.15584415584415584, "percentage": 15.59, "elapsed_time": "0:15:41", "remaining_time": "1:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 223, "total_steps": 1424, "loss": 0.0207, "accuracy": 1.0, "learning_rate": 3.913841438413601e-05, "epoch": 0.15654615654615656, "percentage": 15.66, "elapsed_time": "0:15:45", "remaining_time": "1:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 224, "total_steps": 1424, "loss": 0.011, "accuracy": 1.0, "learning_rate": 3.917080030556938e-05, "epoch": 0.15724815724815724, "percentage": 15.73, "elapsed_time": "0:15:49", "remaining_time": "1:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 225, "total_steps": 1424, "loss": 0.0136, "accuracy": 1.0, "learning_rate": 3.9203041968522716e-05, "epoch": 0.15795015795015796, "percentage": 15.8, "elapsed_time": "0:15:53", "remaining_time": "1:24:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 226, "total_steps": 1424, "loss": 0.0053, "accuracy": 1.0, "learning_rate": 3.923514065245669e-05, "epoch": 0.15865215865215865, "percentage": 15.87, "elapsed_time": "0:15:57", "remaining_time": "1:24:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 227, "total_steps": 1424, "loss": 0.0047, "accuracy": 1.0, "learning_rate": 3.926709761988538e-05, "epoch": 0.15935415935415936, "percentage": 15.94, "elapsed_time": "0:16:01", "remaining_time": "1:24:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 228, "total_steps": 1424, "loss": 0.002, "accuracy": 1.0, "learning_rate": 3.929891411667424e-05, "epoch": 0.16005616005616005, "percentage": 16.01, "elapsed_time": "0:16:06", "remaining_time": "1:24:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 229, "total_steps": 1424, "loss": 0.0056, "accuracy": 1.0, "learning_rate": 3.933059137233147e-05, "epoch": 0.16075816075816077, "percentage": 16.08, "elapsed_time": "0:16:10", "remaining_time": "1:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 1424, "loss": 0.0053, "accuracy": 1.0, "learning_rate": 3.9362130600293214e-05, "epoch": 0.16146016146016146, "percentage": 16.15, "elapsed_time": "0:16:14", "remaining_time": "1:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 231, "total_steps": 1424, "loss": 0.0053, "accuracy": 1.0, "learning_rate": 3.9393532998202405e-05, "epoch": 0.16216216216216217, "percentage": 16.22, "elapsed_time": "0:16:18", "remaining_time": "1:24:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 232, "total_steps": 1424, "loss": 0.0052, "accuracy": 1.0, "learning_rate": 3.942479974818166e-05, "epoch": 0.16286416286416286, "percentage": 16.29, "elapsed_time": "0:16:22", "remaining_time": "1:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 233, "total_steps": 1424, "loss": 0.0057, "accuracy": 1.0, "learning_rate": 3.945593201710032e-05, "epoch": 0.16356616356616357, "percentage": 16.36, "elapsed_time": "0:16:26", "remaining_time": "1:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 234, "total_steps": 1424, "loss": 0.0285, "accuracy": 1.0, "learning_rate": 3.9486930956835724e-05, "epoch": 0.16426816426816426, "percentage": 16.43, "elapsed_time": "0:16:30", "remaining_time": "1:23:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 235, "total_steps": 1424, "loss": 0.0423, "accuracy": 1.0, "learning_rate": 3.951779770452894e-05, "epoch": 0.16497016497016498, "percentage": 16.5, "elapsed_time": "0:16:35", "remaining_time": "1:23:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 236, "total_steps": 1424, "loss": 0.0031, "accuracy": 1.0, "learning_rate": 3.954853338283512e-05, "epoch": 0.16567216567216567, "percentage": 16.57, "elapsed_time": "0:16:39", "remaining_time": "1:23:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 237, "total_steps": 1424, "loss": 0.0025, "accuracy": 1.0, "learning_rate": 3.9579139100168404e-05, "epoch": 0.16637416637416638, "percentage": 16.64, "elapsed_time": "0:16:43", "remaining_time": "1:23:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 238, "total_steps": 1424, "loss": 0.0114, "accuracy": 1.0, "learning_rate": 3.960961595094187e-05, "epoch": 0.16707616707616707, "percentage": 16.71, "elapsed_time": "0:16:47", "remaining_time": "1:23:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 239, "total_steps": 1424, "loss": 0.0025, "accuracy": 1.0, "learning_rate": 3.96399650158023e-05, "epoch": 0.16777816777816779, "percentage": 16.78, "elapsed_time": "0:16:51", "remaining_time": "1:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 1424, "loss": 0.0028, "accuracy": 1.0, "learning_rate": 3.96701873618601e-05, "epoch": 0.16848016848016847, "percentage": 16.85, "elapsed_time": "0:16:55", "remaining_time": "1:23:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 241, "total_steps": 1424, "loss": 0.0028, "accuracy": 1.0, "learning_rate": 3.970028404291448e-05, "epoch": 0.1691821691821692, "percentage": 16.92, "elapsed_time": "0:16:59", "remaining_time": "1:23:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 242, "total_steps": 1424, "loss": 0.0034, "accuracy": 1.0, "learning_rate": 3.9730256099673865e-05, "epoch": 0.16988416988416988, "percentage": 16.99, "elapsed_time": "0:17:04", "remaining_time": "1:23:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 243, "total_steps": 1424, "loss": 0.0022, "accuracy": 1.0, "learning_rate": 3.976010455997187e-05, "epoch": 0.1705861705861706, "percentage": 17.06, "elapsed_time": "0:17:08", "remaining_time": "1:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 244, "total_steps": 1424, "loss": 0.0042, "accuracy": 1.0, "learning_rate": 3.978983043897883e-05, "epoch": 0.17128817128817128, "percentage": 17.13, "elapsed_time": "0:17:12", "remaining_time": "1:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 245, "total_steps": 1424, "loss": 0.0019, "accuracy": 1.0, "learning_rate": 3.981943473940888e-05, "epoch": 0.171990171990172, "percentage": 17.21, "elapsed_time": "0:17:16", "remaining_time": "1:23:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 246, "total_steps": 1424, "loss": 0.0019, "accuracy": 1.0, "learning_rate": 3.984891845172299e-05, "epoch": 0.17269217269217269, "percentage": 17.28, "elapsed_time": "0:17:20", "remaining_time": "1:23:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 247, "total_steps": 1424, "loss": 0.0016, "accuracy": 1.0, "learning_rate": 3.987828255432777e-05, "epoch": 0.1733941733941734, "percentage": 17.35, "elapsed_time": "0:17:24", "remaining_time": "1:22:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 248, "total_steps": 1424, "loss": 0.0013, "accuracy": 1.0, "learning_rate": 3.9907528013770276e-05, "epoch": 0.1740961740961741, "percentage": 17.42, "elapsed_time": "0:17:28", "remaining_time": "1:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 249, "total_steps": 1424, "loss": 0.0021, "accuracy": 1.0, "learning_rate": 3.993665578492894e-05, "epoch": 0.1747981747981748, "percentage": 17.49, "elapsed_time": "0:17:32", "remaining_time": "1:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 3.9965666811200624e-05, "epoch": 0.1755001755001755, "percentage": 17.56, "elapsed_time": "0:17:37", "remaining_time": "1:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 251, "total_steps": 1424, "loss": 0.0342, "accuracy": 1.0, "learning_rate": 3.999456202468397e-05, "epoch": 0.1762021762021762, "percentage": 17.63, "elapsed_time": "0:17:41", "remaining_time": "1:22:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 252, "total_steps": 1424, "loss": 0.0092, "accuracy": 1.0, "learning_rate": 4.002334234635907e-05, "epoch": 0.1769041769041769, "percentage": 17.7, "elapsed_time": "0:17:45", "remaining_time": "1:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 253, "total_steps": 1424, "loss": 0.0079, "accuracy": 1.0, "learning_rate": 4.005200868626364e-05, "epoch": 0.1776061776061776, "percentage": 17.77, "elapsed_time": "0:17:49", "remaining_time": "1:22:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 254, "total_steps": 1424, "loss": 0.0017, "accuracy": 1.0, "learning_rate": 4.008056194366564e-05, "epoch": 0.1783081783081783, "percentage": 17.84, "elapsed_time": "0:17:53", "remaining_time": "1:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 255, "total_steps": 1424, "loss": 0.0055, "accuracy": 1.0, "learning_rate": 4.010900300723259e-05, "epoch": 0.17901017901017902, "percentage": 17.91, "elapsed_time": "0:17:57", "remaining_time": "1:22:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 256, "total_steps": 1424, "loss": 0.0046, "accuracy": 1.0, "learning_rate": 4.013733275519749e-05, "epoch": 0.1797121797121797, "percentage": 17.98, "elapsed_time": "0:18:01", "remaining_time": "1:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 257, "total_steps": 1424, "loss": 0.0068, "accuracy": 1.0, "learning_rate": 4.016555205552158e-05, "epoch": 0.18041418041418042, "percentage": 18.05, "elapsed_time": "0:18:06", "remaining_time": "1:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 258, "total_steps": 1424, "loss": 0.0029, "accuracy": 1.0, "learning_rate": 4.0193661766053834e-05, "epoch": 0.1811161811161811, "percentage": 18.12, "elapsed_time": "0:18:10", "remaining_time": "1:22:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 259, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.022166273468753e-05, "epoch": 0.18181818181818182, "percentage": 18.19, "elapsed_time": "0:18:14", "remaining_time": "1:22:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.024955579951363e-05, "epoch": 0.1825201825201825, "percentage": 18.26, "elapsed_time": "0:18:18", "remaining_time": "1:21:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 261, "total_steps": 1424, "loss": 0.0016, "accuracy": 1.0, "learning_rate": 4.027734178897136e-05, "epoch": 0.18322218322218323, "percentage": 18.33, "elapsed_time": "0:18:22", "remaining_time": "1:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 262, "total_steps": 1424, "loss": 0.0022, "accuracy": 1.0, "learning_rate": 4.030502152199576e-05, "epoch": 0.18392418392418391, "percentage": 18.4, "elapsed_time": "0:18:26", "remaining_time": "1:21:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 263, "total_steps": 1424, "loss": 0.0019, "accuracy": 1.0, "learning_rate": 4.033259580816264e-05, "epoch": 0.18462618462618463, "percentage": 18.47, "elapsed_time": "0:18:30", "remaining_time": "1:21:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 264, "total_steps": 1424, "loss": 0.0033, "accuracy": 1.0, "learning_rate": 4.036006544783052e-05, "epoch": 0.18532818532818532, "percentage": 18.54, "elapsed_time": "0:18:34", "remaining_time": "1:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 265, "total_steps": 1424, "loss": 0.0024, "accuracy": 1.0, "learning_rate": 4.0387431232280135e-05, "epoch": 0.18603018603018603, "percentage": 18.61, "elapsed_time": "0:18:39", "remaining_time": "1:21:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 266, "total_steps": 1424, "loss": 0.0045, "accuracy": 1.0, "learning_rate": 4.041469394385112e-05, "epoch": 0.18673218673218672, "percentage": 18.68, "elapsed_time": "0:18:43", "remaining_time": "1:21:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 267, "total_steps": 1424, "loss": 0.003, "accuracy": 1.0, "learning_rate": 4.0441854356076257e-05, "epoch": 0.18743418743418744, "percentage": 18.75, "elapsed_time": "0:18:47", "remaining_time": "1:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 268, "total_steps": 1424, "loss": 0.0015, "accuracy": 1.0, "learning_rate": 4.046891323381315e-05, "epoch": 0.18813618813618813, "percentage": 18.82, "elapsed_time": "0:18:51", "remaining_time": "1:21:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 269, "total_steps": 1424, "loss": 0.0747, "accuracy": 1.0, "learning_rate": 4.049587133337347e-05, "epoch": 0.18883818883818884, "percentage": 18.89, "elapsed_time": "0:18:55", "remaining_time": "1:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 1424, "loss": 0.0016, "accuracy": 1.0, "learning_rate": 4.0522729402649793e-05, "epoch": 0.18954018954018953, "percentage": 18.96, "elapsed_time": "0:18:59", "remaining_time": "1:21:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 271, "total_steps": 1424, "loss": 0.0023, "accuracy": 1.0, "learning_rate": 4.0549488181240096e-05, "epoch": 0.19024219024219025, "percentage": 19.03, "elapsed_time": "0:19:03", "remaining_time": "1:21:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 272, "total_steps": 1424, "loss": 0.0266, "accuracy": 1.0, "learning_rate": 4.057614840056998e-05, "epoch": 0.19094419094419093, "percentage": 19.1, "elapsed_time": "0:19:08", "remaining_time": "1:21:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 273, "total_steps": 1424, "loss": 0.0016, "accuracy": 1.0, "learning_rate": 4.06027107840126e-05, "epoch": 0.19164619164619165, "percentage": 19.17, "elapsed_time": "0:19:12", "remaining_time": "1:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 274, "total_steps": 1424, "loss": 0.0015, "accuracy": 1.0, "learning_rate": 4.0629176047006474e-05, "epoch": 0.19234819234819234, "percentage": 19.24, "elapsed_time": "0:19:16", "remaining_time": "1:20:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 275, "total_steps": 1424, "loss": 0.0011, "accuracy": 1.0, "learning_rate": 4.065554489717105e-05, "epoch": 0.19305019305019305, "percentage": 19.31, "elapsed_time": "0:19:20", "remaining_time": "1:20:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 276, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.068181803442029e-05, "epoch": 0.19375219375219374, "percentage": 19.38, "elapsed_time": "0:19:24", "remaining_time": "1:20:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 277, "total_steps": 1424, "loss": 0.0536, "accuracy": 1.0, "learning_rate": 4.0707996151074147e-05, "epoch": 0.19445419445419446, "percentage": 19.45, "elapsed_time": "0:19:28", "remaining_time": "1:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 278, "total_steps": 1424, "loss": 0.0011, "accuracy": 1.0, "learning_rate": 4.073407993196794e-05, "epoch": 0.19515619515619514, "percentage": 19.52, "elapsed_time": "0:19:33", "remaining_time": "1:20:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 279, "total_steps": 1424, "loss": 0.0015, "accuracy": 1.0, "learning_rate": 4.076007005455996e-05, "epoch": 0.19585819585819586, "percentage": 19.59, "elapsed_time": "0:19:37", "remaining_time": "1:20:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 1424, "loss": 0.0014, "accuracy": 1.0, "learning_rate": 4.0785967189036986e-05, "epoch": 0.19656019656019655, "percentage": 19.66, "elapsed_time": "0:19:41", "remaining_time": "1:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 281, "total_steps": 1424, "loss": 0.0015, "accuracy": 1.0, "learning_rate": 4.0811771998418e-05, "epoch": 0.19726219726219726, "percentage": 19.73, "elapsed_time": "0:19:45", "remaining_time": "1:20:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 282, "total_steps": 1424, "loss": 0.0046, "accuracy": 1.0, "learning_rate": 4.083748513865602e-05, "epoch": 0.19796419796419795, "percentage": 19.8, "elapsed_time": "0:19:49", "remaining_time": "1:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 283, "total_steps": 1424, "loss": 0.0028, "accuracy": 1.0, "learning_rate": 4.086310725873818e-05, "epoch": 0.19866619866619867, "percentage": 19.87, "elapsed_time": "0:19:53", "remaining_time": "1:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 284, "total_steps": 1424, "loss": 0.0017, "accuracy": 1.0, "learning_rate": 4.0888639000783966e-05, "epoch": 0.19936819936819936, "percentage": 19.94, "elapsed_time": "0:19:57", "remaining_time": "1:20:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 285, "total_steps": 1424, "loss": 0.0012, "accuracy": 1.0, "learning_rate": 4.0914081000141844e-05, "epoch": 0.20007020007020007, "percentage": 20.01, "elapsed_time": "0:20:02", "remaining_time": "1:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 286, "total_steps": 1424, "loss": 0.0007, "accuracy": 1.0, "learning_rate": 4.0939433885484055e-05, "epoch": 0.20077220077220076, "percentage": 20.08, "elapsed_time": "0:20:06", "remaining_time": "1:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 287, "total_steps": 1424, "loss": 0.0016, "accuracy": 1.0, "learning_rate": 4.0964698278899874e-05, "epoch": 0.20147420147420148, "percentage": 20.15, "elapsed_time": "0:20:10", "remaining_time": "1:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 288, "total_steps": 1424, "loss": 0.0022, "accuracy": 1.0, "learning_rate": 4.0989874795987185e-05, "epoch": 0.20217620217620216, "percentage": 20.22, "elapsed_time": "0:20:14", "remaining_time": "1:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 289, "total_steps": 1424, "loss": 0.0032, "accuracy": 1.0, "learning_rate": 4.1014964045942465e-05, "epoch": 0.20287820287820288, "percentage": 20.29, "elapsed_time": "0:20:18", "remaining_time": "1:19:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.103996663164927e-05, "epoch": 0.20358020358020357, "percentage": 20.37, "elapsed_time": "0:20:22", "remaining_time": "1:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 291, "total_steps": 1424, "loss": 0.0029, "accuracy": 1.0, "learning_rate": 4.106488314976513e-05, "epoch": 0.20428220428220428, "percentage": 20.44, "elapsed_time": "0:20:26", "remaining_time": "1:19:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 292, "total_steps": 1424, "loss": 0.001, "accuracy": 1.0, "learning_rate": 4.108971419080698e-05, "epoch": 0.20498420498420497, "percentage": 20.51, "elapsed_time": "0:20:31", "remaining_time": "1:19:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 293, "total_steps": 1424, "loss": 0.001, "accuracy": 1.0, "learning_rate": 4.111446033923516e-05, "epoch": 0.2056862056862057, "percentage": 20.58, "elapsed_time": "0:20:35", "remaining_time": "1:19:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 294, "total_steps": 1424, "loss": 0.0013, "accuracy": 1.0, "learning_rate": 4.113912217353596e-05, "epoch": 0.20638820638820637, "percentage": 20.65, "elapsed_time": "0:20:39", "remaining_time": "1:19:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 295, "total_steps": 1424, "loss": 0.0139, "accuracy": 1.0, "learning_rate": 4.116370026630272e-05, "epoch": 0.2070902070902071, "percentage": 20.72, "elapsed_time": "0:20:43", "remaining_time": "1:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 296, "total_steps": 1424, "loss": 0.0011, "accuracy": 1.0, "learning_rate": 4.118819518431564e-05, "epoch": 0.2077922077922078, "percentage": 20.79, "elapsed_time": "0:20:47", "remaining_time": "1:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 297, "total_steps": 1424, "loss": 0.0013, "accuracy": 1.0, "learning_rate": 4.121260748862021e-05, "epoch": 0.2084942084942085, "percentage": 20.86, "elapsed_time": "0:20:51", "remaining_time": "1:19:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 298, "total_steps": 1424, "loss": 0.0039, "accuracy": 1.0, "learning_rate": 4.123693773460426e-05, "epoch": 0.2091962091962092, "percentage": 20.93, "elapsed_time": "0:20:55", "remaining_time": "1:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 299, "total_steps": 1424, "loss": 0.0479, "accuracy": 1.0, "learning_rate": 4.126118647207383e-05, "epoch": 0.2098982098982099, "percentage": 21.0, "elapsed_time": "0:21:00", "remaining_time": "1:19:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 1424, "loss": 0.001, "accuracy": 1.0, "learning_rate": 4.1285354245327715e-05, "epoch": 0.2106002106002106, "percentage": 21.07, "elapsed_time": "0:21:04", "remaining_time": "1:18:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 301, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.1309441593230726e-05, "epoch": 0.2113022113022113, "percentage": 21.14, "elapsed_time": "0:21:14", "remaining_time": "1:19:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 302, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.133344904928585e-05, "epoch": 0.21200421200421202, "percentage": 21.21, "elapsed_time": "0:21:18", "remaining_time": "1:19:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 303, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.1357377141705084e-05, "epoch": 0.2127062127062127, "percentage": 21.28, "elapsed_time": "0:21:23", "remaining_time": "1:19:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 304, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.1381226393479236e-05, "epoch": 0.21340821340821342, "percentage": 21.35, "elapsed_time": "0:21:27", "remaining_time": "1:19:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 305, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.1404997322446435e-05, "epoch": 0.2141102141102141, "percentage": 21.42, "elapsed_time": "0:21:31", "remaining_time": "1:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 306, "total_steps": 1424, "loss": 0.0011, "accuracy": 1.0, "learning_rate": 4.142869044135967e-05, "epoch": 0.21481221481221482, "percentage": 21.49, "elapsed_time": "0:21:35", "remaining_time": "1:18:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 307, "total_steps": 1424, "loss": 0.0032, "accuracy": 1.0, "learning_rate": 4.145230625795311e-05, "epoch": 0.2155142155142155, "percentage": 21.56, "elapsed_time": "0:21:39", "remaining_time": "1:18:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 308, "total_steps": 1424, "loss": 0.0018, "accuracy": 1.0, "learning_rate": 4.14758452750074e-05, "epoch": 0.21621621621621623, "percentage": 21.63, "elapsed_time": "0:21:43", "remaining_time": "1:18:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 309, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.149930799041392e-05, "epoch": 0.21691821691821692, "percentage": 21.7, "elapsed_time": "0:21:47", "remaining_time": "1:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 1424, "loss": 0.0012, "accuracy": 1.0, "learning_rate": 4.152269489723788e-05, "epoch": 0.21762021762021763, "percentage": 21.77, "elapsed_time": "0:21:52", "remaining_time": "1:18:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 311, "total_steps": 1424, "loss": 0.065, "accuracy": 1.0, "learning_rate": 4.1546006483780626e-05, "epoch": 0.21832221832221832, "percentage": 21.84, "elapsed_time": "0:21:56", "remaining_time": "1:18:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 312, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.156924323364072e-05, "epoch": 0.21902421902421904, "percentage": 21.91, "elapsed_time": "0:22:00", "remaining_time": "1:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 313, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.1592405625774144e-05, "epoch": 0.21972621972621972, "percentage": 21.98, "elapsed_time": "0:22:04", "remaining_time": "1:18:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 314, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.161549413455358e-05, "epoch": 0.22042822042822044, "percentage": 22.05, "elapsed_time": "0:22:08", "remaining_time": "1:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 315, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.163850922982668e-05, "epoch": 0.22113022113022113, "percentage": 22.12, "elapsed_time": "0:22:12", "remaining_time": "1:18:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 316, "total_steps": 1424, "loss": 0.0023, "accuracy": 1.0, "learning_rate": 4.16614513769734e-05, "epoch": 0.22183222183222184, "percentage": 22.19, "elapsed_time": "0:22:16", "remaining_time": "1:18:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 317, "total_steps": 1424, "loss": 0.0015, "accuracy": 1.0, "learning_rate": 4.1684321036962526e-05, "epoch": 0.22253422253422253, "percentage": 22.26, "elapsed_time": "0:22:20", "remaining_time": "1:18:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 318, "total_steps": 1424, "loss": 0.0013, "accuracy": 1.0, "learning_rate": 4.170711866640721e-05, "epoch": 0.22323622323622325, "percentage": 22.33, "elapsed_time": "0:22:25", "remaining_time": "1:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 319, "total_steps": 1424, "loss": 0.0015, "accuracy": 1.0, "learning_rate": 4.1729844717619684e-05, "epoch": 0.22393822393822393, "percentage": 22.4, "elapsed_time": "0:22:29", "remaining_time": "1:17:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 1424, "loss": 0.0115, "accuracy": 1.0, "learning_rate": 4.17524996386651e-05, "epoch": 0.22464022464022465, "percentage": 22.47, "elapsed_time": "0:22:33", "remaining_time": "1:17:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 321, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.177508387341454e-05, "epoch": 0.22534222534222534, "percentage": 22.54, "elapsed_time": "0:22:37", "remaining_time": "1:17:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 322, "total_steps": 1424, "loss": 0.0027, "accuracy": 1.0, "learning_rate": 4.179759786159719e-05, "epoch": 0.22604422604422605, "percentage": 22.61, "elapsed_time": "0:22:41", "remaining_time": "1:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 323, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.182004203885172e-05, "epoch": 0.22674622674622674, "percentage": 22.68, "elapsed_time": "0:22:45", "remaining_time": "1:17:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 324, "total_steps": 1424, "loss": 0.0025, "accuracy": 1.0, "learning_rate": 4.184241683677687e-05, "epoch": 0.22744822744822746, "percentage": 22.75, "elapsed_time": "0:22:50", "remaining_time": "1:17:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 325, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.1864722682981245e-05, "epoch": 0.22815022815022815, "percentage": 22.82, "elapsed_time": "0:22:54", "remaining_time": "1:17:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 326, "total_steps": 1424, "loss": 0.0014, "accuracy": 1.0, "learning_rate": 4.188696000113232e-05, "epoch": 0.22885222885222886, "percentage": 22.89, "elapsed_time": "0:22:58", "remaining_time": "1:17:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 327, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.190912921100477e-05, "epoch": 0.22955422955422955, "percentage": 22.96, "elapsed_time": "0:23:02", "remaining_time": "1:17:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 328, "total_steps": 1424, "loss": 0.001, "accuracy": 1.0, "learning_rate": 4.1931230728527994e-05, "epoch": 0.23025623025623027, "percentage": 23.03, "elapsed_time": "0:23:06", "remaining_time": "1:17:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 329, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.195326496583291e-05, "epoch": 0.23095823095823095, "percentage": 23.1, "elapsed_time": "0:23:11", "remaining_time": "1:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 1424, "loss": 0.001, "accuracy": 1.0, "learning_rate": 4.1975232331298125e-05, "epoch": 0.23166023166023167, "percentage": 23.17, "elapsed_time": "0:23:15", "remaining_time": "1:17:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 331, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.1997133229595316e-05, "epoch": 0.23236223236223236, "percentage": 23.24, "elapsed_time": "0:23:19", "remaining_time": "1:17:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 332, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.201896806173394e-05, "epoch": 0.23306423306423307, "percentage": 23.31, "elapsed_time": "0:23:23", "remaining_time": "1:16:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 333, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.2040737225105335e-05, "epoch": 0.23376623376623376, "percentage": 23.38, "elapsed_time": "0:23:27", "remaining_time": "1:16:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 334, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.206244111352608e-05, "epoch": 0.23446823446823448, "percentage": 23.46, "elapsed_time": "0:23:31", "remaining_time": "1:16:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 335, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.2084080117280756e-05, "epoch": 0.23517023517023516, "percentage": 23.53, "elapsed_time": "0:23:35", "remaining_time": "1:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 336, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.210565462316407e-05, "epoch": 0.23587223587223588, "percentage": 23.6, "elapsed_time": "0:23:42", "remaining_time": "1:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 337, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.2127165014522315e-05, "epoch": 0.23657423657423657, "percentage": 23.67, "elapsed_time": "0:23:46", "remaining_time": "1:16:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 338, "total_steps": 1424, "loss": 0.0012, "accuracy": 1.0, "learning_rate": 4.214861167129425e-05, "epoch": 0.23727623727623728, "percentage": 23.74, "elapsed_time": "0:23:50", "remaining_time": "1:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 339, "total_steps": 1424, "loss": 0.0007, "accuracy": 1.0, "learning_rate": 4.2169994970051365e-05, "epoch": 0.23797823797823797, "percentage": 23.81, "elapsed_time": "0:23:54", "remaining_time": "1:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.219131528403759e-05, "epoch": 0.2386802386802387, "percentage": 23.88, "elapsed_time": "0:23:58", "remaining_time": "1:16:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 341, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.22125729832083e-05, "epoch": 0.23938223938223938, "percentage": 23.95, "elapsed_time": "0:24:02", "remaining_time": "1:16:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 342, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.2233768434268914e-05, "epoch": 0.2400842400842401, "percentage": 24.02, "elapsed_time": "0:24:07", "remaining_time": "1:16:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 343, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.225490200071284e-05, "epoch": 0.24078624078624078, "percentage": 24.09, "elapsed_time": "0:24:11", "remaining_time": "1:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 344, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.227597404285883e-05, "epoch": 0.2414882414882415, "percentage": 24.16, "elapsed_time": "0:24:15", "remaining_time": "1:16:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 345, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.229698491788791e-05, "epoch": 0.24219024219024218, "percentage": 24.23, "elapsed_time": "0:24:19", "remaining_time": "1:16:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 346, "total_steps": 1424, "loss": 0.0023, "accuracy": 1.0, "learning_rate": 4.231793497987961e-05, "epoch": 0.2428922428922429, "percentage": 24.3, "elapsed_time": "0:24:23", "remaining_time": "1:16:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 347, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.2338824579847904e-05, "epoch": 0.2435942435942436, "percentage": 24.37, "elapsed_time": "0:24:27", "remaining_time": "1:15:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 348, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.235965406577636e-05, "epoch": 0.2442962442962443, "percentage": 24.44, "elapsed_time": "0:24:31", "remaining_time": "1:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 349, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.2380423782653e-05, "epoch": 0.244998244998245, "percentage": 24.51, "elapsed_time": "0:24:36", "remaining_time": "1:15:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 1424, "loss": 0.0018, "accuracy": 1.0, "learning_rate": 4.240113407250459e-05, "epoch": 0.2457002457002457, "percentage": 24.58, "elapsed_time": "0:24:40", "remaining_time": "1:15:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 351, "total_steps": 1424, "loss": 0.0007, "accuracy": 1.0, "learning_rate": 4.24217852744304e-05, "epoch": 0.2464022464022464, "percentage": 24.65, "elapsed_time": "0:24:44", "remaining_time": "1:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 352, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.244237772463552e-05, "epoch": 0.2471042471042471, "percentage": 24.72, "elapsed_time": "0:24:48", "remaining_time": "1:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 353, "total_steps": 1424, "loss": 0.0017, "accuracy": 1.0, "learning_rate": 4.246291175646371e-05, "epoch": 0.2478062478062478, "percentage": 24.79, "elapsed_time": "0:24:52", "remaining_time": "1:15:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 354, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.24833877004298e-05, "epoch": 0.2485082485082485, "percentage": 24.86, "elapsed_time": "0:24:56", "remaining_time": "1:15:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 355, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.250380588425157e-05, "epoch": 0.2492102492102492, "percentage": 24.93, "elapsed_time": "0:25:00", "remaining_time": "1:15:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 356, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.2524166632881255e-05, "epoch": 0.24991224991224992, "percentage": 25.0, "elapsed_time": "0:25:05", "remaining_time": "1:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 357, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.254447026853656e-05, "epoch": 0.25061425061425063, "percentage": 25.07, "elapsed_time": "0:25:09", "remaining_time": "1:15:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 358, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.2564717110731244e-05, "epoch": 0.2513162513162513, "percentage": 25.14, "elapsed_time": "0:25:13", "remaining_time": "1:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 359, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.258490747630532e-05, "epoch": 0.252018252018252, "percentage": 25.21, "elapsed_time": "0:25:17", "remaining_time": "1:15:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.260504167945479e-05, "epoch": 0.2527202527202527, "percentage": 25.28, "elapsed_time": "0:25:21", "remaining_time": "1:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 361, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.2625120031760965e-05, "epoch": 0.25342225342225344, "percentage": 25.35, "elapsed_time": "0:25:25", "remaining_time": "1:14:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 362, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.264514284221944e-05, "epoch": 0.2541242541242541, "percentage": 25.42, "elapsed_time": "0:25:29", "remaining_time": "1:14:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 363, "total_steps": 1424, "loss": 0.0007, "accuracy": 1.0, "learning_rate": 4.266511041726854e-05, "epoch": 0.2548262548262548, "percentage": 25.49, "elapsed_time": "0:25:34", "remaining_time": "1:14:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 364, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.26850230608176e-05, "epoch": 0.25552825552825553, "percentage": 25.56, "elapsed_time": "0:25:38", "remaining_time": "1:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 365, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.2704881074274584e-05, "epoch": 0.25623025623025625, "percentage": 25.63, "elapsed_time": "0:25:42", "remaining_time": "1:14:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 366, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.272468475657351e-05, "epoch": 0.2569322569322569, "percentage": 25.7, "elapsed_time": "0:25:46", "remaining_time": "1:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 367, "total_steps": 1424, "loss": 0.0018, "accuracy": 1.0, "learning_rate": 4.2744434404201497e-05, "epoch": 0.2576342576342576, "percentage": 25.77, "elapsed_time": "0:25:50", "remaining_time": "1:14:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 368, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.27641303112253e-05, "epoch": 0.25833625833625834, "percentage": 25.84, "elapsed_time": "0:25:54", "remaining_time": "1:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 369, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.278377276931767e-05, "epoch": 0.25903825903825906, "percentage": 25.91, "elapsed_time": "0:25:58", "remaining_time": "1:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.2803362067783256e-05, "epoch": 0.2597402597402597, "percentage": 25.98, "elapsed_time": "0:26:03", "remaining_time": "1:14:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 371, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.2822898493584104e-05, "epoch": 0.26044226044226043, "percentage": 26.05, "elapsed_time": "0:26:07", "remaining_time": "1:14:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 372, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.284238233136496e-05, "epoch": 0.26114426114426115, "percentage": 26.12, "elapsed_time": "0:26:11", "remaining_time": "1:14:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 373, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.286181386347813e-05, "epoch": 0.26184626184626186, "percentage": 26.19, "elapsed_time": "0:26:15", "remaining_time": "1:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 374, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.288119337000801e-05, "epoch": 0.2625482625482625, "percentage": 26.26, "elapsed_time": "0:26:19", "remaining_time": "1:13:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 375, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.2900521128795315e-05, "epoch": 0.26325026325026324, "percentage": 26.33, "elapsed_time": "0:26:23", "remaining_time": "1:13:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 376, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.291979741546102e-05, "epoch": 0.26395226395226395, "percentage": 26.4, "elapsed_time": "0:26:27", "remaining_time": "1:13:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 377, "total_steps": 1424, "loss": 0.0666, "accuracy": 1.0, "learning_rate": 4.293902250342989e-05, "epoch": 0.26465426465426467, "percentage": 26.47, "elapsed_time": "0:26:32", "remaining_time": "1:13:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 378, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.295819666395376e-05, "epoch": 0.26535626535626533, "percentage": 26.54, "elapsed_time": "0:26:36", "remaining_time": "1:13:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 379, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.297732016613454e-05, "epoch": 0.26605826605826605, "percentage": 26.62, "elapsed_time": "0:26:40", "remaining_time": "1:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.299639327694684e-05, "epoch": 0.26676026676026676, "percentage": 26.69, "elapsed_time": "0:26:44", "remaining_time": "1:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 381, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.3015416261260325e-05, "epoch": 0.2674622674622675, "percentage": 26.76, "elapsed_time": "0:26:48", "remaining_time": "1:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 382, "total_steps": 1424, "loss": 0.0012, "accuracy": 1.0, "learning_rate": 4.303438938186182e-05, "epoch": 0.26816426816426814, "percentage": 26.83, "elapsed_time": "0:26:52", "remaining_time": "1:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 383, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.305331289947705e-05, "epoch": 0.26886626886626885, "percentage": 26.9, "elapsed_time": "0:26:57", "remaining_time": "1:13:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 384, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.3072187072792184e-05, "epoch": 0.26956826956826957, "percentage": 26.97, "elapsed_time": "0:27:01", "remaining_time": "1:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 385, "total_steps": 1424, "loss": 0.001, "accuracy": 1.0, "learning_rate": 4.309101215847502e-05, "epoch": 0.2702702702702703, "percentage": 27.04, "elapsed_time": "0:27:05", "remaining_time": "1:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 386, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.3109788411195924e-05, "epoch": 0.27097227097227095, "percentage": 27.11, "elapsed_time": "0:27:09", "remaining_time": "1:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 387, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.312851608364853e-05, "epoch": 0.27167427167427166, "percentage": 27.18, "elapsed_time": "0:27:13", "remaining_time": "1:12:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 388, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.314719542657013e-05, "epoch": 0.2723762723762724, "percentage": 27.25, "elapsed_time": "0:27:17", "remaining_time": "1:12:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 389, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.3165826688761796e-05, "epoch": 0.2730782730782731, "percentage": 27.32, "elapsed_time": "0:27:21", "remaining_time": "1:12:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.318441011710833e-05, "epoch": 0.27378027378027375, "percentage": 27.39, "elapsed_time": "0:27:26", "remaining_time": "1:12:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 391, "total_steps": 1424, "loss": 0.0012, "accuracy": 1.0, "learning_rate": 4.3202945956597786e-05, "epoch": 0.27448227448227447, "percentage": 27.46, "elapsed_time": "0:27:30", "remaining_time": "1:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 392, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.3221434450340956e-05, "epoch": 0.2751842751842752, "percentage": 27.53, "elapsed_time": "0:27:34", "remaining_time": "1:12:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 393, "total_steps": 1424, "loss": 0.001, "accuracy": 1.0, "learning_rate": 4.323987583959045e-05, "epoch": 0.2758862758862759, "percentage": 27.6, "elapsed_time": "0:27:38", "remaining_time": "1:12:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 394, "total_steps": 1424, "loss": 0.0011, "accuracy": 1.0, "learning_rate": 4.325827036375957e-05, "epoch": 0.2765882765882766, "percentage": 27.67, "elapsed_time": "0:27:42", "remaining_time": "1:12:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 395, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.327661826044101e-05, "epoch": 0.2772902772902773, "percentage": 27.74, "elapsed_time": "0:27:46", "remaining_time": "1:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 396, "total_steps": 1424, "loss": 0.0007, "accuracy": 1.0, "learning_rate": 4.329491976542521e-05, "epoch": 0.277992277992278, "percentage": 27.81, "elapsed_time": "0:27:50", "remaining_time": "1:12:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 397, "total_steps": 1424, "loss": 0.0011, "accuracy": 1.0, "learning_rate": 4.331317511271859e-05, "epoch": 0.2786942786942787, "percentage": 27.88, "elapsed_time": "0:27:55", "remaining_time": "1:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 398, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.333138453456147e-05, "epoch": 0.2793962793962794, "percentage": 27.95, "elapsed_time": "0:27:59", "remaining_time": "1:12:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 399, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.334954826144581e-05, "epoch": 0.2800982800982801, "percentage": 28.02, "elapsed_time": "0:28:03", "remaining_time": "1:12:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.336766652213271e-05, "epoch": 0.2808002808002808, "percentage": 28.09, "elapsed_time": "0:28:07", "remaining_time": "1:11:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 401, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.338573954366971e-05, "epoch": 0.2815022815022815, "percentage": 28.16, "elapsed_time": "0:28:17", "remaining_time": "1:12:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 402, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.340376755140784e-05, "epoch": 0.28220428220428223, "percentage": 28.23, "elapsed_time": "0:28:21", "remaining_time": "1:12:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 403, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.342175076901849e-05, "epoch": 0.2829062829062829, "percentage": 28.3, "elapsed_time": "0:28:26", "remaining_time": "1:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 404, "total_steps": 1424, "loss": 0.0566, "accuracy": 1.0, "learning_rate": 4.343968941851009e-05, "epoch": 0.2836082836082836, "percentage": 28.37, "elapsed_time": "0:28:30", "remaining_time": "1:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 405, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.345758372024448e-05, "epoch": 0.2843102843102843, "percentage": 28.44, "elapsed_time": "0:28:34", "remaining_time": "1:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 406, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.347543389295324e-05, "epoch": 0.28501228501228504, "percentage": 28.51, "elapsed_time": "0:28:38", "remaining_time": "1:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 407, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.3493240153753666e-05, "epoch": 0.2857142857142857, "percentage": 28.58, "elapsed_time": "0:28:42", "remaining_time": "1:11:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 408, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.3511002718164666e-05, "epoch": 0.2864162864162864, "percentage": 28.65, "elapsed_time": "0:28:46", "remaining_time": "1:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 409, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.352872180012237e-05, "epoch": 0.28711828711828713, "percentage": 28.72, "elapsed_time": "0:28:50", "remaining_time": "1:11:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 1424, "loss": 0.0014, "accuracy": 1.0, "learning_rate": 4.35463976119956e-05, "epoch": 0.28782028782028785, "percentage": 28.79, "elapsed_time": "0:28:55", "remaining_time": "1:11:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 411, "total_steps": 1424, "loss": 0.0167, "accuracy": 1.0, "learning_rate": 4.356403036460115e-05, "epoch": 0.2885222885222885, "percentage": 28.86, "elapsed_time": "0:28:59", "remaining_time": "1:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 412, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.3581620267218916e-05, "epoch": 0.2892242892242892, "percentage": 28.93, "elapsed_time": "0:29:03", "remaining_time": "1:11:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 413, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.359916752760669e-05, "epoch": 0.28992628992628994, "percentage": 29.0, "elapsed_time": "0:29:07", "remaining_time": "1:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 414, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.361667235201499e-05, "epoch": 0.29062829062829065, "percentage": 29.07, "elapsed_time": "0:29:11", "remaining_time": "1:11:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 415, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.363413494520154e-05, "epoch": 0.2913302913302913, "percentage": 29.14, "elapsed_time": "0:29:15", "remaining_time": "1:11:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 416, "total_steps": 1424, "loss": 0.0007, "accuracy": 1.0, "learning_rate": 4.365155551044572e-05, "epoch": 0.29203229203229203, "percentage": 29.21, "elapsed_time": "0:29:20", "remaining_time": "1:11:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 417, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.366893424956263e-05, "epoch": 0.29273429273429274, "percentage": 29.28, "elapsed_time": "0:29:24", "remaining_time": "1:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 418, "total_steps": 1424, "loss": 0.0161, "accuracy": 1.0, "learning_rate": 4.368627136291726e-05, "epoch": 0.29343629343629346, "percentage": 29.35, "elapsed_time": "0:29:28", "remaining_time": "1:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 419, "total_steps": 1424, "loss": 0.0016, "accuracy": 1.0, "learning_rate": 4.370356704943825e-05, "epoch": 0.2941382941382941, "percentage": 29.42, "elapsed_time": "0:29:32", "remaining_time": "1:10:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 1424, "loss": 0.0028, "accuracy": 1.0, "learning_rate": 4.372082150663168e-05, "epoch": 0.29484029484029484, "percentage": 29.49, "elapsed_time": "0:29:36", "remaining_time": "1:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 421, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.3738034930594475e-05, "epoch": 0.29554229554229555, "percentage": 29.56, "elapsed_time": "0:29:40", "remaining_time": "1:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 422, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.3755207516027904e-05, "epoch": 0.29624429624429627, "percentage": 29.63, "elapsed_time": "0:29:44", "remaining_time": "1:10:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 423, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.377233945625071e-05, "epoch": 0.29694629694629693, "percentage": 29.71, "elapsed_time": "0:29:48", "remaining_time": "1:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 424, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.378943094321221e-05, "epoch": 0.29764829764829764, "percentage": 29.78, "elapsed_time": "0:29:53", "remaining_time": "1:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 425, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.3806482167505196e-05, "epoch": 0.29835029835029836, "percentage": 29.85, "elapsed_time": "0:29:57", "remaining_time": "1:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 426, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.382349331837866e-05, "epoch": 0.2990522990522991, "percentage": 29.92, "elapsed_time": "0:30:01", "remaining_time": "1:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 427, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.3840464583750404e-05, "epoch": 0.29975429975429974, "percentage": 29.99, "elapsed_time": "0:30:05", "remaining_time": "1:10:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 428, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.385739615021954e-05, "epoch": 0.30045630045630045, "percentage": 30.06, "elapsed_time": "0:30:09", "remaining_time": "1:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 429, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.387428820307874e-05, "epoch": 0.30115830115830117, "percentage": 30.13, "elapsed_time": "0:30:13", "remaining_time": "1:10:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.3891140926326446e-05, "epoch": 0.3018603018603019, "percentage": 30.2, "elapsed_time": "0:30:17", "remaining_time": "1:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 431, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.390795450267886e-05, "epoch": 0.30256230256230254, "percentage": 30.27, "elapsed_time": "0:30:22", "remaining_time": "1:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 432, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.3924729113581876e-05, "epoch": 0.30326430326430326, "percentage": 30.34, "elapsed_time": "0:30:26", "remaining_time": "1:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 433, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.394146493922276e-05, "epoch": 0.303966303966304, "percentage": 30.41, "elapsed_time": "0:30:30", "remaining_time": "1:09:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 434, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.395816215854185e-05, "epoch": 0.3046683046683047, "percentage": 30.48, "elapsed_time": "0:30:34", "remaining_time": "1:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 435, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.397482094924396e-05, "epoch": 0.30537030537030535, "percentage": 30.55, "elapsed_time": "0:30:38", "remaining_time": "1:09:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 436, "total_steps": 1424, "loss": 0.0014, "accuracy": 1.0, "learning_rate": 4.399144148780977e-05, "epoch": 0.30607230607230607, "percentage": 30.62, "elapsed_time": "0:30:42", "remaining_time": "1:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 437, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.400802394950703e-05, "epoch": 0.3067743067743068, "percentage": 30.69, "elapsed_time": "0:30:46", "remaining_time": "1:09:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 438, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.402456850840166e-05, "epoch": 0.3074763074763075, "percentage": 30.76, "elapsed_time": "0:30:50", "remaining_time": "1:09:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 439, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.4041075337368695e-05, "epoch": 0.30817830817830816, "percentage": 30.83, "elapsed_time": "0:30:55", "remaining_time": "1:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 1424, "loss": 0.0011, "accuracy": 1.0, "learning_rate": 4.405754460810312e-05, "epoch": 0.3088803088803089, "percentage": 30.9, "elapsed_time": "0:30:59", "remaining_time": "1:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 441, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.407397649113065e-05, "epoch": 0.3095823095823096, "percentage": 30.97, "elapsed_time": "0:31:03", "remaining_time": "1:09:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 442, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.40903711558182e-05, "epoch": 0.3102843102843103, "percentage": 31.04, "elapsed_time": "0:31:07", "remaining_time": "1:09:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 443, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.41067287703845e-05, "epoch": 0.31098631098631097, "percentage": 31.11, "elapsed_time": "0:31:11", "remaining_time": "1:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 444, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.412304950191033e-05, "epoch": 0.3116883116883117, "percentage": 31.18, "elapsed_time": "0:31:15", "remaining_time": "1:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 445, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.413933351634886e-05, "epoch": 0.3123903123903124, "percentage": 31.25, "elapsed_time": "0:31:19", "remaining_time": "1:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 446, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.4155580978535707e-05, "epoch": 0.3130923130923131, "percentage": 31.32, "elapsed_time": "0:31:24", "remaining_time": "1:08:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 447, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.417179205219895e-05, "epoch": 0.3137943137943138, "percentage": 31.39, "elapsed_time": "0:31:28", "remaining_time": "1:08:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 448, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.418796689996907e-05, "epoch": 0.3144963144963145, "percentage": 31.46, "elapsed_time": "0:31:32", "remaining_time": "1:08:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 449, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.420410568338872e-05, "epoch": 0.3151983151983152, "percentage": 31.53, "elapsed_time": "0:31:36", "remaining_time": "1:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.42202085629224e-05, "epoch": 0.3159003159003159, "percentage": 31.6, "elapsed_time": "0:31:40", "remaining_time": "1:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 451, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.423627569796601e-05, "epoch": 0.3166023166023166, "percentage": 31.67, "elapsed_time": "0:31:44", "remaining_time": "1:08:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 452, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.425230724685638e-05, "epoch": 0.3173043173043173, "percentage": 31.74, "elapsed_time": "0:31:48", "remaining_time": "1:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 453, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.4268303366880536e-05, "epoch": 0.318006318006318, "percentage": 31.81, "elapsed_time": "0:31:52", "remaining_time": "1:08:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 454, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.428426421428507e-05, "epoch": 0.3187083187083187, "percentage": 31.88, "elapsed_time": "0:31:57", "remaining_time": "1:08:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 455, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.430018994428521e-05, "epoch": 0.3194103194103194, "percentage": 31.95, "elapsed_time": "0:32:01", "remaining_time": "1:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 456, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.431608071107392e-05, "epoch": 0.3201123201123201, "percentage": 32.02, "elapsed_time": "0:32:05", "remaining_time": "1:08:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 457, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.433193666783084e-05, "epoch": 0.3208143208143208, "percentage": 32.09, "elapsed_time": "0:32:09", "remaining_time": "1:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 458, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.4347757966731156e-05, "epoch": 0.32151632151632153, "percentage": 32.16, "elapsed_time": "0:32:13", "remaining_time": "1:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 459, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.436354475895436e-05, "epoch": 0.3222183222183222, "percentage": 32.23, "elapsed_time": "0:32:17", "remaining_time": "1:07:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.437929719469291e-05, "epoch": 0.3229203229203229, "percentage": 32.3, "elapsed_time": "0:32:22", "remaining_time": "1:07:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 461, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.4395015423160807e-05, "epoch": 0.3236223236223236, "percentage": 32.37, "elapsed_time": "0:32:26", "remaining_time": "1:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 462, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.4410699592602094e-05, "epoch": 0.32432432432432434, "percentage": 32.44, "elapsed_time": "0:32:30", "remaining_time": "1:07:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 463, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.442634985029922e-05, "epoch": 0.325026325026325, "percentage": 32.51, "elapsed_time": "0:32:34", "remaining_time": "1:07:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 464, "total_steps": 1424, "loss": 0.0007, "accuracy": 1.0, "learning_rate": 4.444196634258136e-05, "epoch": 0.3257283257283257, "percentage": 32.58, "elapsed_time": "0:32:38", "remaining_time": "1:07:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 465, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.4457549214832566e-05, "epoch": 0.32643032643032643, "percentage": 32.65, "elapsed_time": "0:32:42", "remaining_time": "1:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 466, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.44730986115e-05, "epoch": 0.32713232713232715, "percentage": 32.72, "elapsed_time": "0:32:46", "remaining_time": "1:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 467, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.448861467610187e-05, "epoch": 0.3278343278343278, "percentage": 32.79, "elapsed_time": "0:32:51", "remaining_time": "1:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 468, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.4504097551235406e-05, "epoch": 0.3285363285363285, "percentage": 32.87, "elapsed_time": "0:32:55", "remaining_time": "1:07:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 469, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.4519547378584725e-05, "epoch": 0.32923832923832924, "percentage": 32.94, "elapsed_time": "0:32:59", "remaining_time": "1:07:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.453496429892863e-05, "epoch": 0.32994032994032996, "percentage": 33.01, "elapsed_time": "0:33:03", "remaining_time": "1:07:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 471, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.455034845214827e-05, "epoch": 0.3306423306423306, "percentage": 33.08, "elapsed_time": "0:33:07", "remaining_time": "1:07:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 472, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.4565699977234796e-05, "epoch": 0.33134433134433133, "percentage": 33.15, "elapsed_time": "0:33:11", "remaining_time": "1:06:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 473, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.458101901229686e-05, "epoch": 0.33204633204633205, "percentage": 33.22, "elapsed_time": "0:33:16", "remaining_time": "1:06:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 474, "total_steps": 1424, "loss": 0.0176, "accuracy": 1.0, "learning_rate": 4.459630569456809e-05, "epoch": 0.33274833274833276, "percentage": 33.29, "elapsed_time": "0:33:20", "remaining_time": "1:06:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 475, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.461156016041444e-05, "epoch": 0.3334503334503334, "percentage": 33.36, "elapsed_time": "0:33:24", "remaining_time": "1:06:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 476, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.462678254534156e-05, "epoch": 0.33415233415233414, "percentage": 33.43, "elapsed_time": "0:33:28", "remaining_time": "1:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 477, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.464197298400191e-05, "epoch": 0.33485433485433486, "percentage": 33.5, "elapsed_time": "0:33:32", "remaining_time": "1:06:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 478, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.4657131610201994e-05, "epoch": 0.33555633555633557, "percentage": 33.57, "elapsed_time": "0:33:36", "remaining_time": "1:06:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 479, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.467225855690939e-05, "epoch": 0.33625833625833623, "percentage": 33.64, "elapsed_time": "0:33:40", "remaining_time": "1:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.468735395625979e-05, "epoch": 0.33696033696033695, "percentage": 33.71, "elapsed_time": "0:33:45", "remaining_time": "1:06:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 481, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.470241793956387e-05, "epoch": 0.33766233766233766, "percentage": 33.78, "elapsed_time": "0:33:49", "remaining_time": "1:06:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 482, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.471745063731416e-05, "epoch": 0.3383643383643384, "percentage": 33.85, "elapsed_time": "0:33:53", "remaining_time": "1:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 483, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.473245217919187e-05, "epoch": 0.33906633906633904, "percentage": 33.92, "elapsed_time": "0:33:57", "remaining_time": "1:06:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 484, "total_steps": 1424, "loss": 0.0016, "accuracy": 1.0, "learning_rate": 4.474742269407355e-05, "epoch": 0.33976833976833976, "percentage": 33.99, "elapsed_time": "0:34:01", "remaining_time": "1:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 485, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.476236231003773e-05, "epoch": 0.34047034047034047, "percentage": 34.06, "elapsed_time": "0:34:05", "remaining_time": "1:06:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 486, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.477727115437156e-05, "epoch": 0.3411723411723412, "percentage": 34.13, "elapsed_time": "0:34:09", "remaining_time": "1:05:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 487, "total_steps": 1424, "loss": 0.0014, "accuracy": 1.0, "learning_rate": 4.479214935357724e-05, "epoch": 0.34187434187434185, "percentage": 34.2, "elapsed_time": "0:34:14", "remaining_time": "1:05:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 488, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.480699703337852e-05, "epoch": 0.34257634257634256, "percentage": 34.27, "elapsed_time": "0:34:18", "remaining_time": "1:05:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 489, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.4821814318727016e-05, "epoch": 0.3432783432783433, "percentage": 34.34, "elapsed_time": "0:34:22", "remaining_time": "1:05:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.483660133380856e-05, "epoch": 0.343980343980344, "percentage": 34.41, "elapsed_time": "0:34:26", "remaining_time": "1:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 491, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.485135820204948e-05, "epoch": 0.34468234468234465, "percentage": 34.48, "elapsed_time": "0:34:30", "remaining_time": "1:05:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 492, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.486608504612267e-05, "epoch": 0.34538434538434537, "percentage": 34.55, "elapsed_time": "0:34:34", "remaining_time": "1:05:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 493, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.488078198795383e-05, "epoch": 0.3460863460863461, "percentage": 34.62, "elapsed_time": "0:34:39", "remaining_time": "1:05:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 494, "total_steps": 1424, "loss": 0.001, "accuracy": 1.0, "learning_rate": 4.489544914872745e-05, "epoch": 0.3467883467883468, "percentage": 34.69, "elapsed_time": "0:34:43", "remaining_time": "1:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 495, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.4910086648892815e-05, "epoch": 0.3474903474903475, "percentage": 34.76, "elapsed_time": "0:34:47", "remaining_time": "1:05:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 496, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.4924694608169965e-05, "epoch": 0.3481923481923482, "percentage": 34.83, "elapsed_time": "0:34:51", "remaining_time": "1:05:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 497, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.4939273145555536e-05, "epoch": 0.3488943488943489, "percentage": 34.9, "elapsed_time": "0:34:55", "remaining_time": "1:05:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 498, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.495382237932863e-05, "epoch": 0.3495963495963496, "percentage": 34.97, "elapsed_time": "0:34:59", "remaining_time": "1:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 499, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.4968342427056505e-05, "epoch": 0.3502983502983503, "percentage": 35.04, "elapsed_time": "0:35:03", "remaining_time": "1:05:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.498283340560031e-05, "epoch": 0.351000351000351, "percentage": 35.11, "elapsed_time": "0:35:08", "remaining_time": "1:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 501, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.499729543112076e-05, "epoch": 0.3517023517023517, "percentage": 35.18, "elapsed_time": "0:35:20", "remaining_time": "1:05:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 502, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.501172861908366e-05, "epoch": 0.3524043524043524, "percentage": 35.25, "elapsed_time": "0:35:24", "remaining_time": "1:05:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 503, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.502613308426546e-05, "epoch": 0.35310635310635313, "percentage": 35.32, "elapsed_time": "0:35:28", "remaining_time": "1:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 504, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.504050894075876e-05, "epoch": 0.3538083538083538, "percentage": 35.39, "elapsed_time": "0:35:33", "remaining_time": "1:04:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 505, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.5054856301977696e-05, "epoch": 0.3545103545103545, "percentage": 35.46, "elapsed_time": "0:35:37", "remaining_time": "1:04:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 506, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.506917528066332e-05, "epoch": 0.3552123552123552, "percentage": 35.53, "elapsed_time": "0:35:41", "remaining_time": "1:04:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 507, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.508346598888894e-05, "epoch": 0.35591435591435594, "percentage": 35.6, "elapsed_time": "0:35:45", "remaining_time": "1:04:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 508, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.509772853806532e-05, "epoch": 0.3566163566163566, "percentage": 35.67, "elapsed_time": "0:35:49", "remaining_time": "1:04:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 509, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.511196303894598e-05, "epoch": 0.3573183573183573, "percentage": 35.74, "elapsed_time": "0:35:53", "remaining_time": "1:04:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.512616960163227e-05, "epoch": 0.35802035802035803, "percentage": 35.81, "elapsed_time": "0:35:57", "remaining_time": "1:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 511, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.5140348335578547e-05, "epoch": 0.35872235872235875, "percentage": 35.88, "elapsed_time": "0:36:02", "remaining_time": "1:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 512, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.515449934959718e-05, "epoch": 0.3594243594243594, "percentage": 35.96, "elapsed_time": "0:36:06", "remaining_time": "1:04:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 513, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.516862275186361e-05, "epoch": 0.3601263601263601, "percentage": 36.03, "elapsed_time": "0:36:10", "remaining_time": "1:04:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 514, "total_steps": 1424, "loss": 0.0035, "accuracy": 1.0, "learning_rate": 4.518271864992127e-05, "epoch": 0.36082836082836084, "percentage": 36.1, "elapsed_time": "0:36:14", "remaining_time": "1:04:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 515, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.519678715068652e-05, "epoch": 0.36153036153036155, "percentage": 36.17, "elapsed_time": "0:36:18", "remaining_time": "1:04:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 516, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.521082836045353e-05, "epoch": 0.3622323622323622, "percentage": 36.24, "elapsed_time": "0:36:22", "remaining_time": "1:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 517, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.5224842384899045e-05, "epoch": 0.36293436293436293, "percentage": 36.31, "elapsed_time": "0:36:26", "remaining_time": "1:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 518, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.523882932908722e-05, "epoch": 0.36363636363636365, "percentage": 36.38, "elapsed_time": "0:36:31", "remaining_time": "1:03:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 519, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.52527892974743e-05, "epoch": 0.36433836433836436, "percentage": 36.45, "elapsed_time": "0:36:35", "remaining_time": "1:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.526672239391333e-05, "epoch": 0.365040365040365, "percentage": 36.52, "elapsed_time": "0:36:39", "remaining_time": "1:03:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 521, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.528062872165875e-05, "epoch": 0.36574236574236574, "percentage": 36.59, "elapsed_time": "0:36:43", "remaining_time": "1:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 522, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.529450838337104e-05, "epoch": 0.36644436644436645, "percentage": 36.66, "elapsed_time": "0:36:47", "remaining_time": "1:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 523, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.530836148112124e-05, "epoch": 0.36714636714636717, "percentage": 36.73, "elapsed_time": "0:36:51", "remaining_time": "1:03:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 524, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.532218811639545e-05, "epoch": 0.36784836784836783, "percentage": 36.8, "elapsed_time": "0:36:56", "remaining_time": "1:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 525, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.5335988390099284e-05, "epoch": 0.36855036855036855, "percentage": 36.87, "elapsed_time": "0:37:00", "remaining_time": "1:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 526, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.534976240256232e-05, "epoch": 0.36925236925236926, "percentage": 36.94, "elapsed_time": "0:37:04", "remaining_time": "1:03:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 527, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.536351025354245e-05, "epoch": 0.36995436995437, "percentage": 37.01, "elapsed_time": "0:37:08", "remaining_time": "1:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 528, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.537723204223021e-05, "epoch": 0.37065637065637064, "percentage": 37.08, "elapsed_time": "0:37:12", "remaining_time": "1:03:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 529, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.53909278672531e-05, "epoch": 0.37135837135837135, "percentage": 37.15, "elapsed_time": "0:37:16", "remaining_time": "1:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.5404597826679824e-05, "epoch": 0.37206037206037207, "percentage": 37.22, "elapsed_time": "0:37:20", "remaining_time": "1:02:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 531, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.541824201802449e-05, "epoch": 0.3727623727623728, "percentage": 37.29, "elapsed_time": "0:37:25", "remaining_time": "1:02:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 532, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.543186053825081e-05, "epoch": 0.37346437346437344, "percentage": 37.36, "elapsed_time": "0:37:29", "remaining_time": "1:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 533, "total_steps": 1424, "loss": 0.002, "accuracy": 1.0, "learning_rate": 4.544545348377621e-05, "epoch": 0.37416637416637416, "percentage": 37.43, "elapsed_time": "0:37:33", "remaining_time": "1:02:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 534, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.5459020950475946e-05, "epoch": 0.3748683748683749, "percentage": 37.5, "elapsed_time": "0:37:37", "remaining_time": "1:02:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 535, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.5472563033687145e-05, "epoch": 0.3755703755703756, "percentage": 37.57, "elapsed_time": "0:37:41", "remaining_time": "1:02:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 536, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.548607982821284e-05, "epoch": 0.37627237627237625, "percentage": 37.64, "elapsed_time": "0:37:45", "remaining_time": "1:02:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 537, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.5499571428325935e-05, "epoch": 0.37697437697437697, "percentage": 37.71, "elapsed_time": "0:37:49", "remaining_time": "1:02:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 538, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.5513037927773155e-05, "epoch": 0.3776763776763777, "percentage": 37.78, "elapsed_time": "0:37:54", "remaining_time": "1:02:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 539, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.5526479419778986e-05, "epoch": 0.3783783783783784, "percentage": 37.85, "elapsed_time": "0:37:58", "remaining_time": "1:02:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.553989599704948e-05, "epoch": 0.37908037908037906, "percentage": 37.92, "elapsed_time": "0:38:02", "remaining_time": "1:02:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 541, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.555328775177616e-05, "epoch": 0.3797823797823798, "percentage": 37.99, "elapsed_time": "0:38:06", "remaining_time": "1:02:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 542, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.5566654775639785e-05, "epoch": 0.3804843804843805, "percentage": 38.06, "elapsed_time": "0:38:10", "remaining_time": "1:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 543, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.5579997159814117e-05, "epoch": 0.3811863811863812, "percentage": 38.13, "elapsed_time": "0:38:14", "remaining_time": "1:02:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 544, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.5593314994969665e-05, "epoch": 0.38188838188838187, "percentage": 38.2, "elapsed_time": "0:38:18", "remaining_time": "1:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 545, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.560660837127738e-05, "epoch": 0.3825903825903826, "percentage": 38.27, "elapsed_time": "0:38:23", "remaining_time": "1:01:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 546, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.561987737841229e-05, "epoch": 0.3832923832923833, "percentage": 38.34, "elapsed_time": "0:38:27", "remaining_time": "1:01:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 547, "total_steps": 1424, "loss": 0.0092, "accuracy": 1.0, "learning_rate": 4.563312210555719e-05, "epoch": 0.383994383994384, "percentage": 38.41, "elapsed_time": "0:38:31", "remaining_time": "1:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 548, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.564634264140616e-05, "epoch": 0.3846963846963847, "percentage": 38.48, "elapsed_time": "0:38:35", "remaining_time": "1:01:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 549, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.56595390741682e-05, "epoch": 0.3853983853983854, "percentage": 38.55, "elapsed_time": "0:38:39", "remaining_time": "1:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.567271149157073e-05, "epoch": 0.3861003861003861, "percentage": 38.62, "elapsed_time": "0:38:44", "remaining_time": "1:01:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 551, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.5685859980863086e-05, "epoch": 0.3868023868023868, "percentage": 38.69, "elapsed_time": "0:38:48", "remaining_time": "1:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 552, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.569898462881999e-05, "epoch": 0.3875043875043875, "percentage": 38.76, "elapsed_time": "0:38:52", "remaining_time": "1:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 553, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.571208552174497e-05, "epoch": 0.3882063882063882, "percentage": 38.83, "elapsed_time": "0:38:56", "remaining_time": "1:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 554, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.572516274547383e-05, "epoch": 0.3889083889083889, "percentage": 38.9, "elapsed_time": "0:39:00", "remaining_time": "1:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 555, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.573821638537794e-05, "epoch": 0.38961038961038963, "percentage": 38.97, "elapsed_time": "0:39:04", "remaining_time": "1:01:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 556, "total_steps": 1424, "loss": 0.0044, "accuracy": 1.0, "learning_rate": 4.575124652636763e-05, "epoch": 0.3903123903123903, "percentage": 39.04, "elapsed_time": "0:39:08", "remaining_time": "1:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 557, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.5764253252895486e-05, "epoch": 0.391014391014391, "percentage": 39.12, "elapsed_time": "0:39:12", "remaining_time": "1:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 558, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.577723664895965e-05, "epoch": 0.3917163917163917, "percentage": 39.19, "elapsed_time": "0:39:17", "remaining_time": "1:00:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 559, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.579019679810706e-05, "epoch": 0.39241839241839244, "percentage": 39.26, "elapsed_time": "0:39:21", "remaining_time": "1:00:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.5803133783436676e-05, "epoch": 0.3931203931203931, "percentage": 39.33, "elapsed_time": "0:39:25", "remaining_time": "1:00:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 561, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.581604768760269e-05, "epoch": 0.3938223938223938, "percentage": 39.4, "elapsed_time": "0:39:29", "remaining_time": "1:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 562, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.582893859281769e-05, "epoch": 0.39452439452439453, "percentage": 39.47, "elapsed_time": "0:39:33", "remaining_time": "1:00:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 563, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.584180658085578e-05, "epoch": 0.39522639522639524, "percentage": 39.54, "elapsed_time": "0:39:37", "remaining_time": "1:00:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 564, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.585465173305571e-05, "epoch": 0.3959283959283959, "percentage": 39.61, "elapsed_time": "0:39:42", "remaining_time": "1:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 565, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.5867474130323984e-05, "epoch": 0.3966303966303966, "percentage": 39.68, "elapsed_time": "0:39:46", "remaining_time": "1:00:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 566, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.588027385313786e-05, "epoch": 0.39733239733239734, "percentage": 39.75, "elapsed_time": "0:39:50", "remaining_time": "1:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 567, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.5893050981548446e-05, "epoch": 0.39803439803439805, "percentage": 39.82, "elapsed_time": "0:39:54", "remaining_time": "1:00:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 568, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.5905805595183656e-05, "epoch": 0.3987363987363987, "percentage": 39.89, "elapsed_time": "0:39:58", "remaining_time": "1:00:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 569, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.591853777325119e-05, "epoch": 0.3994383994383994, "percentage": 39.96, "elapsed_time": "0:40:02", "remaining_time": "1:00:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 570, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.593124759454153e-05, "epoch": 0.40014040014040014, "percentage": 40.03, "elapsed_time": "0:40:06", "remaining_time": "1:00:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 571, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.5943935137430806e-05, "epoch": 0.40084240084240086, "percentage": 40.1, "elapsed_time": "0:40:11", "remaining_time": "1:00:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 572, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.595660047988374e-05, "epoch": 0.4015444015444015, "percentage": 40.17, "elapsed_time": "0:40:15", "remaining_time": "0:59:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 573, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.59692436994565e-05, "epoch": 0.40224640224640223, "percentage": 40.24, "elapsed_time": "0:40:19", "remaining_time": "0:59:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 574, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.5981864873299563e-05, "epoch": 0.40294840294840295, "percentage": 40.31, "elapsed_time": "0:40:23", "remaining_time": "0:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 575, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.599446407816052e-05, "epoch": 0.40365040365040367, "percentage": 40.38, "elapsed_time": "0:40:27", "remaining_time": "0:59:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 576, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.6007041390386874e-05, "epoch": 0.4043524043524043, "percentage": 40.45, "elapsed_time": "0:40:31", "remaining_time": "0:59:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 577, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.601959688592886e-05, "epoch": 0.40505440505440504, "percentage": 40.52, "elapsed_time": "0:40:36", "remaining_time": "0:59:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 578, "total_steps": 1424, "loss": 0.0768, "accuracy": 1.0, "learning_rate": 4.603213064034216e-05, "epoch": 0.40575640575640576, "percentage": 40.59, "elapsed_time": "0:40:40", "remaining_time": "0:59:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 579, "total_steps": 1424, "loss": 0.0023, "accuracy": 1.0, "learning_rate": 4.604464272879061e-05, "epoch": 0.4064584064584065, "percentage": 40.66, "elapsed_time": "0:40:44", "remaining_time": "0:59:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 580, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.605713322604896e-05, "epoch": 0.40716040716040713, "percentage": 40.73, "elapsed_time": "0:40:48", "remaining_time": "0:59:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 581, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.606960220650551e-05, "epoch": 0.40786240786240785, "percentage": 40.8, "elapsed_time": "0:40:52", "remaining_time": "0:59:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 582, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.608204974416481e-05, "epoch": 0.40856440856440857, "percentage": 40.87, "elapsed_time": "0:40:56", "remaining_time": "0:59:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 583, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.6094475912650234e-05, "epoch": 0.4092664092664093, "percentage": 40.94, "elapsed_time": "0:41:00", "remaining_time": "0:59:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 584, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.610688078520666e-05, "epoch": 0.40996840996840994, "percentage": 41.01, "elapsed_time": "0:41:04", "remaining_time": "0:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 585, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.611926443470301e-05, "epoch": 0.41067041067041066, "percentage": 41.08, "elapsed_time": "0:41:09", "remaining_time": "0:59:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 586, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.6131626933634844e-05, "epoch": 0.4113724113724114, "percentage": 41.15, "elapsed_time": "0:41:13", "remaining_time": "0:58:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 587, "total_steps": 1424, "loss": 0.001, "accuracy": 1.0, "learning_rate": 4.6143968354126914e-05, "epoch": 0.4120744120744121, "percentage": 41.22, "elapsed_time": "0:41:17", "remaining_time": "0:58:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 588, "total_steps": 1424, "loss": 0.0014, "accuracy": 1.0, "learning_rate": 4.6156288767935646e-05, "epoch": 0.41277641277641275, "percentage": 41.29, "elapsed_time": "0:41:21", "remaining_time": "0:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 589, "total_steps": 1424, "loss": 0.0018, "accuracy": 1.0, "learning_rate": 4.61685882464517e-05, "epoch": 0.41347841347841346, "percentage": 41.36, "elapsed_time": "0:41:25", "remaining_time": "0:58:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 590, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.61808668607024e-05, "epoch": 0.4141804141804142, "percentage": 41.43, "elapsed_time": "0:41:29", "remaining_time": "0:58:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 591, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.619312468135426e-05, "epoch": 0.4148824148824149, "percentage": 41.5, "elapsed_time": "0:41:34", "remaining_time": "0:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 592, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.620536177871533e-05, "epoch": 0.4155844155844156, "percentage": 41.57, "elapsed_time": "0:41:38", "remaining_time": "0:58:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 593, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.621757822273772e-05, "epoch": 0.41628641628641627, "percentage": 41.64, "elapsed_time": "0:41:42", "remaining_time": "0:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 594, "total_steps": 1424, "loss": 0.0249, "accuracy": 1.0, "learning_rate": 4.62297740830199e-05, "epoch": 0.416988416988417, "percentage": 41.71, "elapsed_time": "0:41:46", "remaining_time": "0:58:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 595, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.6241949428809165e-05, "epoch": 0.4176904176904177, "percentage": 41.78, "elapsed_time": "0:41:50", "remaining_time": "0:58:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 596, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.625410432900395e-05, "epoch": 0.4183924183924184, "percentage": 41.85, "elapsed_time": "0:41:55", "remaining_time": "0:58:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 597, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.626623885215616e-05, "epoch": 0.4190944190944191, "percentage": 41.92, "elapsed_time": "0:41:59", "remaining_time": "0:58:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 598, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.627835306647352e-05, "epoch": 0.4197964197964198, "percentage": 41.99, "elapsed_time": "0:42:03", "remaining_time": "0:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 599, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.629044703982186e-05, "epoch": 0.4204984204984205, "percentage": 42.06, "elapsed_time": "0:42:07", "remaining_time": "0:58:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.63025208397274e-05, "epoch": 0.4212004212004212, "percentage": 42.13, "elapsed_time": "0:42:11", "remaining_time": "0:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 601, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.6314574533379e-05, "epoch": 0.4219024219024219, "percentage": 42.21, "elapsed_time": "0:42:23", "remaining_time": "0:58:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 602, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.632660818763041e-05, "epoch": 0.4226044226044226, "percentage": 42.28, "elapsed_time": "0:42:27", "remaining_time": "0:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 603, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.633862186900253e-05, "epoch": 0.4233064233064233, "percentage": 42.35, "elapsed_time": "0:42:31", "remaining_time": "0:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 604, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.6350615643685535e-05, "epoch": 0.42400842400842403, "percentage": 42.42, "elapsed_time": "0:42:35", "remaining_time": "0:57:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 605, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.6362589577541154e-05, "epoch": 0.4247104247104247, "percentage": 42.49, "elapsed_time": "0:42:39", "remaining_time": "0:57:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 606, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.637454373610477e-05, "epoch": 0.4254124254124254, "percentage": 42.56, "elapsed_time": "0:42:44", "remaining_time": "0:57:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 607, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.638647818458763e-05, "epoch": 0.4261144261144261, "percentage": 42.63, "elapsed_time": "0:42:48", "remaining_time": "0:57:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 608, "total_steps": 1424, "loss": 0.0046, "accuracy": 1.0, "learning_rate": 4.639839298787892e-05, "epoch": 0.42681642681642684, "percentage": 42.7, "elapsed_time": "0:42:52", "remaining_time": "0:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 609, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.641028821054793e-05, "epoch": 0.4275184275184275, "percentage": 42.77, "elapsed_time": "0:42:56", "remaining_time": "0:57:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 610, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.6422163916846124e-05, "epoch": 0.4282204282204282, "percentage": 42.84, "elapsed_time": "0:43:00", "remaining_time": "0:57:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 611, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.643402017070924e-05, "epoch": 0.42892242892242893, "percentage": 42.91, "elapsed_time": "0:43:04", "remaining_time": "0:57:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 612, "total_steps": 1424, "loss": 0.0059, "accuracy": 1.0, "learning_rate": 4.644585703575936e-05, "epoch": 0.42962442962442965, "percentage": 42.98, "elapsed_time": "0:43:08", "remaining_time": "0:57:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 613, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.645767457530692e-05, "epoch": 0.4303264303264303, "percentage": 43.05, "elapsed_time": "0:43:13", "remaining_time": "0:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 614, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.64694728523528e-05, "epoch": 0.431028431028431, "percentage": 43.12, "elapsed_time": "0:43:17", "remaining_time": "0:57:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 615, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.648125192959028e-05, "epoch": 0.43173043173043174, "percentage": 43.19, "elapsed_time": "0:43:21", "remaining_time": "0:57:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 616, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.649301186940709e-05, "epoch": 0.43243243243243246, "percentage": 43.26, "elapsed_time": "0:43:25", "remaining_time": "0:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 617, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.650475273388737e-05, "epoch": 0.4331344331344331, "percentage": 43.33, "elapsed_time": "0:43:29", "remaining_time": "0:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 618, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.651647458481359e-05, "epoch": 0.43383643383643383, "percentage": 43.4, "elapsed_time": "0:43:33", "remaining_time": "0:56:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 619, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.652817748366864e-05, "epoch": 0.43453843453843455, "percentage": 43.47, "elapsed_time": "0:43:38", "remaining_time": "0:56:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 620, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.653986149163757e-05, "epoch": 0.43524043524043526, "percentage": 43.54, "elapsed_time": "0:43:42", "remaining_time": "0:56:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 621, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.655152666960967e-05, "epoch": 0.4359424359424359, "percentage": 43.61, "elapsed_time": "0:43:46", "remaining_time": "0:56:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 622, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.6563173078180315e-05, "epoch": 0.43664443664443664, "percentage": 43.68, "elapsed_time": "0:43:50", "remaining_time": "0:56:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 623, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.657480077765283e-05, "epoch": 0.43734643734643736, "percentage": 43.75, "elapsed_time": "0:43:54", "remaining_time": "0:56:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 624, "total_steps": 1424, "loss": 0.0433, "accuracy": 1.0, "learning_rate": 4.6586409828040405e-05, "epoch": 0.43804843804843807, "percentage": 43.82, "elapsed_time": "0:43:58", "remaining_time": "0:56:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 625, "total_steps": 1424, "loss": 0.0027, "accuracy": 1.0, "learning_rate": 4.659800028906792e-05, "epoch": 0.43875043875043873, "percentage": 43.89, "elapsed_time": "0:44:02", "remaining_time": "0:56:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 626, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.660957222017383e-05, "epoch": 0.43945243945243945, "percentage": 43.96, "elapsed_time": "0:44:07", "remaining_time": "0:56:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 627, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.662112568051194e-05, "epoch": 0.44015444015444016, "percentage": 44.03, "elapsed_time": "0:44:11", "remaining_time": "0:56:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 628, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.663266072895327e-05, "epoch": 0.4408564408564409, "percentage": 44.1, "elapsed_time": "0:44:15", "remaining_time": "0:56:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 629, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.664417742408782e-05, "epoch": 0.44155844155844154, "percentage": 44.17, "elapsed_time": "0:44:19", "remaining_time": "0:56:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.665567582422637e-05, "epoch": 0.44226044226044225, "percentage": 44.24, "elapsed_time": "0:44:23", "remaining_time": "0:55:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 631, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.666715598740224e-05, "epoch": 0.44296244296244297, "percentage": 44.31, "elapsed_time": "0:44:27", "remaining_time": "0:55:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 632, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.667861797137309e-05, "epoch": 0.4436644436644437, "percentage": 44.38, "elapsed_time": "0:44:32", "remaining_time": "0:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 633, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.669006183362258e-05, "epoch": 0.44436644436644435, "percentage": 44.45, "elapsed_time": "0:44:36", "remaining_time": "0:55:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 634, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.670148763136221e-05, "epoch": 0.44506844506844506, "percentage": 44.52, "elapsed_time": "0:44:40", "remaining_time": "0:55:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 635, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.671289542153293e-05, "epoch": 0.4457704457704458, "percentage": 44.59, "elapsed_time": "0:44:44", "remaining_time": "0:55:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 636, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.672428526080691e-05, "epoch": 0.4464724464724465, "percentage": 44.66, "elapsed_time": "0:44:48", "remaining_time": "0:55:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 637, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.673565720558918e-05, "epoch": 0.44717444717444715, "percentage": 44.73, "elapsed_time": "0:44:52", "remaining_time": "0:55:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 638, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.6747011312019374e-05, "epoch": 0.44787644787644787, "percentage": 44.8, "elapsed_time": "0:44:57", "remaining_time": "0:55:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 639, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.6758347635973334e-05, "epoch": 0.4485784485784486, "percentage": 44.87, "elapsed_time": "0:45:01", "remaining_time": "0:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 640, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.676966623306479e-05, "epoch": 0.4492804492804493, "percentage": 44.94, "elapsed_time": "0:45:05", "remaining_time": "0:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 641, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.678096715864696e-05, "epoch": 0.44998244998244996, "percentage": 45.01, "elapsed_time": "0:45:09", "remaining_time": "0:55:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 642, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.679225046781422e-05, "epoch": 0.4506844506844507, "percentage": 45.08, "elapsed_time": "0:45:13", "remaining_time": "0:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 643, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.68035162154037e-05, "epoch": 0.4513864513864514, "percentage": 45.15, "elapsed_time": "0:45:17", "remaining_time": "0:55:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 644, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.681476445599687e-05, "epoch": 0.4520884520884521, "percentage": 45.22, "elapsed_time": "0:45:22", "remaining_time": "0:54:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 645, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.6825995243921137e-05, "epoch": 0.45279045279045277, "percentage": 45.29, "elapsed_time": "0:45:26", "remaining_time": "0:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 646, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.683720863325141e-05, "epoch": 0.4534924534924535, "percentage": 45.37, "elapsed_time": "0:45:30", "remaining_time": "0:54:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 647, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.684840467781168e-05, "epoch": 0.4541944541944542, "percentage": 45.44, "elapsed_time": "0:45:34", "remaining_time": "0:54:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 648, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.685958343117656e-05, "epoch": 0.4548964548964549, "percentage": 45.51, "elapsed_time": "0:45:38", "remaining_time": "0:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 649, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.6870744946672826e-05, "epoch": 0.4555984555984556, "percentage": 45.58, "elapsed_time": "0:45:42", "remaining_time": "0:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.688188927738093e-05, "epoch": 0.4563004563004563, "percentage": 45.65, "elapsed_time": "0:45:46", "remaining_time": "0:54:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 651, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.689301647613653e-05, "epoch": 0.457002457002457, "percentage": 45.72, "elapsed_time": "0:45:51", "remaining_time": "0:54:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 652, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.6904126595532014e-05, "epoch": 0.4577044577044577, "percentage": 45.79, "elapsed_time": "0:45:55", "remaining_time": "0:54:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 653, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.69152196879179e-05, "epoch": 0.4584064584064584, "percentage": 45.86, "elapsed_time": "0:45:59", "remaining_time": "0:54:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 654, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.692629580540446e-05, "epoch": 0.4591084591084591, "percentage": 45.93, "elapsed_time": "0:46:03", "remaining_time": "0:54:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 655, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.693735499986305e-05, "epoch": 0.4598104598104598, "percentage": 46.0, "elapsed_time": "0:46:07", "remaining_time": "0:54:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 656, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.694839732292767e-05, "epoch": 0.46051246051246053, "percentage": 46.07, "elapsed_time": "0:46:11", "remaining_time": "0:54:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 657, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.6959422825996345e-05, "epoch": 0.4612144612144612, "percentage": 46.14, "elapsed_time": "0:46:16", "remaining_time": "0:54:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 658, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.69704315602326e-05, "epoch": 0.4619164619164619, "percentage": 46.21, "elapsed_time": "0:46:20", "remaining_time": "0:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 659, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.698142357656684e-05, "epoch": 0.4626184626184626, "percentage": 46.28, "elapsed_time": "0:46:24", "remaining_time": "0:53:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 660, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.6992398925697814e-05, "epoch": 0.46332046332046334, "percentage": 46.35, "elapsed_time": "0:46:28", "remaining_time": "0:53:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 661, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.7003357658094e-05, "epoch": 0.464022464022464, "percentage": 46.42, "elapsed_time": "0:46:32", "remaining_time": "0:53:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 662, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.7014299823995005e-05, "epoch": 0.4647244647244647, "percentage": 46.49, "elapsed_time": "0:46:36", "remaining_time": "0:53:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 663, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.702522547341289e-05, "epoch": 0.46542646542646543, "percentage": 46.56, "elapsed_time": "0:46:41", "remaining_time": "0:53:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 664, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.703613465613363e-05, "epoch": 0.46612846612846615, "percentage": 46.63, "elapsed_time": "0:46:45", "remaining_time": "0:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 665, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.704702742171841e-05, "epoch": 0.4668304668304668, "percentage": 46.7, "elapsed_time": "0:46:49", "remaining_time": "0:53:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 666, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.7057903819505024e-05, "epoch": 0.4675324675324675, "percentage": 46.77, "elapsed_time": "0:46:53", "remaining_time": "0:53:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 667, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.7068763898609154e-05, "epoch": 0.46823446823446824, "percentage": 46.84, "elapsed_time": "0:46:57", "remaining_time": "0:53:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 668, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.707960770792576e-05, "epoch": 0.46893646893646895, "percentage": 46.91, "elapsed_time": "0:47:01", "remaining_time": "0:53:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 669, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.709043529613039e-05, "epoch": 0.4696384696384696, "percentage": 46.98, "elapsed_time": "0:47:05", "remaining_time": "0:53:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 670, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.710124671168044e-05, "epoch": 0.47034047034047033, "percentage": 47.05, "elapsed_time": "0:47:10", "remaining_time": "0:53:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 671, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.711204200281654e-05, "epoch": 0.47104247104247104, "percentage": 47.12, "elapsed_time": "0:47:14", "remaining_time": "0:53:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 672, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.712282121756376e-05, "epoch": 0.47174447174447176, "percentage": 47.19, "elapsed_time": "0:47:18", "remaining_time": "0:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 673, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.713358440373295e-05, "epoch": 0.4724464724464724, "percentage": 47.26, "elapsed_time": "0:47:22", "remaining_time": "0:52:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 674, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.7144331608922e-05, "epoch": 0.47314847314847314, "percentage": 47.33, "elapsed_time": "0:47:26", "remaining_time": "0:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 675, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.715506288051709e-05, "epoch": 0.47385047385047385, "percentage": 47.4, "elapsed_time": "0:47:30", "remaining_time": "0:52:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 676, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.7165778265693935e-05, "epoch": 0.47455247455247457, "percentage": 47.47, "elapsed_time": "0:47:34", "remaining_time": "0:52:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 677, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.7176477811419076e-05, "epoch": 0.47525447525447523, "percentage": 47.54, "elapsed_time": "0:47:39", "remaining_time": "0:52:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 678, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.718716156445106e-05, "epoch": 0.47595647595647594, "percentage": 47.61, "elapsed_time": "0:47:43", "remaining_time": "0:52:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 679, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.7197829571341704e-05, "epoch": 0.47665847665847666, "percentage": 47.68, "elapsed_time": "0:47:47", "remaining_time": "0:52:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 680, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.720848187843727e-05, "epoch": 0.4773604773604774, "percentage": 47.75, "elapsed_time": "0:47:51", "remaining_time": "0:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 681, "total_steps": 1424, "loss": 0.0676, "accuracy": 1.0, "learning_rate": 4.721911853187975e-05, "epoch": 0.47806247806247804, "percentage": 47.82, "elapsed_time": "0:47:55", "remaining_time": "0:52:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 682, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.722973957760799e-05, "epoch": 0.47876447876447875, "percentage": 47.89, "elapsed_time": "0:47:59", "remaining_time": "0:52:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 683, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.724034506135888e-05, "epoch": 0.47946647946647947, "percentage": 47.96, "elapsed_time": "0:48:03", "remaining_time": "0:52:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 684, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.725093502866861e-05, "epoch": 0.4801684801684802, "percentage": 48.03, "elapsed_time": "0:48:07", "remaining_time": "0:52:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 685, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.7261509524873764e-05, "epoch": 0.48087048087048084, "percentage": 48.1, "elapsed_time": "0:48:12", "remaining_time": "0:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 686, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.727206859511253e-05, "epoch": 0.48157248157248156, "percentage": 48.17, "elapsed_time": "0:48:16", "remaining_time": "0:51:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 687, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.7282612284325846e-05, "epoch": 0.4822744822744823, "percentage": 48.24, "elapsed_time": "0:48:20", "remaining_time": "0:51:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 688, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.729314063725853e-05, "epoch": 0.482976482976483, "percentage": 48.31, "elapsed_time": "0:48:24", "remaining_time": "0:51:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 689, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.730365369846044e-05, "epoch": 0.4836784836784837, "percentage": 48.38, "elapsed_time": "0:48:28", "remaining_time": "0:51:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 690, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.7314151512287594e-05, "epoch": 0.48438048438048437, "percentage": 48.46, "elapsed_time": "0:48:32", "remaining_time": "0:51:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 691, "total_steps": 1424, "loss": 0.0013, "accuracy": 1.0, "learning_rate": 4.732463412290331e-05, "epoch": 0.4850824850824851, "percentage": 48.53, "elapsed_time": "0:48:37", "remaining_time": "0:51:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 692, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.73351015742793e-05, "epoch": 0.4857844857844858, "percentage": 48.6, "elapsed_time": "0:48:41", "remaining_time": "0:51:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 693, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.7345553910196785e-05, "epoch": 0.4864864864864865, "percentage": 48.67, "elapsed_time": "0:48:45", "remaining_time": "0:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 694, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.735599117424759e-05, "epoch": 0.4871884871884872, "percentage": 48.74, "elapsed_time": "0:48:49", "remaining_time": "0:51:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 695, "total_steps": 1424, "loss": 0.0017, "accuracy": 1.0, "learning_rate": 4.7366413409835235e-05, "epoch": 0.4878904878904879, "percentage": 48.81, "elapsed_time": "0:48:53", "remaining_time": "0:51:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 696, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.737682066017604e-05, "epoch": 0.4885924885924886, "percentage": 48.88, "elapsed_time": "0:48:57", "remaining_time": "0:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 697, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.7387212968300166e-05, "epoch": 0.4892944892944893, "percentage": 48.95, "elapsed_time": "0:49:02", "remaining_time": "0:51:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 698, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.7397590377052686e-05, "epoch": 0.48999648999649, "percentage": 49.02, "elapsed_time": "0:49:06", "remaining_time": "0:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 699, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.74079529290947e-05, "epoch": 0.4906984906984907, "percentage": 49.09, "elapsed_time": "0:49:10", "remaining_time": "0:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.741830066690428e-05, "epoch": 0.4914004914004914, "percentage": 49.16, "elapsed_time": "0:49:14", "remaining_time": "0:50:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 701, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.742863363277765e-05, "epoch": 0.49210249210249213, "percentage": 49.23, "elapsed_time": "0:49:25", "remaining_time": "0:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 702, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.743895186883009e-05, "epoch": 0.4928044928044928, "percentage": 49.3, "elapsed_time": "0:49:29", "remaining_time": "0:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 703, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.7449255416997075e-05, "epoch": 0.4935064935064935, "percentage": 49.37, "elapsed_time": "0:49:33", "remaining_time": "0:50:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 704, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.7459544319035206e-05, "epoch": 0.4942084942084942, "percentage": 49.44, "elapsed_time": "0:49:38", "remaining_time": "0:50:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 705, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.746981861652332e-05, "epoch": 0.49491049491049494, "percentage": 49.51, "elapsed_time": "0:49:42", "remaining_time": "0:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 706, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.74800783508634e-05, "epoch": 0.4956124956124956, "percentage": 49.58, "elapsed_time": "0:49:46", "remaining_time": "0:50:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 707, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.7490323563281665e-05, "epoch": 0.4963144963144963, "percentage": 49.65, "elapsed_time": "0:49:50", "remaining_time": "0:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 708, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.750055429482949e-05, "epoch": 0.497016497016497, "percentage": 49.72, "elapsed_time": "0:49:54", "remaining_time": "0:50:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 709, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.751077058638445e-05, "epoch": 0.49771849771849774, "percentage": 49.79, "elapsed_time": "0:49:58", "remaining_time": "0:50:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 710, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.752097247865126e-05, "epoch": 0.4984204984204984, "percentage": 49.86, "elapsed_time": "0:50:03", "remaining_time": "0:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 711, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.753116001216277e-05, "epoch": 0.4991224991224991, "percentage": 49.93, "elapsed_time": "0:50:07", "remaining_time": "0:50:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 712, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.7541333227280944e-05, "epoch": 0.49982449982449983, "percentage": 50.0, "elapsed_time": "0:50:11", "remaining_time": "0:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 713, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.755149216419776e-05, "epoch": 0.5005265005265005, "percentage": 50.07, "elapsed_time": "0:50:15", "remaining_time": "0:50:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 714, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.756163686293624e-05, "epoch": 0.5012285012285013, "percentage": 50.14, "elapsed_time": "0:50:19", "remaining_time": "0:50:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 715, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.7571767363351344e-05, "epoch": 0.5019305019305019, "percentage": 50.21, "elapsed_time": "0:50:23", "remaining_time": "0:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 716, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.758188370513093e-05, "epoch": 0.5026325026325026, "percentage": 50.28, "elapsed_time": "0:50:28", "remaining_time": "0:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 717, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.759198592779667e-05, "epoch": 0.5033345033345034, "percentage": 50.35, "elapsed_time": "0:50:32", "remaining_time": "0:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 718, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.760207407070501e-05, "epoch": 0.504036504036504, "percentage": 50.42, "elapsed_time": "0:50:36", "remaining_time": "0:49:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 719, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.761214817304805e-05, "epoch": 0.5047385047385048, "percentage": 50.49, "elapsed_time": "0:50:40", "remaining_time": "0:49:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 720, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.762220827385448e-05, "epoch": 0.5054405054405054, "percentage": 50.56, "elapsed_time": "0:50:44", "remaining_time": "0:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 721, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.763225441199049e-05, "epoch": 0.5061425061425061, "percentage": 50.63, "elapsed_time": "0:50:48", "remaining_time": "0:49:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 722, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.7642286626160654e-05, "epoch": 0.5068445068445069, "percentage": 50.7, "elapsed_time": "0:50:53", "remaining_time": "0:49:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 723, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.765230495490885e-05, "epoch": 0.5075465075465075, "percentage": 50.77, "elapsed_time": "0:50:57", "remaining_time": "0:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 724, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.7662309436619115e-05, "epoch": 0.5082485082485082, "percentage": 50.84, "elapsed_time": "0:51:01", "remaining_time": "0:49:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 725, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.7672300109516563e-05, "epoch": 0.508950508950509, "percentage": 50.91, "elapsed_time": "0:51:05", "remaining_time": "0:49:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 726, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.768227701166823e-05, "epoch": 0.5096525096525096, "percentage": 50.98, "elapsed_time": "0:51:09", "remaining_time": "0:49:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 727, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.7692240180983964e-05, "epoch": 0.5103545103545104, "percentage": 51.05, "elapsed_time": "0:51:13", "remaining_time": "0:49:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 728, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.770218965521729e-05, "epoch": 0.5110565110565111, "percentage": 51.12, "elapsed_time": "0:51:18", "remaining_time": "0:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 729, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.7712125471966245e-05, "epoch": 0.5117585117585117, "percentage": 51.19, "elapsed_time": "0:51:22", "remaining_time": "0:48:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 730, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.7722047668674267e-05, "epoch": 0.5124605124605125, "percentage": 51.26, "elapsed_time": "0:51:26", "remaining_time": "0:48:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 731, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.7731956282631004e-05, "epoch": 0.5131625131625132, "percentage": 51.33, "elapsed_time": "0:51:30", "remaining_time": "0:48:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 732, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.77418513509732e-05, "epoch": 0.5138645138645138, "percentage": 51.4, "elapsed_time": "0:51:34", "remaining_time": "0:48:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 733, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.775173291068547e-05, "epoch": 0.5145665145665146, "percentage": 51.47, "elapsed_time": "0:51:38", "remaining_time": "0:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 734, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.776160099860117e-05, "epoch": 0.5152685152685152, "percentage": 51.54, "elapsed_time": "0:51:42", "remaining_time": "0:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 735, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.777145565140325e-05, "epoch": 0.515970515970516, "percentage": 51.62, "elapsed_time": "0:51:47", "remaining_time": "0:48:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 736, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.7781296905624986e-05, "epoch": 0.5166725166725167, "percentage": 51.69, "elapsed_time": "0:51:51", "remaining_time": "0:48:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 737, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.779112479765086e-05, "epoch": 0.5173745173745173, "percentage": 51.76, "elapsed_time": "0:51:55", "remaining_time": "0:48:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 738, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.780093936371736e-05, "epoch": 0.5180765180765181, "percentage": 51.83, "elapsed_time": "0:51:59", "remaining_time": "0:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 739, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.781074063991376e-05, "epoch": 0.5187785187785188, "percentage": 51.9, "elapsed_time": "0:52:03", "remaining_time": "0:48:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 740, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.782052866218294e-05, "epoch": 0.5194805194805194, "percentage": 51.97, "elapsed_time": "0:52:07", "remaining_time": "0:48:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 741, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.783030346632214e-05, "epoch": 0.5201825201825202, "percentage": 52.04, "elapsed_time": "0:52:11", "remaining_time": "0:48:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 742, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.7840065087983786e-05, "epoch": 0.5208845208845209, "percentage": 52.11, "elapsed_time": "0:52:16", "remaining_time": "0:48:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 743, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.784981356267626e-05, "epoch": 0.5215865215865216, "percentage": 52.18, "elapsed_time": "0:52:20", "remaining_time": "0:47:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 744, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.785954892576465e-05, "epoch": 0.5222885222885223, "percentage": 52.25, "elapsed_time": "0:52:24", "remaining_time": "0:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 745, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.7869271212471554e-05, "epoch": 0.522990522990523, "percentage": 52.32, "elapsed_time": "0:52:28", "remaining_time": "0:47:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 746, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.7878980457877814e-05, "epoch": 0.5236925236925237, "percentage": 52.39, "elapsed_time": "0:52:32", "remaining_time": "0:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 747, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.7888676696923315e-05, "epoch": 0.5243945243945244, "percentage": 52.46, "elapsed_time": "0:52:36", "remaining_time": "0:47:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 748, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.7898359964407695e-05, "epoch": 0.525096525096525, "percentage": 52.53, "elapsed_time": "0:52:41", "remaining_time": "0:47:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 749, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.790803029499111e-05, "epoch": 0.5257985257985258, "percentage": 52.6, "elapsed_time": "0:52:45", "remaining_time": "0:47:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.7917687723195004e-05, "epoch": 0.5265005265005265, "percentage": 52.67, "elapsed_time": "0:52:49", "remaining_time": "0:47:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 751, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.792733228340281e-05, "epoch": 0.5272025272025272, "percentage": 52.74, "elapsed_time": "0:52:53", "remaining_time": "0:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 752, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.793696400986071e-05, "epoch": 0.5279045279045279, "percentage": 52.81, "elapsed_time": "0:52:57", "remaining_time": "0:47:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 753, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.7946582936678344e-05, "epoch": 0.5286065286065286, "percentage": 52.88, "elapsed_time": "0:53:01", "remaining_time": "0:47:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 754, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.795618909782957e-05, "epoch": 0.5293085293085293, "percentage": 52.95, "elapsed_time": "0:53:05", "remaining_time": "0:47:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 755, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.796578252715314e-05, "epoch": 0.53001053001053, "percentage": 53.02, "elapsed_time": "0:53:09", "remaining_time": "0:47:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 756, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.797536325835345e-05, "epoch": 0.5307125307125307, "percentage": 53.09, "elapsed_time": "0:53:14", "remaining_time": "0:47:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 757, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.7984931325001216e-05, "epoch": 0.5314145314145314, "percentage": 53.16, "elapsed_time": "0:53:18", "remaining_time": "0:46:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 758, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.799448676053423e-05, "epoch": 0.5321165321165321, "percentage": 53.23, "elapsed_time": "0:53:22", "remaining_time": "0:46:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 759, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.800402959825802e-05, "epoch": 0.5328185328185329, "percentage": 53.3, "elapsed_time": "0:53:26", "remaining_time": "0:46:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 760, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.801355987134653e-05, "epoch": 0.5335205335205335, "percentage": 53.37, "elapsed_time": "0:53:30", "remaining_time": "0:46:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 761, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.802307761284289e-05, "epoch": 0.5342225342225342, "percentage": 53.44, "elapsed_time": "0:53:34", "remaining_time": "0:46:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 762, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.8032582855660014e-05, "epoch": 0.534924534924535, "percentage": 53.51, "elapsed_time": "0:53:38", "remaining_time": "0:46:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 763, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8042075632581346e-05, "epoch": 0.5356265356265356, "percentage": 53.58, "elapsed_time": "0:53:43", "remaining_time": "0:46:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 764, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.80515559762615e-05, "epoch": 0.5363285363285363, "percentage": 53.65, "elapsed_time": "0:53:47", "remaining_time": "0:46:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 765, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.8061023919226964e-05, "epoch": 0.537030537030537, "percentage": 53.72, "elapsed_time": "0:53:51", "remaining_time": "0:46:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 766, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.807047949387674e-05, "epoch": 0.5377325377325377, "percentage": 53.79, "elapsed_time": "0:53:55", "remaining_time": "0:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 767, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.807992273248302e-05, "epoch": 0.5384345384345385, "percentage": 53.86, "elapsed_time": "0:53:59", "remaining_time": "0:46:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 768, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.808935366719187e-05, "epoch": 0.5391365391365391, "percentage": 53.93, "elapsed_time": "0:54:03", "remaining_time": "0:46:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 769, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8098772330023855e-05, "epoch": 0.5398385398385398, "percentage": 54.0, "elapsed_time": "0:54:07", "remaining_time": "0:46:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.81081787528747e-05, "epoch": 0.5405405405405406, "percentage": 54.07, "elapsed_time": "0:54:12", "remaining_time": "0:46:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 771, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.811757296751595e-05, "epoch": 0.5412425412425412, "percentage": 54.14, "elapsed_time": "0:54:16", "remaining_time": "0:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 772, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.812695500559561e-05, "epoch": 0.5419445419445419, "percentage": 54.21, "elapsed_time": "0:54:20", "remaining_time": "0:45:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 773, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8136324898638756e-05, "epoch": 0.5426465426465427, "percentage": 54.28, "elapsed_time": "0:54:24", "remaining_time": "0:45:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 774, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8145682678048214e-05, "epoch": 0.5433485433485433, "percentage": 54.35, "elapsed_time": "0:54:28", "remaining_time": "0:45:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 775, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.815502837510518e-05, "epoch": 0.5440505440505441, "percentage": 54.42, "elapsed_time": "0:54:32", "remaining_time": "0:45:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 776, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.816436202096981e-05, "epoch": 0.5447525447525448, "percentage": 54.49, "elapsed_time": "0:54:37", "remaining_time": "0:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 777, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.81736836466819e-05, "epoch": 0.5454545454545454, "percentage": 54.56, "elapsed_time": "0:54:41", "remaining_time": "0:45:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 778, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8182993283161485e-05, "epoch": 0.5461565461565462, "percentage": 54.63, "elapsed_time": "0:54:45", "remaining_time": "0:45:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 779, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.819229096120941e-05, "epoch": 0.5468585468585468, "percentage": 54.71, "elapsed_time": "0:54:49", "remaining_time": "0:45:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 780, "total_steps": 1424, "loss": 0.0791, "accuracy": 0.875, "learning_rate": 4.820157671150801e-05, "epoch": 0.5475605475605475, "percentage": 54.78, "elapsed_time": "0:54:53", "remaining_time": "0:45:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 781, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.821085056462168e-05, "epoch": 0.5482625482625483, "percentage": 54.85, "elapsed_time": "0:54:57", "remaining_time": "0:45:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 782, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.822011255099747e-05, "epoch": 0.5489645489645489, "percentage": 54.92, "elapsed_time": "0:55:01", "remaining_time": "0:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 783, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8229362700965726e-05, "epoch": 0.5496665496665497, "percentage": 54.99, "elapsed_time": "0:55:06", "remaining_time": "0:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 784, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8238601044740645e-05, "epoch": 0.5503685503685504, "percentage": 55.06, "elapsed_time": "0:55:10", "remaining_time": "0:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 785, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.824782761242088e-05, "epoch": 0.551070551070551, "percentage": 55.13, "elapsed_time": "0:55:14", "remaining_time": "0:44:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 786, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8257042433990135e-05, "epoch": 0.5517725517725518, "percentage": 55.2, "elapsed_time": "0:55:18", "remaining_time": "0:44:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 787, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.826624553931775e-05, "epoch": 0.5524745524745525, "percentage": 55.27, "elapsed_time": "0:55:22", "remaining_time": "0:44:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 788, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.827543695815926e-05, "epoch": 0.5531765531765532, "percentage": 55.34, "elapsed_time": "0:55:26", "remaining_time": "0:44:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 789, "total_steps": 1424, "loss": 0.001, "accuracy": 1.0, "learning_rate": 4.8284616720157006e-05, "epoch": 0.5538785538785539, "percentage": 55.41, "elapsed_time": "0:55:31", "remaining_time": "0:44:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 790, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.82937848548407e-05, "epoch": 0.5545805545805546, "percentage": 55.48, "elapsed_time": "0:55:35", "remaining_time": "0:44:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 791, "total_steps": 1424, "loss": 0.0007, "accuracy": 1.0, "learning_rate": 4.8302941391627947e-05, "epoch": 0.5552825552825553, "percentage": 55.55, "elapsed_time": "0:55:39", "remaining_time": "0:44:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 792, "total_steps": 1424, "loss": 0.0007, "accuracy": 1.0, "learning_rate": 4.83120863598249e-05, "epoch": 0.555984555984556, "percentage": 55.62, "elapsed_time": "0:55:43", "remaining_time": "0:44:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 793, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.832121978862673e-05, "epoch": 0.5566865566865566, "percentage": 55.69, "elapsed_time": "0:55:47", "remaining_time": "0:44:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 794, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8330341707118276e-05, "epoch": 0.5573885573885574, "percentage": 55.76, "elapsed_time": "0:55:51", "remaining_time": "0:44:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 795, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.833945214427451e-05, "epoch": 0.5580905580905581, "percentage": 55.83, "elapsed_time": "0:55:55", "remaining_time": "0:44:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 796, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.834855112896116e-05, "epoch": 0.5587925587925588, "percentage": 55.9, "elapsed_time": "0:55:59", "remaining_time": "0:44:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 797, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.835763868993521e-05, "epoch": 0.5594945594945595, "percentage": 55.97, "elapsed_time": "0:56:04", "remaining_time": "0:44:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 798, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.8366714855845496e-05, "epoch": 0.5601965601965602, "percentage": 56.04, "elapsed_time": "0:56:08", "remaining_time": "0:44:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 799, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.837577965523319e-05, "epoch": 0.5608985608985609, "percentage": 56.11, "elapsed_time": "0:56:12", "remaining_time": "0:43:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8384833116532396e-05, "epoch": 0.5616005616005616, "percentage": 56.18, "elapsed_time": "0:56:16", "remaining_time": "0:43:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 801, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8393875268070636e-05, "epoch": 0.5623025623025623, "percentage": 56.25, "elapsed_time": "0:56:27", "remaining_time": "0:43:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 802, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.84029061380694e-05, "epoch": 0.563004563004563, "percentage": 56.32, "elapsed_time": "0:56:32", "remaining_time": "0:43:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 803, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.841192575464469e-05, "epoch": 0.5637065637065637, "percentage": 56.39, "elapsed_time": "0:56:36", "remaining_time": "0:43:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 804, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.842093414580753e-05, "epoch": 0.5644085644085645, "percentage": 56.46, "elapsed_time": "0:56:40", "remaining_time": "0:43:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 805, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.842993133946448e-05, "epoch": 0.5651105651105651, "percentage": 56.53, "elapsed_time": "0:56:44", "remaining_time": "0:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 806, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.843891736341818e-05, "epoch": 0.5658125658125658, "percentage": 56.6, "elapsed_time": "0:56:48", "remaining_time": "0:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 807, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8447892245367846e-05, "epoch": 0.5665145665145666, "percentage": 56.67, "elapsed_time": "0:56:52", "remaining_time": "0:43:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 808, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.845685601290977e-05, "epoch": 0.5672165672165672, "percentage": 56.74, "elapsed_time": "0:56:56", "remaining_time": "0:43:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 809, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.846580869353787e-05, "epoch": 0.5679185679185679, "percentage": 56.81, "elapsed_time": "0:57:01", "remaining_time": "0:43:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 810, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.847475031464416e-05, "epoch": 0.5686205686205686, "percentage": 56.88, "elapsed_time": "0:57:05", "remaining_time": "0:43:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 811, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8483680903519274e-05, "epoch": 0.5693225693225693, "percentage": 56.95, "elapsed_time": "0:57:09", "remaining_time": "0:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 812, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8492600487352926e-05, "epoch": 0.5700245700245701, "percentage": 57.02, "elapsed_time": "0:57:13", "remaining_time": "0:43:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 813, "total_steps": 1424, "loss": 0.0053, "accuracy": 1.0, "learning_rate": 4.850150909323447e-05, "epoch": 0.5707265707265707, "percentage": 57.09, "elapsed_time": "0:57:17", "remaining_time": "0:43:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 814, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8510406748153355e-05, "epoch": 0.5714285714285714, "percentage": 57.16, "elapsed_time": "0:57:21", "remaining_time": "0:42:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 815, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8519293478999614e-05, "epoch": 0.5721305721305722, "percentage": 57.23, "elapsed_time": "0:57:25", "remaining_time": "0:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 816, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8528169312564355e-05, "epoch": 0.5728325728325728, "percentage": 57.3, "elapsed_time": "0:57:30", "remaining_time": "0:42:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 817, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8537034275540264e-05, "epoch": 0.5735345735345735, "percentage": 57.37, "elapsed_time": "0:57:34", "remaining_time": "0:42:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 818, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.854588839452205e-05, "epoch": 0.5742365742365743, "percentage": 57.44, "elapsed_time": "0:57:38", "remaining_time": "0:42:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 819, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.855473169600698e-05, "epoch": 0.5749385749385749, "percentage": 57.51, "elapsed_time": "0:57:42", "remaining_time": "0:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 820, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.856356420639528e-05, "epoch": 0.5756405756405757, "percentage": 57.58, "elapsed_time": "0:57:46", "remaining_time": "0:42:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 821, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.857238595199068e-05, "epoch": 0.5763425763425764, "percentage": 57.65, "elapsed_time": "0:57:50", "remaining_time": "0:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 822, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.858119695900084e-05, "epoch": 0.577044577044577, "percentage": 57.72, "elapsed_time": "0:57:54", "remaining_time": "0:42:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 823, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.858999725353783e-05, "epoch": 0.5777465777465778, "percentage": 57.79, "elapsed_time": "0:57:59", "remaining_time": "0:42:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 824, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8598786861618605e-05, "epoch": 0.5784485784485784, "percentage": 57.87, "elapsed_time": "0:58:03", "remaining_time": "0:42:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 825, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.860756580916542e-05, "epoch": 0.5791505791505791, "percentage": 57.94, "elapsed_time": "0:58:07", "remaining_time": "0:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 826, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.861633412200637e-05, "epoch": 0.5798525798525799, "percentage": 58.01, "elapsed_time": "0:58:11", "remaining_time": "0:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 827, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.862509182587578e-05, "epoch": 0.5805545805545805, "percentage": 58.08, "elapsed_time": "0:58:15", "remaining_time": "0:42:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 828, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.863383894641467e-05, "epoch": 0.5812565812565813, "percentage": 58.15, "elapsed_time": "0:58:19", "remaining_time": "0:41:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 829, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.864257550917123e-05, "epoch": 0.581958581958582, "percentage": 58.22, "elapsed_time": "0:58:23", "remaining_time": "0:41:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 830, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.865130153960124e-05, "epoch": 0.5826605826605826, "percentage": 58.29, "elapsed_time": "0:58:28", "remaining_time": "0:41:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 831, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8660017063068526e-05, "epoch": 0.5833625833625834, "percentage": 58.36, "elapsed_time": "0:58:32", "remaining_time": "0:41:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 832, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8668722104845403e-05, "epoch": 0.5840645840645841, "percentage": 58.43, "elapsed_time": "0:58:36", "remaining_time": "0:41:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 833, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8677416690113134e-05, "epoch": 0.5847665847665847, "percentage": 58.5, "elapsed_time": "0:58:40", "remaining_time": "0:41:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 834, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.868610084396232e-05, "epoch": 0.5854685854685855, "percentage": 58.57, "elapsed_time": "0:58:44", "remaining_time": "0:41:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 835, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.869477459139337e-05, "epoch": 0.5861705861705861, "percentage": 58.64, "elapsed_time": "0:58:48", "remaining_time": "0:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 836, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.870343795731694e-05, "epoch": 0.5868725868725869, "percentage": 58.71, "elapsed_time": "0:58:52", "remaining_time": "0:41:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 837, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.8712090966554334e-05, "epoch": 0.5875745875745876, "percentage": 58.78, "elapsed_time": "0:58:56", "remaining_time": "0:41:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 838, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.872073364383795e-05, "epoch": 0.5882765882765882, "percentage": 58.85, "elapsed_time": "0:59:01", "remaining_time": "0:41:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 839, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8729366013811674e-05, "epoch": 0.588978588978589, "percentage": 58.92, "elapsed_time": "0:59:05", "remaining_time": "0:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8737988101031366e-05, "epoch": 0.5896805896805897, "percentage": 58.99, "elapsed_time": "0:59:09", "remaining_time": "0:41:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 841, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.874659992996521e-05, "epoch": 0.5903825903825903, "percentage": 59.06, "elapsed_time": "0:59:13", "remaining_time": "0:41:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 842, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.875520152499416e-05, "epoch": 0.5910845910845911, "percentage": 59.13, "elapsed_time": "0:59:17", "remaining_time": "0:40:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 843, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.876379291041238e-05, "epoch": 0.5917865917865918, "percentage": 59.2, "elapsed_time": "0:59:21", "remaining_time": "0:40:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 844, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8772374110427594e-05, "epoch": 0.5924885924885925, "percentage": 59.27, "elapsed_time": "0:59:26", "remaining_time": "0:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 845, "total_steps": 1424, "loss": 0.0345, "accuracy": 1.0, "learning_rate": 4.878094514916154e-05, "epoch": 0.5931905931905932, "percentage": 59.34, "elapsed_time": "0:59:30", "remaining_time": "0:40:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 846, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8789506050650396e-05, "epoch": 0.5938925938925939, "percentage": 59.41, "elapsed_time": "0:59:34", "remaining_time": "0:40:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 847, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.879805683884512e-05, "epoch": 0.5945945945945946, "percentage": 59.48, "elapsed_time": "0:59:38", "remaining_time": "0:40:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 848, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8806597537611906e-05, "epoch": 0.5952965952965953, "percentage": 59.55, "elapsed_time": "0:59:42", "remaining_time": "0:40:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 849, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.881512817073255e-05, "epoch": 0.595998595998596, "percentage": 59.62, "elapsed_time": "0:59:47", "remaining_time": "0:40:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.882364876190489e-05, "epoch": 0.5967005967005967, "percentage": 59.69, "elapsed_time": "0:59:51", "remaining_time": "0:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 851, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8832159334743136e-05, "epoch": 0.5974025974025974, "percentage": 59.76, "elapsed_time": "0:59:55", "remaining_time": "0:40:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 852, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.884065991277833e-05, "epoch": 0.5981045981045982, "percentage": 59.83, "elapsed_time": "0:59:59", "remaining_time": "0:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 853, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8849150519458726e-05, "epoch": 0.5988065988065988, "percentage": 59.9, "elapsed_time": "1:00:03", "remaining_time": "0:40:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 854, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.885763117815009e-05, "epoch": 0.5995085995085995, "percentage": 59.97, "elapsed_time": "1:00:08", "remaining_time": "0:40:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 855, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.886610191213622e-05, "epoch": 0.6002106002106002, "percentage": 60.04, "elapsed_time": "1:00:12", "remaining_time": "0:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 856, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.887456274461922e-05, "epoch": 0.6009126009126009, "percentage": 60.11, "elapsed_time": "1:00:16", "remaining_time": "0:39:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 857, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8883013698719973e-05, "epoch": 0.6016146016146016, "percentage": 60.18, "elapsed_time": "1:00:20", "remaining_time": "0:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 858, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.889145479747843e-05, "epoch": 0.6023166023166023, "percentage": 60.25, "elapsed_time": "1:00:24", "remaining_time": "0:39:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 859, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.889988606385404e-05, "epoch": 0.603018603018603, "percentage": 60.32, "elapsed_time": "1:00:28", "remaining_time": "0:39:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 860, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8908307520726135e-05, "epoch": 0.6037206037206038, "percentage": 60.39, "elapsed_time": "1:00:33", "remaining_time": "0:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 861, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.891671919089425e-05, "epoch": 0.6044226044226044, "percentage": 60.46, "elapsed_time": "1:00:37", "remaining_time": "0:39:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 862, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.892512109707855e-05, "epoch": 0.6051246051246051, "percentage": 60.53, "elapsed_time": "1:00:41", "remaining_time": "0:39:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 863, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.893351326192016e-05, "epoch": 0.6058266058266059, "percentage": 60.6, "elapsed_time": "1:00:45", "remaining_time": "0:39:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 864, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.894189570798156e-05, "epoch": 0.6065286065286065, "percentage": 60.67, "elapsed_time": "1:00:49", "remaining_time": "0:39:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 865, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.895026845774691e-05, "epoch": 0.6072306072306072, "percentage": 60.74, "elapsed_time": "1:00:53", "remaining_time": "0:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 866, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.895863153362244e-05, "epoch": 0.607932607932608, "percentage": 60.81, "elapsed_time": "1:00:57", "remaining_time": "0:39:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 867, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.896698495793684e-05, "epoch": 0.6086346086346086, "percentage": 60.88, "elapsed_time": "1:01:01", "remaining_time": "0:39:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 868, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.897532875294154e-05, "epoch": 0.6093366093366094, "percentage": 60.96, "elapsed_time": "1:01:06", "remaining_time": "0:39:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 869, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8983662940811115e-05, "epoch": 0.61003861003861, "percentage": 61.03, "elapsed_time": "1:01:10", "remaining_time": "0:39:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 870, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.899198754364365e-05, "epoch": 0.6107406107406107, "percentage": 61.1, "elapsed_time": "1:01:14", "remaining_time": "0:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 871, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.900030258346106e-05, "epoch": 0.6114426114426115, "percentage": 61.17, "elapsed_time": "1:01:18", "remaining_time": "0:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 872, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.900860808220946e-05, "epoch": 0.6121446121446121, "percentage": 61.24, "elapsed_time": "1:01:22", "remaining_time": "0:38:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 873, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.90169040617595e-05, "epoch": 0.6128466128466128, "percentage": 61.31, "elapsed_time": "1:01:26", "remaining_time": "0:38:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 874, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.9025190543906715e-05, "epoch": 0.6135486135486136, "percentage": 61.38, "elapsed_time": "1:01:31", "remaining_time": "0:38:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 875, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.903346755037189e-05, "epoch": 0.6142506142506142, "percentage": 61.45, "elapsed_time": "1:01:35", "remaining_time": "0:38:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 876, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.904173510280135e-05, "epoch": 0.614952614952615, "percentage": 61.52, "elapsed_time": "1:01:39", "remaining_time": "0:38:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 877, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.904999322276735e-05, "epoch": 0.6156546156546157, "percentage": 61.59, "elapsed_time": "1:01:43", "remaining_time": "0:38:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 878, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.9058241931768385e-05, "epoch": 0.6163566163566163, "percentage": 61.66, "elapsed_time": "1:01:47", "remaining_time": "0:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 879, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.9066481251229535e-05, "epoch": 0.6170586170586171, "percentage": 61.73, "elapsed_time": "1:01:51", "remaining_time": "0:38:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 880, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.907471120250281e-05, "epoch": 0.6177606177606177, "percentage": 61.8, "elapsed_time": "1:01:56", "remaining_time": "0:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 881, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.9082931806867474e-05, "epoch": 0.6184626184626184, "percentage": 61.87, "elapsed_time": "1:02:00", "remaining_time": "0:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 882, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.909114308553033e-05, "epoch": 0.6191646191646192, "percentage": 61.94, "elapsed_time": "1:02:04", "remaining_time": "0:38:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 883, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.909934505962615e-05, "epoch": 0.6198666198666198, "percentage": 62.01, "elapsed_time": "1:02:08", "remaining_time": "0:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 884, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.9107537750217886e-05, "epoch": 0.6205686205686206, "percentage": 62.08, "elapsed_time": "1:02:12", "remaining_time": "0:38:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 885, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.9115721178297093e-05, "epoch": 0.6212706212706213, "percentage": 62.15, "elapsed_time": "1:02:16", "remaining_time": "0:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 886, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.9123895364784184e-05, "epoch": 0.6219726219726219, "percentage": 62.22, "elapsed_time": "1:02:20", "remaining_time": "0:37:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 887, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.913206033052877e-05, "epoch": 0.6226746226746227, "percentage": 62.29, "elapsed_time": "1:02:25", "remaining_time": "0:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 888, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.914021609631002e-05, "epoch": 0.6233766233766234, "percentage": 62.36, "elapsed_time": "1:02:29", "remaining_time": "0:37:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 889, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.91483626828369e-05, "epoch": 0.6240786240786241, "percentage": 62.43, "elapsed_time": "1:02:33", "remaining_time": "0:37:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 890, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.915650011074855e-05, "epoch": 0.6247806247806248, "percentage": 62.5, "elapsed_time": "1:02:37", "remaining_time": "0:37:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 891, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.916462840061458e-05, "epoch": 0.6254826254826255, "percentage": 62.57, "elapsed_time": "1:02:41", "remaining_time": "0:37:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 892, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.917274757293539e-05, "epoch": 0.6261846261846262, "percentage": 62.64, "elapsed_time": "1:02:45", "remaining_time": "0:37:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 893, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.918085764814244e-05, "epoch": 0.6268866268866269, "percentage": 62.71, "elapsed_time": "1:02:50", "remaining_time": "0:37:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 894, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.9188958646598624e-05, "epoch": 0.6275886275886275, "percentage": 62.78, "elapsed_time": "1:02:54", "remaining_time": "0:37:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 895, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.919705058859854e-05, "epoch": 0.6282906282906283, "percentage": 62.85, "elapsed_time": "1:02:58", "remaining_time": "0:37:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 896, "total_steps": 1424, "loss": 0.048, "accuracy": 1.0, "learning_rate": 4.920513349436875e-05, "epoch": 0.628992628992629, "percentage": 62.92, "elapsed_time": "1:03:02", "remaining_time": "0:37:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 897, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.92132073840682e-05, "epoch": 0.6296946296946297, "percentage": 62.99, "elapsed_time": "1:03:06", "remaining_time": "0:37:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 898, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.922127227778841e-05, "epoch": 0.6303966303966304, "percentage": 63.06, "elapsed_time": "1:03:10", "remaining_time": "0:37:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 899, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.9229328195553815e-05, "epoch": 0.6310986310986311, "percentage": 63.13, "elapsed_time": "1:03:15", "remaining_time": "0:36:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.923737515732209e-05, "epoch": 0.6318006318006318, "percentage": 63.2, "elapsed_time": "1:03:19", "remaining_time": "0:36:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 901, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.924541318298438e-05, "epoch": 0.6325026325026325, "percentage": 63.27, "elapsed_time": "1:03:30", "remaining_time": "0:36:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 902, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.92534422923657e-05, "epoch": 0.6332046332046332, "percentage": 63.34, "elapsed_time": "1:03:34", "remaining_time": "0:36:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 903, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.9261462505225106e-05, "epoch": 0.6339066339066339, "percentage": 63.41, "elapsed_time": "1:03:38", "remaining_time": "0:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 904, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.926947384125606e-05, "epoch": 0.6346086346086346, "percentage": 63.48, "elapsed_time": "1:03:42", "remaining_time": "0:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 905, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.927747632008672e-05, "epoch": 0.6353106353106354, "percentage": 63.55, "elapsed_time": "1:03:46", "remaining_time": "0:36:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 906, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.9285469961280226e-05, "epoch": 0.636012636012636, "percentage": 63.62, "elapsed_time": "1:03:51", "remaining_time": "0:36:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 907, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.9293454784334924e-05, "epoch": 0.6367146367146367, "percentage": 63.69, "elapsed_time": "1:03:55", "remaining_time": "0:36:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 908, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.9301430808684754e-05, "epoch": 0.6374166374166375, "percentage": 63.76, "elapsed_time": "1:03:59", "remaining_time": "0:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 909, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.930939805369946e-05, "epoch": 0.6381186381186381, "percentage": 63.83, "elapsed_time": "1:04:03", "remaining_time": "0:36:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.93173565386849e-05, "epoch": 0.6388206388206388, "percentage": 63.9, "elapsed_time": "1:04:07", "remaining_time": "0:36:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 911, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.932530628288331e-05, "epoch": 0.6395226395226395, "percentage": 63.97, "elapsed_time": "1:04:12", "remaining_time": "0:36:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 912, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.933324730547361e-05, "epoch": 0.6402246402246402, "percentage": 64.04, "elapsed_time": "1:04:16", "remaining_time": "0:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 913, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.934117962557165e-05, "epoch": 0.640926640926641, "percentage": 64.12, "elapsed_time": "1:04:20", "remaining_time": "0:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 914, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.9349103262230524e-05, "epoch": 0.6416286416286416, "percentage": 64.19, "elapsed_time": "1:04:24", "remaining_time": "0:35:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 915, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.935701823444081e-05, "epoch": 0.6423306423306423, "percentage": 64.26, "elapsed_time": "1:04:28", "remaining_time": "0:35:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 916, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.9364924561130845e-05, "epoch": 0.6430326430326431, "percentage": 64.33, "elapsed_time": "1:04:32", "remaining_time": "0:35:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 917, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.937282226116702e-05, "epoch": 0.6437346437346437, "percentage": 64.4, "elapsed_time": "1:04:36", "remaining_time": "0:35:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 918, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.938071135335405e-05, "epoch": 0.6444366444366444, "percentage": 64.47, "elapsed_time": "1:04:41", "remaining_time": "0:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 919, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.938859185643519e-05, "epoch": 0.6451386451386452, "percentage": 64.54, "elapsed_time": "1:04:45", "remaining_time": "0:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 920, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.939646378909259e-05, "epoch": 0.6458406458406458, "percentage": 64.61, "elapsed_time": "1:04:49", "remaining_time": "0:35:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 921, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.940432716994748e-05, "epoch": 0.6465426465426466, "percentage": 64.68, "elapsed_time": "1:04:53", "remaining_time": "0:35:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 922, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.9412182017560496e-05, "epoch": 0.6472446472446473, "percentage": 64.75, "elapsed_time": "1:04:57", "remaining_time": "0:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 923, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.942002835043187e-05, "epoch": 0.6479466479466479, "percentage": 64.82, "elapsed_time": "1:05:01", "remaining_time": "0:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 924, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.942786618700178e-05, "epoch": 0.6486486486486487, "percentage": 64.89, "elapsed_time": "1:05:05", "remaining_time": "0:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 925, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.9435695545650545e-05, "epoch": 0.6493506493506493, "percentage": 64.96, "elapsed_time": "1:05:10", "remaining_time": "0:35:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 926, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.944351644469891e-05, "epoch": 0.65005265005265, "percentage": 65.03, "elapsed_time": "1:05:14", "remaining_time": "0:35:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 927, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.945132890240829e-05, "epoch": 0.6507546507546508, "percentage": 65.1, "elapsed_time": "1:05:18", "remaining_time": "0:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 928, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.945913293698104e-05, "epoch": 0.6514566514566514, "percentage": 65.17, "elapsed_time": "1:05:22", "remaining_time": "0:34:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 929, "total_steps": 1424, "loss": 0.0011, "accuracy": 1.0, "learning_rate": 4.9466928566560696e-05, "epoch": 0.6521586521586522, "percentage": 65.24, "elapsed_time": "1:05:26", "remaining_time": "0:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 930, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.9474715809232256e-05, "epoch": 0.6528606528606529, "percentage": 65.31, "elapsed_time": "1:05:30", "remaining_time": "0:34:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 931, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.948249468302239e-05, "epoch": 0.6535626535626535, "percentage": 65.38, "elapsed_time": "1:05:34", "remaining_time": "0:34:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 932, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.9490265205899697e-05, "epoch": 0.6542646542646543, "percentage": 65.45, "elapsed_time": "1:05:38", "remaining_time": "0:34:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 933, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.9498027395775006e-05, "epoch": 0.654966654966655, "percentage": 65.52, "elapsed_time": "1:05:43", "remaining_time": "0:34:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 934, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.950578127050156e-05, "epoch": 0.6556686556686556, "percentage": 65.59, "elapsed_time": "1:05:47", "remaining_time": "0:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 935, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.95135268478753e-05, "epoch": 0.6563706563706564, "percentage": 65.66, "elapsed_time": "1:05:51", "remaining_time": "0:34:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 936, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.952126414563509e-05, "epoch": 0.657072657072657, "percentage": 65.73, "elapsed_time": "1:05:55", "remaining_time": "0:34:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 937, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.952899318146297e-05, "epoch": 0.6577746577746578, "percentage": 65.8, "elapsed_time": "1:05:59", "remaining_time": "0:34:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 938, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.9536713972984414e-05, "epoch": 0.6584766584766585, "percentage": 65.87, "elapsed_time": "1:06:03", "remaining_time": "0:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 939, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.954442653776852e-05, "epoch": 0.6591786591786591, "percentage": 65.94, "elapsed_time": "1:06:07", "remaining_time": "0:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 940, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.955213089332832e-05, "epoch": 0.6598806598806599, "percentage": 66.01, "elapsed_time": "1:06:12", "remaining_time": "0:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 941, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.955982705712095e-05, "epoch": 0.6605826605826606, "percentage": 66.08, "elapsed_time": "1:06:16", "remaining_time": "0:34:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 942, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.956751504654796e-05, "epoch": 0.6612846612846612, "percentage": 66.15, "elapsed_time": "1:06:20", "remaining_time": "0:33:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 943, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.957519487895548e-05, "epoch": 0.661986661986662, "percentage": 66.22, "elapsed_time": "1:06:24", "remaining_time": "0:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 944, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.9582866571634485e-05, "epoch": 0.6626886626886627, "percentage": 66.29, "elapsed_time": "1:06:28", "remaining_time": "0:33:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 945, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.959053014182106e-05, "epoch": 0.6633906633906634, "percentage": 66.36, "elapsed_time": "1:06:32", "remaining_time": "0:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 946, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.959818560669655e-05, "epoch": 0.6640926640926641, "percentage": 66.43, "elapsed_time": "1:06:36", "remaining_time": "0:33:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 947, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.96058329833879e-05, "epoch": 0.6647946647946648, "percentage": 66.5, "elapsed_time": "1:06:41", "remaining_time": "0:33:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 948, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.961347228896777e-05, "epoch": 0.6654966654966655, "percentage": 66.57, "elapsed_time": "1:06:45", "remaining_time": "0:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 949, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.962110354045488e-05, "epoch": 0.6661986661986662, "percentage": 66.64, "elapsed_time": "1:06:49", "remaining_time": "0:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.962872675481414e-05, "epoch": 0.6669006669006668, "percentage": 66.71, "elapsed_time": "1:06:53", "remaining_time": "0:33:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 951, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.9636341948956906e-05, "epoch": 0.6676026676026676, "percentage": 66.78, "elapsed_time": "1:06:57", "remaining_time": "0:33:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 952, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.964394913974124e-05, "epoch": 0.6683046683046683, "percentage": 66.85, "elapsed_time": "1:07:01", "remaining_time": "0:33:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 953, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.965154834397211e-05, "epoch": 0.669006669006669, "percentage": 66.92, "elapsed_time": "1:07:05", "remaining_time": "0:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 954, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.965913957840159e-05, "epoch": 0.6697086697086697, "percentage": 66.99, "elapsed_time": "1:07:10", "remaining_time": "0:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 955, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.966672285972911e-05, "epoch": 0.6704106704106704, "percentage": 67.06, "elapsed_time": "1:07:14", "remaining_time": "0:33:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 956, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.967429820460167e-05, "epoch": 0.6711126711126711, "percentage": 67.13, "elapsed_time": "1:07:18", "remaining_time": "0:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 957, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.9681865629614064e-05, "epoch": 0.6718146718146718, "percentage": 67.21, "elapsed_time": "1:07:22", "remaining_time": "0:32:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 958, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.9689425151309074e-05, "epoch": 0.6725166725166725, "percentage": 67.28, "elapsed_time": "1:07:26", "remaining_time": "0:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 959, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.969697678617773e-05, "epoch": 0.6732186732186732, "percentage": 67.35, "elapsed_time": "1:07:30", "remaining_time": "0:32:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 960, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.970452055065948e-05, "epoch": 0.6739206739206739, "percentage": 67.42, "elapsed_time": "1:07:34", "remaining_time": "0:32:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 961, "total_steps": 1424, "loss": 0.044, "accuracy": 1.0, "learning_rate": 4.9712056461142423e-05, "epoch": 0.6746226746226747, "percentage": 67.49, "elapsed_time": "1:07:39", "remaining_time": "0:32:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 962, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.971958453396355e-05, "epoch": 0.6753246753246753, "percentage": 67.56, "elapsed_time": "1:07:43", "remaining_time": "0:32:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 963, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.972710478540891e-05, "epoch": 0.676026676026676, "percentage": 67.63, "elapsed_time": "1:07:47", "remaining_time": "0:32:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 964, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.973461723171385e-05, "epoch": 0.6767286767286768, "percentage": 67.7, "elapsed_time": "1:07:51", "remaining_time": "0:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 965, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.9742121889063213e-05, "epoch": 0.6774306774306774, "percentage": 67.77, "elapsed_time": "1:07:55", "remaining_time": "0:32:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 966, "total_steps": 1424, "loss": 0.0034, "accuracy": 1.0, "learning_rate": 4.974961877359156e-05, "epoch": 0.6781326781326781, "percentage": 67.84, "elapsed_time": "1:07:59", "remaining_time": "0:32:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 967, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.975710790138336e-05, "epoch": 0.6788346788346789, "percentage": 67.91, "elapsed_time": "1:08:03", "remaining_time": "0:32:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 968, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.976458928847323e-05, "epoch": 0.6795366795366795, "percentage": 67.98, "elapsed_time": "1:08:07", "remaining_time": "0:32:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 969, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.977206295084609e-05, "epoch": 0.6802386802386803, "percentage": 68.05, "elapsed_time": "1:08:12", "remaining_time": "0:32:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 970, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.9779528904437424e-05, "epoch": 0.6809406809406809, "percentage": 68.12, "elapsed_time": "1:08:16", "remaining_time": "0:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 971, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.978698716513342e-05, "epoch": 0.6816426816426816, "percentage": 68.19, "elapsed_time": "1:08:20", "remaining_time": "0:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 972, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.9794437748771244e-05, "epoch": 0.6823446823446824, "percentage": 68.26, "elapsed_time": "1:08:24", "remaining_time": "0:31:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 973, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.9801880671139204e-05, "epoch": 0.683046683046683, "percentage": 68.33, "elapsed_time": "1:08:28", "remaining_time": "0:31:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 974, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.980931594797693e-05, "epoch": 0.6837486837486837, "percentage": 68.4, "elapsed_time": "1:08:32", "remaining_time": "0:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 975, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.981674359497562e-05, "epoch": 0.6844506844506845, "percentage": 68.47, "elapsed_time": "1:08:36", "remaining_time": "0:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 976, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.98241636277782e-05, "epoch": 0.6851526851526851, "percentage": 68.54, "elapsed_time": "1:08:41", "remaining_time": "0:31:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 977, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.983157606197955e-05, "epoch": 0.6858546858546859, "percentage": 68.61, "elapsed_time": "1:08:45", "remaining_time": "0:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 978, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.98389809131267e-05, "epoch": 0.6865566865566866, "percentage": 68.68, "elapsed_time": "1:08:49", "remaining_time": "0:31:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 979, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.984637819671897e-05, "epoch": 0.6872586872586872, "percentage": 68.75, "elapsed_time": "1:08:53", "remaining_time": "0:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.985376792820825e-05, "epoch": 0.687960687960688, "percentage": 68.82, "elapsed_time": "1:08:57", "remaining_time": "0:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 981, "total_steps": 1424, "loss": 0.0311, "accuracy": 0.875, "learning_rate": 4.986115012299915e-05, "epoch": 0.6886626886626886, "percentage": 68.89, "elapsed_time": "1:09:01", "remaining_time": "0:31:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 982, "total_steps": 1424, "loss": 0.0014, "accuracy": 1.0, "learning_rate": 4.986852479644916e-05, "epoch": 0.6893646893646893, "percentage": 68.96, "elapsed_time": "1:09:05", "remaining_time": "0:31:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 983, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.987589196386893e-05, "epoch": 0.6900666900666901, "percentage": 69.03, "elapsed_time": "1:09:10", "remaining_time": "0:31:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 984, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.988325164052236e-05, "epoch": 0.6907686907686907, "percentage": 69.1, "elapsed_time": "1:09:14", "remaining_time": "0:30:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 985, "total_steps": 1424, "loss": 0.0118, "accuracy": 1.0, "learning_rate": 4.9890603841626866e-05, "epoch": 0.6914706914706915, "percentage": 69.17, "elapsed_time": "1:09:18", "remaining_time": "0:30:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 986, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.989794858235352e-05, "epoch": 0.6921726921726922, "percentage": 69.24, "elapsed_time": "1:09:24", "remaining_time": "0:30:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 987, "total_steps": 1424, "loss": 0.0017, "accuracy": 1.0, "learning_rate": 4.990528587782729e-05, "epoch": 0.6928746928746928, "percentage": 69.31, "elapsed_time": "1:09:28", "remaining_time": "0:30:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 988, "total_steps": 1424, "loss": 0.0014, "accuracy": 1.0, "learning_rate": 4.9912615743127146e-05, "epoch": 0.6935766935766936, "percentage": 69.38, "elapsed_time": "1:09:32", "remaining_time": "0:30:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 989, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.991993819328633e-05, "epoch": 0.6942786942786943, "percentage": 69.45, "elapsed_time": "1:09:36", "remaining_time": "0:30:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 990, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.9927253243292505e-05, "epoch": 0.694980694980695, "percentage": 69.52, "elapsed_time": "1:09:41", "remaining_time": "0:30:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 991, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.993456090808793e-05, "epoch": 0.6956826956826957, "percentage": 69.59, "elapsed_time": "1:09:45", "remaining_time": "0:30:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 992, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.994186120256965e-05, "epoch": 0.6963846963846964, "percentage": 69.66, "elapsed_time": "1:09:49", "remaining_time": "0:30:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 993, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.9949154141589696e-05, "epoch": 0.6970866970866971, "percentage": 69.73, "elapsed_time": "1:09:53", "remaining_time": "0:30:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 994, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.995643973995523e-05, "epoch": 0.6977886977886978, "percentage": 69.8, "elapsed_time": "1:09:57", "remaining_time": "0:30:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 995, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.9963718012428765e-05, "epoch": 0.6984906984906984, "percentage": 69.87, "elapsed_time": "1:10:01", "remaining_time": "0:30:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 996, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.9970988973728314e-05, "epoch": 0.6991926991926992, "percentage": 69.94, "elapsed_time": "1:10:05", "remaining_time": "0:30:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 997, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.99782526385276e-05, "epoch": 0.6998946998946999, "percentage": 70.01, "elapsed_time": "1:10:10", "remaining_time": "0:30:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 998, "total_steps": 1424, "loss": 0.0025, "accuracy": 1.0, "learning_rate": 4.998550902145619e-05, "epoch": 0.7005967005967007, "percentage": 70.08, "elapsed_time": "1:10:14", "remaining_time": "0:29:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 999, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.999275813709971e-05, "epoch": 0.7012987012987013, "percentage": 70.15, "elapsed_time": "1:10:18", "remaining_time": "0:29:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 1424, "loss": 0.0011, "accuracy": 1.0, "learning_rate": 5e-05, "epoch": 0.702000702000702, "percentage": 70.22, "elapsed_time": "1:10:22", "remaining_time": "0:29:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1001, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.999931382857749e-05, "epoch": 0.7027027027027027, "percentage": 70.29, "elapsed_time": "1:10:34", "remaining_time": "0:29:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1002, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.9997255351980225e-05, "epoch": 0.7034047034047034, "percentage": 70.37, "elapsed_time": "1:10:38", "remaining_time": "0:29:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1003, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.999382468321693e-05, "epoch": 0.7041067041067041, "percentage": 70.44, "elapsed_time": "1:10:42", "remaining_time": "0:29:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1004, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.9989022010628595e-05, "epoch": 0.7048087048087048, "percentage": 70.51, "elapsed_time": "1:10:46", "remaining_time": "0:29:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1005, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.99828475978781e-05, "epoch": 0.7055107055107055, "percentage": 70.58, "elapsed_time": "1:10:50", "remaining_time": "0:29:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1006, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.997530178393581e-05, "epoch": 0.7062127062127063, "percentage": 70.65, "elapsed_time": "1:10:54", "remaining_time": "0:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1007, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.99663849830609e-05, "epoch": 0.7069147069147069, "percentage": 70.72, "elapsed_time": "1:10:59", "remaining_time": "0:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1008, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.995609768477863e-05, "epoch": 0.7076167076167076, "percentage": 70.79, "elapsed_time": "1:11:03", "remaining_time": "0:29:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1009, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.994444045385348e-05, "epoch": 0.7083187083187084, "percentage": 70.86, "elapsed_time": "1:11:07", "remaining_time": "0:29:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1010, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.993141393025816e-05, "epoch": 0.709020709020709, "percentage": 70.93, "elapsed_time": "1:11:11", "remaining_time": "0:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1011, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.9917018829138434e-05, "epoch": 0.7097227097227097, "percentage": 71.0, "elapsed_time": "1:11:15", "remaining_time": "0:29:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1012, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.990125594077389e-05, "epoch": 0.7104247104247104, "percentage": 71.07, "elapsed_time": "1:11:19", "remaining_time": "0:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1013, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.988412613053455e-05, "epoch": 0.7111267111267111, "percentage": 71.14, "elapsed_time": "1:11:23", "remaining_time": "0:28:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1014, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.986563033883335e-05, "epoch": 0.7118287118287119, "percentage": 71.21, "elapsed_time": "1:11:28", "remaining_time": "0:28:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1015, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.9845769581074534e-05, "epoch": 0.7125307125307125, "percentage": 71.28, "elapsed_time": "1:11:32", "remaining_time": "0:28:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1016, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.9824544947597894e-05, "epoch": 0.7132327132327132, "percentage": 71.35, "elapsed_time": "1:11:36", "remaining_time": "0:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1017, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.980195760361889e-05, "epoch": 0.713934713934714, "percentage": 71.42, "elapsed_time": "1:11:40", "remaining_time": "0:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1018, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.977800878916474e-05, "epoch": 0.7146367146367146, "percentage": 71.49, "elapsed_time": "1:11:44", "remaining_time": "0:28:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1019, "total_steps": 1424, "loss": 0.0012, "accuracy": 1.0, "learning_rate": 4.975269981900627e-05, "epoch": 0.7153387153387153, "percentage": 71.56, "elapsed_time": "1:11:48", "remaining_time": "0:28:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1020, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.97260320825858e-05, "epoch": 0.7160407160407161, "percentage": 71.63, "elapsed_time": "1:11:52", "remaining_time": "0:28:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1021, "total_steps": 1424, "loss": 0.0702, "accuracy": 1.0, "learning_rate": 4.969800704394081e-05, "epoch": 0.7167427167427167, "percentage": 71.7, "elapsed_time": "1:11:57", "remaining_time": "0:28:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1022, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.9668626241623635e-05, "epoch": 0.7174447174447175, "percentage": 71.77, "elapsed_time": "1:12:01", "remaining_time": "0:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1023, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.963789128861689e-05, "epoch": 0.7181467181467182, "percentage": 71.84, "elapsed_time": "1:12:05", "remaining_time": "0:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1024, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.960580387224505e-05, "epoch": 0.7188487188487188, "percentage": 71.91, "elapsed_time": "1:12:09", "remaining_time": "0:28:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1025, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.957236575408172e-05, "epoch": 0.7195507195507196, "percentage": 71.98, "elapsed_time": "1:12:13", "remaining_time": "0:28:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1026, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.953757876985294e-05, "epoch": 0.7202527202527202, "percentage": 72.05, "elapsed_time": "1:12:17", "remaining_time": "0:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1027, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.9501444829336464e-05, "epoch": 0.7209547209547209, "percentage": 72.12, "elapsed_time": "1:12:22", "remaining_time": "0:27:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1028, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.9463965916256854e-05, "epoch": 0.7216567216567217, "percentage": 72.19, "elapsed_time": "1:12:26", "remaining_time": "0:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1029, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.9425144088176586e-05, "epoch": 0.7223587223587223, "percentage": 72.26, "elapsed_time": "1:12:30", "remaining_time": "0:27:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1030, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.938498147638311e-05, "epoch": 0.7230607230607231, "percentage": 72.33, "elapsed_time": "1:12:34", "remaining_time": "0:27:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1031, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.9343480285771825e-05, "epoch": 0.7237627237627238, "percentage": 72.4, "elapsed_time": "1:12:38", "remaining_time": "0:27:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1032, "total_steps": 1424, "loss": 0.0052, "accuracy": 1.0, "learning_rate": 4.930064279472507e-05, "epoch": 0.7244647244647244, "percentage": 72.47, "elapsed_time": "1:12:42", "remaining_time": "0:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1033, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.925647135498698e-05, "epoch": 0.7251667251667252, "percentage": 72.54, "elapsed_time": "1:12:46", "remaining_time": "0:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1034, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.921096839153443e-05, "epoch": 0.7258687258687259, "percentage": 72.61, "elapsed_time": "1:12:51", "remaining_time": "0:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1035, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.916413640244386e-05, "epoch": 0.7265707265707265, "percentage": 72.68, "elapsed_time": "1:12:55", "remaining_time": "0:27:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1036, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.91159779587542e-05, "epoch": 0.7272727272727273, "percentage": 72.75, "elapsed_time": "1:12:59", "remaining_time": "0:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1037, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.906649570432566e-05, "epoch": 0.727974727974728, "percentage": 72.82, "elapsed_time": "1:13:03", "remaining_time": "0:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1038, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.90156923556946e-05, "epoch": 0.7286767286767287, "percentage": 72.89, "elapsed_time": "1:13:07", "remaining_time": "0:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1039, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8963570701924404e-05, "epoch": 0.7293787293787294, "percentage": 72.96, "elapsed_time": "1:13:11", "remaining_time": "0:27:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1040, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8910133604452376e-05, "epoch": 0.73008073008073, "percentage": 73.03, "elapsed_time": "1:13:15", "remaining_time": "0:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1041, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.88553839969326e-05, "epoch": 0.7307827307827308, "percentage": 73.1, "elapsed_time": "1:13:20", "remaining_time": "0:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1042, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.879932488507493e-05, "epoch": 0.7314847314847315, "percentage": 73.17, "elapsed_time": "1:13:24", "remaining_time": "0:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1043, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.874195934647999e-05, "epoch": 0.7321867321867321, "percentage": 73.24, "elapsed_time": "1:13:28", "remaining_time": "0:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1044, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8683290530470146e-05, "epoch": 0.7328887328887329, "percentage": 73.31, "elapsed_time": "1:13:32", "remaining_time": "0:26:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1045, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8623321657916704e-05, "epoch": 0.7335907335907336, "percentage": 73.38, "elapsed_time": "1:13:36", "remaining_time": "0:26:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1046, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8562056021063e-05, "epoch": 0.7342927342927343, "percentage": 73.46, "elapsed_time": "1:13:40", "remaining_time": "0:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1047, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8499496983343704e-05, "epoch": 0.734994734994735, "percentage": 73.53, "elapsed_time": "1:13:45", "remaining_time": "0:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1048, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.84356479792002e-05, "epoch": 0.7356967356967357, "percentage": 73.6, "elapsed_time": "1:13:49", "remaining_time": "0:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1049, "total_steps": 1424, "loss": 0.0008, "accuracy": 1.0, "learning_rate": 4.8370512513891935e-05, "epoch": 0.7363987363987364, "percentage": 73.67, "elapsed_time": "1:13:53", "remaining_time": "0:26:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 4.8304094163304124e-05, "epoch": 0.7371007371007371, "percentage": 73.74, "elapsed_time": "1:13:57", "remaining_time": "0:26:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1051, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.8236396573751306e-05, "epoch": 0.7378027378027378, "percentage": 73.81, "elapsed_time": "1:14:01", "remaining_time": "0:26:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1052, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.8167423461777255e-05, "epoch": 0.7385047385047385, "percentage": 73.88, "elapsed_time": "1:14:05", "remaining_time": "0:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1053, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.80971786139509e-05, "epoch": 0.7392067392067392, "percentage": 73.95, "elapsed_time": "1:14:09", "remaining_time": "0:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1054, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.802566588665842e-05, "epoch": 0.73990873990874, "percentage": 74.02, "elapsed_time": "1:14:14", "remaining_time": "0:26:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1055, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.7952889205891635e-05, "epoch": 0.7406107406107406, "percentage": 74.09, "elapsed_time": "1:14:18", "remaining_time": "0:25:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1056, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.787885256703236e-05, "epoch": 0.7413127413127413, "percentage": 74.16, "elapsed_time": "1:14:22", "remaining_time": "0:25:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1057, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.78035600346331e-05, "epoch": 0.742014742014742, "percentage": 74.23, "elapsed_time": "1:14:26", "remaining_time": "0:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1058, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.7727015742193945e-05, "epoch": 0.7427167427167427, "percentage": 74.3, "elapsed_time": "1:14:30", "remaining_time": "0:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1059, "total_steps": 1424, "loss": 0.0098, "accuracy": 1.0, "learning_rate": 4.7649223891935594e-05, "epoch": 0.7434187434187434, "percentage": 74.37, "elapsed_time": "1:14:34", "remaining_time": "0:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1060, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.757018875456868e-05, "epoch": 0.7441207441207441, "percentage": 74.44, "elapsed_time": "1:14:38", "remaining_time": "0:25:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1061, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.748991466905931e-05, "epoch": 0.7448227448227448, "percentage": 74.51, "elapsed_time": "1:14:43", "remaining_time": "0:25:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1062, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.740840604239086e-05, "epoch": 0.7455247455247456, "percentage": 74.58, "elapsed_time": "1:14:47", "remaining_time": "0:25:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1063, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.7325667349322035e-05, "epoch": 0.7462267462267462, "percentage": 74.65, "elapsed_time": "1:14:51", "remaining_time": "0:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1064, "total_steps": 1424, "loss": 0.0222, "accuracy": 1.0, "learning_rate": 4.72417031321412e-05, "epoch": 0.7469287469287469, "percentage": 74.72, "elapsed_time": "1:14:55", "remaining_time": "0:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1065, "total_steps": 1424, "loss": 0.0042, "accuracy": 1.0, "learning_rate": 4.715651800041701e-05, "epoch": 0.7476307476307477, "percentage": 74.79, "elapsed_time": "1:14:59", "remaining_time": "0:25:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1066, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.707011663074538e-05, "epoch": 0.7483327483327483, "percentage": 74.86, "elapsed_time": "1:15:03", "remaining_time": "0:25:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1067, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.698250376649269e-05, "epoch": 0.749034749034749, "percentage": 74.93, "elapsed_time": "1:15:08", "remaining_time": "0:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1068, "total_steps": 1424, "loss": 0.0042, "accuracy": 1.0, "learning_rate": 4.6893684217535426e-05, "epoch": 0.7497367497367498, "percentage": 75.0, "elapsed_time": "1:15:12", "remaining_time": "0:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1069, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.6803662859996126e-05, "epoch": 0.7504387504387504, "percentage": 75.07, "elapsed_time": "1:15:16", "remaining_time": "0:24:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1070, "total_steps": 1424, "loss": 0.0272, "accuracy": 1.0, "learning_rate": 4.67124446359756e-05, "epoch": 0.7511407511407512, "percentage": 75.14, "elapsed_time": "1:15:20", "remaining_time": "0:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1071, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.662003455328173e-05, "epoch": 0.7518427518427518, "percentage": 75.21, "elapsed_time": "1:15:24", "remaining_time": "0:24:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1072, "total_steps": 1424, "loss": 0.0394, "accuracy": 1.0, "learning_rate": 4.652643768515447e-05, "epoch": 0.7525447525447525, "percentage": 75.28, "elapsed_time": "1:15:28", "remaining_time": "0:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1073, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.643165916998735e-05, "epoch": 0.7532467532467533, "percentage": 75.35, "elapsed_time": "1:15:33", "remaining_time": "0:24:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1074, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.633570421104539e-05, "epoch": 0.7539487539487539, "percentage": 75.42, "elapsed_time": "1:15:37", "remaining_time": "0:24:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1075, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.6238578076179414e-05, "epoch": 0.7546507546507546, "percentage": 75.49, "elapsed_time": "1:15:41", "remaining_time": "0:24:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1076, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.614028609753689e-05, "epoch": 0.7553527553527554, "percentage": 75.56, "elapsed_time": "1:15:45", "remaining_time": "0:24:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1077, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.6040833671269204e-05, "epoch": 0.756054756054756, "percentage": 75.63, "elapsed_time": "1:15:49", "remaining_time": "0:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1078, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.594022625723533e-05, "epoch": 0.7567567567567568, "percentage": 75.7, "elapsed_time": "1:15:53", "remaining_time": "0:24:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1079, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.58384693787022e-05, "epoch": 0.7574587574587575, "percentage": 75.77, "elapsed_time": "1:15:57", "remaining_time": "0:24:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1080, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.573556862204142e-05, "epoch": 0.7581607581607581, "percentage": 75.84, "elapsed_time": "1:16:01", "remaining_time": "0:24:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1081, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.56315296364226e-05, "epoch": 0.7588627588627589, "percentage": 75.91, "elapsed_time": "1:16:06", "remaining_time": "0:24:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1082, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.552635813350319e-05, "epoch": 0.7595647595647596, "percentage": 75.98, "elapsed_time": "1:16:10", "remaining_time": "0:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1083, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.542005988711497e-05, "epoch": 0.7602667602667603, "percentage": 76.05, "elapsed_time": "1:16:14", "remaining_time": "0:24:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1084, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.531264073294702e-05, "epoch": 0.760968760968761, "percentage": 76.12, "elapsed_time": "1:16:18", "remaining_time": "0:23:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1085, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.5204106568225364e-05, "epoch": 0.7616707616707616, "percentage": 76.19, "elapsed_time": "1:16:22", "remaining_time": "0:23:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1086, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.5094463351389225e-05, "epoch": 0.7623727623727624, "percentage": 76.26, "elapsed_time": "1:16:26", "remaining_time": "0:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1087, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.4983717101763894e-05, "epoch": 0.7630747630747631, "percentage": 76.33, "elapsed_time": "1:16:30", "remaining_time": "0:23:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1088, "total_steps": 1424, "loss": 0.0007, "accuracy": 1.0, "learning_rate": 4.48718738992303e-05, "epoch": 0.7637767637767637, "percentage": 76.4, "elapsed_time": "1:16:35", "remaining_time": "0:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1089, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.4758939883891196e-05, "epoch": 0.7644787644787645, "percentage": 76.47, "elapsed_time": "1:16:39", "remaining_time": "0:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1090, "total_steps": 1424, "loss": 0.0009, "accuracy": 1.0, "learning_rate": 4.464492125573411e-05, "epoch": 0.7651807651807652, "percentage": 76.54, "elapsed_time": "1:16:43", "remaining_time": "0:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1091, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.452982427429092e-05, "epoch": 0.7658827658827659, "percentage": 76.62, "elapsed_time": "1:16:47", "remaining_time": "0:23:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1092, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.441365525829427e-05, "epoch": 0.7665847665847666, "percentage": 76.69, "elapsed_time": "1:16:51", "remaining_time": "0:23:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1093, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.4296420585330625e-05, "epoch": 0.7672867672867673, "percentage": 76.76, "elapsed_time": "1:16:55", "remaining_time": "0:23:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1094, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.417812669149019e-05, "epoch": 0.767988767988768, "percentage": 76.83, "elapsed_time": "1:16:59", "remaining_time": "0:23:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1095, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.405878007101354e-05, "epoch": 0.7686907686907687, "percentage": 76.9, "elapsed_time": "1:17:03", "remaining_time": "0:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1096, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.39383872759351e-05, "epoch": 0.7693927693927693, "percentage": 76.97, "elapsed_time": "1:17:08", "remaining_time": "0:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1097, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.381695491572346e-05, "epoch": 0.7700947700947701, "percentage": 77.04, "elapsed_time": "1:17:12", "remaining_time": "0:23:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1098, "total_steps": 1424, "loss": 0.0018, "accuracy": 1.0, "learning_rate": 4.36944896569185e-05, "epoch": 0.7707967707967708, "percentage": 77.11, "elapsed_time": "1:17:16", "remaining_time": "0:22:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1099, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.3570998222765404e-05, "epoch": 0.7714987714987716, "percentage": 77.18, "elapsed_time": "1:17:20", "remaining_time": "0:22:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1100, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.344648739284558e-05, "epoch": 0.7722007722007722, "percentage": 77.25, "elapsed_time": "1:17:24", "remaining_time": "0:22:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1101, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.332096400270444e-05, "epoch": 0.7729027729027729, "percentage": 77.32, "elapsed_time": "1:17:35", "remaining_time": "0:22:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1102, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.3194434943476174e-05, "epoch": 0.7736047736047736, "percentage": 77.39, "elapsed_time": "1:17:40", "remaining_time": "0:22:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1103, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.3066907161505356e-05, "epoch": 0.7743067743067743, "percentage": 77.46, "elapsed_time": "1:17:44", "remaining_time": "0:22:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1104, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.2938387657965666e-05, "epoch": 0.775008775008775, "percentage": 77.53, "elapsed_time": "1:17:48", "remaining_time": "0:22:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1105, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.2808883488475535e-05, "epoch": 0.7757107757107757, "percentage": 77.6, "elapsed_time": "1:17:52", "remaining_time": "0:22:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1106, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.2678401762710726e-05, "epoch": 0.7764127764127764, "percentage": 77.67, "elapsed_time": "1:17:56", "remaining_time": "0:22:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1107, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.2546949644014096e-05, "epoch": 0.7771147771147772, "percentage": 77.74, "elapsed_time": "1:18:00", "remaining_time": "0:22:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1108, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.241453434900228e-05, "epoch": 0.7778167778167778, "percentage": 77.81, "elapsed_time": "1:18:05", "remaining_time": "0:22:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1109, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.2281163147169525e-05, "epoch": 0.7785187785187785, "percentage": 77.88, "elapsed_time": "1:18:09", "remaining_time": "0:22:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1110, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.2146843360488635e-05, "epoch": 0.7792207792207793, "percentage": 77.95, "elapsed_time": "1:18:13", "remaining_time": "0:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1111, "total_steps": 1424, "loss": 0.0097, "accuracy": 1.0, "learning_rate": 4.2011582363008926e-05, "epoch": 0.7799227799227799, "percentage": 78.02, "elapsed_time": "1:18:17", "remaining_time": "0:22:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1112, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.187538758045147e-05, "epoch": 0.7806247806247806, "percentage": 78.09, "elapsed_time": "1:18:21", "remaining_time": "0:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1113, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.173826648980136e-05, "epoch": 0.7813267813267813, "percentage": 78.16, "elapsed_time": "1:18:25", "remaining_time": "0:21:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1114, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.160022661889731e-05, "epoch": 0.782028782028782, "percentage": 78.23, "elapsed_time": "1:18:30", "remaining_time": "0:21:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1115, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.146127554601829e-05, "epoch": 0.7827307827307828, "percentage": 78.3, "elapsed_time": "1:18:34", "remaining_time": "0:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1116, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 4.132142089946757e-05, "epoch": 0.7834327834327834, "percentage": 78.37, "elapsed_time": "1:18:38", "remaining_time": "0:21:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1117, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.1180670357153876e-05, "epoch": 0.7841347841347841, "percentage": 78.44, "elapsed_time": "1:18:42", "remaining_time": "0:21:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1118, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.1039031646169915e-05, "epoch": 0.7848367848367849, "percentage": 78.51, "elapsed_time": "1:18:46", "remaining_time": "0:21:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1119, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.089651254236812e-05, "epoch": 0.7855387855387855, "percentage": 78.58, "elapsed_time": "1:18:50", "remaining_time": "0:21:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1120, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.0753120869933834e-05, "epoch": 0.7862407862407862, "percentage": 78.65, "elapsed_time": "1:18:55", "remaining_time": "0:21:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1121, "total_steps": 1424, "loss": 0.0043, "accuracy": 1.0, "learning_rate": 4.060886450095565e-05, "epoch": 0.786942786942787, "percentage": 78.72, "elapsed_time": "1:18:59", "remaining_time": "0:21:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1122, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.0463751354993395e-05, "epoch": 0.7876447876447876, "percentage": 78.79, "elapsed_time": "1:19:03", "remaining_time": "0:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1123, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.0317789398643214e-05, "epoch": 0.7883467883467884, "percentage": 78.86, "elapsed_time": "1:19:07", "remaining_time": "0:21:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1124, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.0170986645100286e-05, "epoch": 0.7890487890487891, "percentage": 78.93, "elapsed_time": "1:19:11", "remaining_time": "0:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1125, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.002335115371889e-05, "epoch": 0.7897507897507897, "percentage": 79.0, "elapsed_time": "1:19:15", "remaining_time": "0:21:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1126, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.987489102956994e-05, "epoch": 0.7904527904527905, "percentage": 79.07, "elapsed_time": "1:19:19", "remaining_time": "0:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1127, "total_steps": 1424, "loss": 0.0019, "accuracy": 1.0, "learning_rate": 3.972561442299604e-05, "epoch": 0.7911547911547911, "percentage": 79.14, "elapsed_time": "1:19:24", "remaining_time": "0:20:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1128, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.957552952916402e-05, "epoch": 0.7918567918567918, "percentage": 79.21, "elapsed_time": "1:19:28", "remaining_time": "0:20:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1129, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.942464458761504e-05, "epoch": 0.7925587925587926, "percentage": 79.28, "elapsed_time": "1:19:32", "remaining_time": "0:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1130, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.9272967881812254e-05, "epoch": 0.7932607932607932, "percentage": 79.35, "elapsed_time": "1:19:36", "remaining_time": "0:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1131, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.912050773868602e-05, "epoch": 0.793962793962794, "percentage": 79.42, "elapsed_time": "1:19:40", "remaining_time": "0:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1132, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.8967272528176805e-05, "epoch": 0.7946647946647947, "percentage": 79.49, "elapsed_time": "1:19:44", "remaining_time": "0:20:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1133, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.881327066277565e-05, "epoch": 0.7953667953667953, "percentage": 79.56, "elapsed_time": "1:19:49", "remaining_time": "0:20:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1134, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.865851059706233e-05, "epoch": 0.7960687960687961, "percentage": 79.63, "elapsed_time": "1:19:53", "remaining_time": "0:20:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1135, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.850300082724122e-05, "epoch": 0.7967707967707968, "percentage": 79.71, "elapsed_time": "1:19:57", "remaining_time": "0:20:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1136, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.8346749890674853e-05, "epoch": 0.7974727974727974, "percentage": 79.78, "elapsed_time": "1:20:01", "remaining_time": "0:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1137, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.818976636541524e-05, "epoch": 0.7981747981747982, "percentage": 79.85, "elapsed_time": "1:20:05", "remaining_time": "0:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1138, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.8032058869732905e-05, "epoch": 0.7988767988767989, "percentage": 79.92, "elapsed_time": "1:20:09", "remaining_time": "0:20:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1139, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.787363606164378e-05, "epoch": 0.7995787995787996, "percentage": 79.99, "elapsed_time": "1:20:13", "remaining_time": "0:20:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1140, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.7714506638433895e-05, "epoch": 0.8002808002808003, "percentage": 80.06, "elapsed_time": "1:20:17", "remaining_time": "0:20:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1141, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.7554679336181845e-05, "epoch": 0.800982800982801, "percentage": 80.13, "elapsed_time": "1:20:22", "remaining_time": "0:19:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1142, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.739416292927929e-05, "epoch": 0.8016848016848017, "percentage": 80.2, "elapsed_time": "1:20:26", "remaining_time": "0:19:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1143, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.7232966229949124e-05, "epoch": 0.8023868023868024, "percentage": 80.27, "elapsed_time": "1:20:30", "remaining_time": "0:19:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1144, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.7071098087761795e-05, "epoch": 0.803088803088803, "percentage": 80.34, "elapsed_time": "1:20:34", "remaining_time": "0:19:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1145, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.6908567389149424e-05, "epoch": 0.8037908037908038, "percentage": 80.41, "elapsed_time": "1:20:38", "remaining_time": "0:19:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1146, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 3.674538305691793e-05, "epoch": 0.8044928044928045, "percentage": 80.48, "elapsed_time": "1:20:42", "remaining_time": "0:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1147, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.6581554049757226e-05, "epoch": 0.8051948051948052, "percentage": 80.55, "elapsed_time": "1:20:46", "remaining_time": "0:19:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1148, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.6417089361749344e-05, "epoch": 0.8058968058968059, "percentage": 80.62, "elapsed_time": "1:20:51", "remaining_time": "0:19:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1149, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.62519980218747e-05, "epoch": 0.8065988065988066, "percentage": 80.69, "elapsed_time": "1:20:55", "remaining_time": "0:19:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1150, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 3.6086289093516385e-05, "epoch": 0.8073008073008073, "percentage": 80.76, "elapsed_time": "1:20:59", "remaining_time": "0:19:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1151, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.591997167396263e-05, "epoch": 0.808002808002808, "percentage": 80.83, "elapsed_time": "1:21:03", "remaining_time": "0:19:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1152, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.5753054893907326e-05, "epoch": 0.8087048087048087, "percentage": 80.9, "elapsed_time": "1:21:07", "remaining_time": "0:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1153, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.558554791694878e-05, "epoch": 0.8094068094068094, "percentage": 80.97, "elapsed_time": "1:21:11", "remaining_time": "0:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1154, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.541745993908666e-05, "epoch": 0.8101088101088101, "percentage": 81.04, "elapsed_time": "1:21:15", "remaining_time": "0:19:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1155, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.524880018821708e-05, "epoch": 0.8108108108108109, "percentage": 81.11, "elapsed_time": "1:21:20", "remaining_time": "0:18:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1156, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.507957792362609e-05, "epoch": 0.8115128115128115, "percentage": 81.18, "elapsed_time": "1:21:24", "remaining_time": "0:18:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1157, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.4909802435481256e-05, "epoch": 0.8122148122148122, "percentage": 81.25, "elapsed_time": "1:21:28", "remaining_time": "0:18:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1158, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 3.473948304432168e-05, "epoch": 0.812916812916813, "percentage": 81.32, "elapsed_time": "1:21:32", "remaining_time": "0:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1159, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.4568629100546333e-05, "epoch": 0.8136188136188136, "percentage": 81.39, "elapsed_time": "1:21:36", "remaining_time": "0:18:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1160, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.439724998390067e-05, "epoch": 0.8143208143208143, "percentage": 81.46, "elapsed_time": "1:21:40", "remaining_time": "0:18:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1161, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.4225355102961737e-05, "epoch": 0.815022815022815, "percentage": 81.53, "elapsed_time": "1:21:44", "remaining_time": "0:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1162, "total_steps": 1424, "loss": 0.0037, "accuracy": 1.0, "learning_rate": 3.405295389462161e-05, "epoch": 0.8157248157248157, "percentage": 81.6, "elapsed_time": "1:21:49", "remaining_time": "0:18:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1163, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.388005582356935e-05, "epoch": 0.8164268164268165, "percentage": 81.67, "elapsed_time": "1:21:53", "remaining_time": "0:18:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1164, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 3.370667038177139e-05, "epoch": 0.8171288171288171, "percentage": 81.74, "elapsed_time": "1:21:57", "remaining_time": "0:18:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1165, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.353280708795041e-05, "epoch": 0.8178308178308178, "percentage": 81.81, "elapsed_time": "1:22:01", "remaining_time": "0:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1166, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.3358475487062804e-05, "epoch": 0.8185328185328186, "percentage": 81.88, "elapsed_time": "1:22:05", "remaining_time": "0:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1167, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.3183685149774654e-05, "epoch": 0.8192348192348192, "percentage": 81.95, "elapsed_time": "1:22:09", "remaining_time": "0:18:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1168, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 3.3008445671936286e-05, "epoch": 0.8199368199368199, "percentage": 82.02, "elapsed_time": "1:22:13", "remaining_time": "0:18:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1169, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.2832766674055486e-05, "epoch": 0.8206388206388207, "percentage": 82.09, "elapsed_time": "1:22:17", "remaining_time": "0:17:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1170, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.265665780076936e-05, "epoch": 0.8213408213408213, "percentage": 82.16, "elapsed_time": "1:22:22", "remaining_time": "0:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1171, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.248012872031482e-05, "epoch": 0.8220428220428221, "percentage": 82.23, "elapsed_time": "1:22:26", "remaining_time": "0:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1172, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.2303189123997806e-05, "epoch": 0.8227448227448227, "percentage": 82.3, "elapsed_time": "1:22:30", "remaining_time": "0:17:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1173, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 3.2125848725661265e-05, "epoch": 0.8234468234468234, "percentage": 82.37, "elapsed_time": "1:22:34", "remaining_time": "0:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1174, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.1948117261151865e-05, "epoch": 0.8241488241488242, "percentage": 82.44, "elapsed_time": "1:22:38", "remaining_time": "0:17:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1175, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.177000448778548e-05, "epoch": 0.8248508248508248, "percentage": 82.51, "elapsed_time": "1:22:42", "remaining_time": "0:17:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1176, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.159152018381152e-05, "epoch": 0.8255528255528255, "percentage": 82.58, "elapsed_time": "1:22:46", "remaining_time": "0:17:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1177, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.141267414787618e-05, "epoch": 0.8262548262548263, "percentage": 82.65, "elapsed_time": "1:22:50", "remaining_time": "0:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1178, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.1233476198484396e-05, "epoch": 0.8269568269568269, "percentage": 82.72, "elapsed_time": "1:22:55", "remaining_time": "0:17:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1179, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.105393617346091e-05, "epoch": 0.8276588276588277, "percentage": 82.79, "elapsed_time": "1:22:59", "remaining_time": "0:17:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1180, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.087406392941015e-05, "epoch": 0.8283608283608284, "percentage": 82.87, "elapsed_time": "1:23:03", "remaining_time": "0:17:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1181, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.0693869341175055e-05, "epoch": 0.829062829062829, "percentage": 82.94, "elapsed_time": "1:23:07", "remaining_time": "0:17:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1182, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.051336230129504e-05, "epoch": 0.8297648297648298, "percentage": 83.01, "elapsed_time": "1:23:11", "remaining_time": "0:17:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1183, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.033255271946287e-05, "epoch": 0.8304668304668305, "percentage": 83.08, "elapsed_time": "1:23:15", "remaining_time": "0:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1184, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.0151450521980612e-05, "epoch": 0.8311688311688312, "percentage": 83.15, "elapsed_time": "1:23:19", "remaining_time": "0:16:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1185, "total_steps": 1424, "loss": 0.005, "accuracy": 1.0, "learning_rate": 2.9970065651214692e-05, "epoch": 0.8318708318708319, "percentage": 83.22, "elapsed_time": "1:23:23", "remaining_time": "0:16:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1186, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.97884080650501e-05, "epoch": 0.8325728325728325, "percentage": 83.29, "elapsed_time": "1:23:28", "remaining_time": "0:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1187, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 2.9606487736343637e-05, "epoch": 0.8332748332748333, "percentage": 83.36, "elapsed_time": "1:23:32", "remaining_time": "0:16:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1188, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.9424314652376516e-05, "epoch": 0.833976833976834, "percentage": 83.43, "elapsed_time": "1:23:36", "remaining_time": "0:16:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1189, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.924189881430598e-05, "epoch": 0.8346788346788346, "percentage": 83.5, "elapsed_time": "1:23:40", "remaining_time": "0:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1190, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.905925023661628e-05, "epoch": 0.8353808353808354, "percentage": 83.57, "elapsed_time": "1:23:44", "remaining_time": "0:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1191, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 2.8876378946568893e-05, "epoch": 0.8360828360828361, "percentage": 83.64, "elapsed_time": "1:23:48", "remaining_time": "0:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1192, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.8693294983652032e-05, "epoch": 0.8367848367848368, "percentage": 83.71, "elapsed_time": "1:23:52", "remaining_time": "0:16:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1193, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.8510008399029458e-05, "epoch": 0.8374868374868375, "percentage": 83.78, "elapsed_time": "1:23:56", "remaining_time": "0:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1194, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.8326529254988742e-05, "epoch": 0.8381888381888382, "percentage": 83.85, "elapsed_time": "1:24:01", "remaining_time": "0:16:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1195, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.814286762438878e-05, "epoch": 0.8388908388908389, "percentage": 83.92, "elapsed_time": "1:24:05", "remaining_time": "0:16:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1196, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.795903359010685e-05, "epoch": 0.8395928395928396, "percentage": 83.99, "elapsed_time": "1:24:09", "remaining_time": "0:16:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1197, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.777503724448504e-05, "epoch": 0.8402948402948403, "percentage": 84.06, "elapsed_time": "1:24:13", "remaining_time": "0:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1198, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.7590888688776223e-05, "epoch": 0.840996840996841, "percentage": 84.13, "elapsed_time": "1:24:17", "remaining_time": "0:15:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1199, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 2.7406598032589475e-05, "epoch": 0.8416988416988417, "percentage": 84.2, "elapsed_time": "1:24:21", "remaining_time": "0:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1200, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.7222175393335063e-05, "epoch": 0.8424008424008425, "percentage": 84.27, "elapsed_time": "1:24:25", "remaining_time": "0:15:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1201, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.7037630895669043e-05, "epoch": 0.8431028431028431, "percentage": 84.34, "elapsed_time": "1:24:36", "remaining_time": "0:15:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1202, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 2.685297467093738e-05, "epoch": 0.8438048438048438, "percentage": 84.41, "elapsed_time": "1:24:40", "remaining_time": "0:15:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1203, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.6668216856619775e-05, "epoch": 0.8445068445068445, "percentage": 84.48, "elapsed_time": "1:24:44", "remaining_time": "0:15:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1204, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.6483367595773123e-05, "epoch": 0.8452088452088452, "percentage": 84.55, "elapsed_time": "1:24:48", "remaining_time": "0:15:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1205, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 2.6298437036474648e-05, "epoch": 0.8459108459108459, "percentage": 84.62, "elapsed_time": "1:24:53", "remaining_time": "0:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1206, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.611343533126479e-05, "epoch": 0.8466128466128466, "percentage": 84.69, "elapsed_time": "1:24:57", "remaining_time": "0:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1207, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.5928372636589865e-05, "epoch": 0.8473148473148473, "percentage": 84.76, "elapsed_time": "1:25:01", "remaining_time": "0:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1208, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.5743259112244435e-05, "epoch": 0.8480168480168481, "percentage": 84.83, "elapsed_time": "1:25:05", "remaining_time": "0:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1209, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 2.5558104920813602e-05, "epoch": 0.8487188487188487, "percentage": 84.9, "elapsed_time": "1:25:09", "remaining_time": "0:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1210, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.5372920227115033e-05, "epoch": 0.8494208494208494, "percentage": 84.97, "elapsed_time": "1:25:13", "remaining_time": "0:15:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1211, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.518771519764095e-05, "epoch": 0.8501228501228502, "percentage": 85.04, "elapsed_time": "1:25:18", "remaining_time": "0:15:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1212, "total_steps": 1424, "loss": 0.0315, "accuracy": 1.0, "learning_rate": 2.50025e-05, "epoch": 0.8508248508248508, "percentage": 85.11, "elapsed_time": "1:25:22", "remaining_time": "0:14:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1213, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.4817284802359054e-05, "epoch": 0.8515268515268515, "percentage": 85.18, "elapsed_time": "1:25:26", "remaining_time": "0:14:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1214, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 2.463207977288497e-05, "epoch": 0.8522288522288523, "percentage": 85.25, "elapsed_time": "1:25:30", "remaining_time": "0:14:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1215, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.4446895079186404e-05, "epoch": 0.8529308529308529, "percentage": 85.32, "elapsed_time": "1:25:34", "remaining_time": "0:14:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1216, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 2.426174088775557e-05, "epoch": 0.8536328536328537, "percentage": 85.39, "elapsed_time": "1:25:38", "remaining_time": "0:14:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1217, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.4076627363410145e-05, "epoch": 0.8543348543348543, "percentage": 85.46, "elapsed_time": "1:25:42", "remaining_time": "0:14:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1218, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.389156466873522e-05, "epoch": 0.855036855036855, "percentage": 85.53, "elapsed_time": "1:25:47", "remaining_time": "0:14:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1219, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.3706562963525355e-05, "epoch": 0.8557388557388558, "percentage": 85.6, "elapsed_time": "1:25:51", "remaining_time": "0:14:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1220, "total_steps": 1424, "loss": 0.0359, "accuracy": 1.0, "learning_rate": 2.3521632404226873e-05, "epoch": 0.8564408564408564, "percentage": 85.67, "elapsed_time": "1:25:55", "remaining_time": "0:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1221, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.3336783143380218e-05, "epoch": 0.8571428571428571, "percentage": 85.74, "elapsed_time": "1:25:59", "remaining_time": "0:14:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1222, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.315202532906262e-05, "epoch": 0.8578448578448579, "percentage": 85.81, "elapsed_time": "1:26:03", "remaining_time": "0:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1223, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.2967369104330957e-05, "epoch": 0.8585468585468585, "percentage": 85.88, "elapsed_time": "1:26:07", "remaining_time": "0:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1224, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.278282460666494e-05, "epoch": 0.8592488592488593, "percentage": 85.96, "elapsed_time": "1:26:11", "remaining_time": "0:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1225, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.2598401967410532e-05, "epoch": 0.85995085995086, "percentage": 86.03, "elapsed_time": "1:26:16", "remaining_time": "0:14:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1226, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.2414111311223784e-05, "epoch": 0.8606528606528606, "percentage": 86.1, "elapsed_time": "1:26:20", "remaining_time": "0:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1227, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.222996275551497e-05, "epoch": 0.8613548613548614, "percentage": 86.17, "elapsed_time": "1:26:24", "remaining_time": "0:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1228, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.2045966409893164e-05, "epoch": 0.862056862056862, "percentage": 86.24, "elapsed_time": "1:26:28", "remaining_time": "0:13:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1229, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.1862132375611227e-05, "epoch": 0.8627588627588627, "percentage": 86.31, "elapsed_time": "1:26:32", "remaining_time": "0:13:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1230, "total_steps": 1424, "loss": 0.0006, "accuracy": 1.0, "learning_rate": 2.1678470745011258e-05, "epoch": 0.8634608634608635, "percentage": 86.38, "elapsed_time": "1:26:36", "remaining_time": "0:13:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1231, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.1494991600970542e-05, "epoch": 0.8641628641628641, "percentage": 86.45, "elapsed_time": "1:26:40", "remaining_time": "0:13:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1232, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.131170501634798e-05, "epoch": 0.8648648648648649, "percentage": 86.52, "elapsed_time": "1:26:45", "remaining_time": "0:13:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1233, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 2.1128621053431113e-05, "epoch": 0.8655668655668656, "percentage": 86.59, "elapsed_time": "1:26:49", "remaining_time": "0:13:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1234, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 2.0945749763383727e-05, "epoch": 0.8662688662688662, "percentage": 86.66, "elapsed_time": "1:26:53", "remaining_time": "0:13:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1235, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.0763101185694027e-05, "epoch": 0.866970866970867, "percentage": 86.73, "elapsed_time": "1:26:57", "remaining_time": "0:13:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1236, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.0580685347623487e-05, "epoch": 0.8676728676728677, "percentage": 86.8, "elapsed_time": "1:27:01", "remaining_time": "0:13:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1237, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 2.039851226365636e-05, "epoch": 0.8683748683748683, "percentage": 86.87, "elapsed_time": "1:27:05", "remaining_time": "0:13:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1238, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.021659193494991e-05, "epoch": 0.8690768690768691, "percentage": 86.94, "elapsed_time": "1:27:09", "remaining_time": "0:13:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1239, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 2.0034934348785308e-05, "epoch": 0.8697788697788698, "percentage": 87.01, "elapsed_time": "1:27:14", "remaining_time": "0:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1240, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 1.9853549478019398e-05, "epoch": 0.8704808704808705, "percentage": 87.08, "elapsed_time": "1:27:18", "remaining_time": "0:12:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1241, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.9672447280537136e-05, "epoch": 0.8711828711828712, "percentage": 87.15, "elapsed_time": "1:27:22", "remaining_time": "0:12:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1242, "total_steps": 1424, "loss": 0.001, "accuracy": 1.0, "learning_rate": 1.9491637698704965e-05, "epoch": 0.8718848718848718, "percentage": 87.22, "elapsed_time": "1:27:26", "remaining_time": "0:12:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1243, "total_steps": 1424, "loss": 0.001, "accuracy": 1.0, "learning_rate": 1.9311130658824958e-05, "epoch": 0.8725868725868726, "percentage": 87.29, "elapsed_time": "1:27:30", "remaining_time": "0:12:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1244, "total_steps": 1424, "loss": 0.0015, "accuracy": 1.0, "learning_rate": 1.9130936070589864e-05, "epoch": 0.8732888732888733, "percentage": 87.36, "elapsed_time": "1:27:34", "remaining_time": "0:12:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1245, "total_steps": 1424, "loss": 0.0102, "accuracy": 1.0, "learning_rate": 1.8951063826539088e-05, "epoch": 0.8739908739908739, "percentage": 87.43, "elapsed_time": "1:27:38", "remaining_time": "0:12:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1246, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 1.877152380151561e-05, "epoch": 0.8746928746928747, "percentage": 87.5, "elapsed_time": "1:27:43", "remaining_time": "0:12:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1247, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.8592325852123832e-05, "epoch": 0.8753948753948754, "percentage": 87.57, "elapsed_time": "1:27:47", "remaining_time": "0:12:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1248, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.8413479816188488e-05, "epoch": 0.8760968760968761, "percentage": 87.64, "elapsed_time": "1:27:51", "remaining_time": "0:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1249, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.8234995512214535e-05, "epoch": 0.8767988767988768, "percentage": 87.71, "elapsed_time": "1:27:55", "remaining_time": "0:12:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1250, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.8056882738848145e-05, "epoch": 0.8775008775008775, "percentage": 87.78, "elapsed_time": "1:27:59", "remaining_time": "0:12:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1251, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.7879151274338734e-05, "epoch": 0.8782028782028782, "percentage": 87.85, "elapsed_time": "1:28:03", "remaining_time": "0:12:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1252, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.77018108760022e-05, "epoch": 0.8789048789048789, "percentage": 87.92, "elapsed_time": "1:28:07", "remaining_time": "0:12:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1253, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.752487127968518e-05, "epoch": 0.8796068796068796, "percentage": 87.99, "elapsed_time": "1:28:12", "remaining_time": "0:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1254, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.734834219923064e-05, "epoch": 0.8803088803088803, "percentage": 88.06, "elapsed_time": "1:28:16", "remaining_time": "0:11:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1255, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 1.717223332594451e-05, "epoch": 0.881010881010881, "percentage": 88.13, "elapsed_time": "1:28:20", "remaining_time": "0:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1256, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.6996554328063714e-05, "epoch": 0.8817128817128818, "percentage": 88.2, "elapsed_time": "1:28:24", "remaining_time": "0:11:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1257, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.6821314850225346e-05, "epoch": 0.8824148824148824, "percentage": 88.27, "elapsed_time": "1:28:28", "remaining_time": "0:11:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1258, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 1.6646524512937193e-05, "epoch": 0.8831168831168831, "percentage": 88.34, "elapsed_time": "1:28:32", "remaining_time": "0:11:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1259, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 1.6472192912049593e-05, "epoch": 0.8838188838188838, "percentage": 88.41, "elapsed_time": "1:28:36", "remaining_time": "0:11:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1260, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.629832961822862e-05, "epoch": 0.8845208845208845, "percentage": 88.48, "elapsed_time": "1:28:40", "remaining_time": "0:11:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1261, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.6124944176430657e-05, "epoch": 0.8852228852228852, "percentage": 88.55, "elapsed_time": "1:28:45", "remaining_time": "0:11:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1262, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.5952046105378398e-05, "epoch": 0.8859248859248859, "percentage": 88.62, "elapsed_time": "1:28:49", "remaining_time": "0:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1263, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 1.5779644897038273e-05, "epoch": 0.8866268866268866, "percentage": 88.69, "elapsed_time": "1:28:53", "remaining_time": "0:11:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1264, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.5607750016099335e-05, "epoch": 0.8873288873288874, "percentage": 88.76, "elapsed_time": "1:28:58", "remaining_time": "0:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1265, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.543637089945367e-05, "epoch": 0.888030888030888, "percentage": 88.83, "elapsed_time": "1:29:02", "remaining_time": "0:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1266, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.526551695567832e-05, "epoch": 0.8887328887328887, "percentage": 88.9, "elapsed_time": "1:29:06", "remaining_time": "0:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1267, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.5095197564518754e-05, "epoch": 0.8894348894348895, "percentage": 88.97, "elapsed_time": "1:29:10", "remaining_time": "0:11:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1268, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.4925422076373918e-05, "epoch": 0.8901368901368901, "percentage": 89.04, "elapsed_time": "1:29:14", "remaining_time": "0:10:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1269, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 1.4756199811782927e-05, "epoch": 0.8908388908388908, "percentage": 89.12, "elapsed_time": "1:29:18", "remaining_time": "0:10:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1270, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.4587540060913358e-05, "epoch": 0.8915408915408916, "percentage": 89.19, "elapsed_time": "1:29:22", "remaining_time": "0:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1271, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.4419452083051233e-05, "epoch": 0.8922428922428922, "percentage": 89.26, "elapsed_time": "1:29:27", "remaining_time": "0:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1272, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.4251945106092675e-05, "epoch": 0.892944892944893, "percentage": 89.33, "elapsed_time": "1:29:31", "remaining_time": "0:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1273, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.4085028326037369e-05, "epoch": 0.8936468936468936, "percentage": 89.4, "elapsed_time": "1:29:35", "remaining_time": "0:10:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1274, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.3918710906483615e-05, "epoch": 0.8943488943488943, "percentage": 89.47, "elapsed_time": "1:29:39", "remaining_time": "0:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1275, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.3753001978125304e-05, "epoch": 0.8950508950508951, "percentage": 89.54, "elapsed_time": "1:29:43", "remaining_time": "0:10:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1276, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 1.3587910638250659e-05, "epoch": 0.8957528957528957, "percentage": 89.61, "elapsed_time": "1:29:47", "remaining_time": "0:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1277, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.3423445950242778e-05, "epoch": 0.8964548964548964, "percentage": 89.68, "elapsed_time": "1:29:51", "remaining_time": "0:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1278, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.325961694308207e-05, "epoch": 0.8971568971568972, "percentage": 89.75, "elapsed_time": "1:29:56", "remaining_time": "0:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1279, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.3096432610850581e-05, "epoch": 0.8978588978588978, "percentage": 89.82, "elapsed_time": "1:30:00", "remaining_time": "0:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1280, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.2933901912238209e-05, "epoch": 0.8985608985608986, "percentage": 89.89, "elapsed_time": "1:30:04", "remaining_time": "0:10:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1281, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.2772033770050884e-05, "epoch": 0.8992628992628993, "percentage": 89.96, "elapsed_time": "1:30:08", "remaining_time": "0:10:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1282, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.2610837070720721e-05, "epoch": 0.8999648999648999, "percentage": 90.03, "elapsed_time": "1:30:12", "remaining_time": "0:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1283, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.2450320663818148e-05, "epoch": 0.9006669006669007, "percentage": 90.1, "elapsed_time": "1:30:16", "remaining_time": "0:09:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1284, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.2290493361566108e-05, "epoch": 0.9013689013689014, "percentage": 90.17, "elapsed_time": "1:30:21", "remaining_time": "0:09:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1285, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.2131363938356214e-05, "epoch": 0.9020709020709021, "percentage": 90.24, "elapsed_time": "1:30:25", "remaining_time": "0:09:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1286, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.1972941130267093e-05, "epoch": 0.9027729027729028, "percentage": 90.31, "elapsed_time": "1:30:29", "remaining_time": "0:09:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1287, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.1815233634584758e-05, "epoch": 0.9034749034749034, "percentage": 90.38, "elapsed_time": "1:30:33", "remaining_time": "0:09:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1288, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.1658250109325143e-05, "epoch": 0.9041769041769042, "percentage": 90.45, "elapsed_time": "1:30:37", "remaining_time": "0:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1289, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 1.1501999172758785e-05, "epoch": 0.9048789048789049, "percentage": 90.52, "elapsed_time": "1:30:41", "remaining_time": "0:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1290, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 1.1346489402937678e-05, "epoch": 0.9055809055809055, "percentage": 90.59, "elapsed_time": "1:30:45", "remaining_time": "0:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1291, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.1191729337224358e-05, "epoch": 0.9062829062829063, "percentage": 90.66, "elapsed_time": "1:30:50", "remaining_time": "0:09:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1292, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.1037727471823201e-05, "epoch": 0.906984906984907, "percentage": 90.73, "elapsed_time": "1:30:54", "remaining_time": "0:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1293, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.0884492261313986e-05, "epoch": 0.9076869076869077, "percentage": 90.8, "elapsed_time": "1:30:58", "remaining_time": "0:09:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1294, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 1.0732032118187756e-05, "epoch": 0.9083889083889084, "percentage": 90.87, "elapsed_time": "1:31:02", "remaining_time": "0:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1295, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 1.0580355412384968e-05, "epoch": 0.9090909090909091, "percentage": 90.94, "elapsed_time": "1:31:06", "remaining_time": "0:09:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1296, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.042947047083599e-05, "epoch": 0.9097929097929098, "percentage": 91.01, "elapsed_time": "1:31:10", "remaining_time": "0:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1297, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.0279385577003959e-05, "epoch": 0.9104949104949105, "percentage": 91.08, "elapsed_time": "1:31:14", "remaining_time": "0:08:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1298, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.0130108970430057e-05, "epoch": 0.9111969111969112, "percentage": 91.15, "elapsed_time": "1:31:19", "remaining_time": "0:08:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1299, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 9.981648846281106e-06, "epoch": 0.9118989118989119, "percentage": 91.22, "elapsed_time": "1:31:23", "remaining_time": "0:08:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1300, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 9.834013354899712e-06, "epoch": 0.9126009126009126, "percentage": 91.29, "elapsed_time": "1:31:27", "remaining_time": "0:08:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1301, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 9.687210601356786e-06, "epoch": 0.9133029133029134, "percentage": 91.36, "elapsed_time": "1:31:38", "remaining_time": "0:08:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1302, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 9.541248645006606e-06, "epoch": 0.914004914004914, "percentage": 91.43, "elapsed_time": "1:31:42", "remaining_time": "0:08:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1303, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 9.39613549904435e-06, "epoch": 0.9147069147069147, "percentage": 91.5, "elapsed_time": "1:31:46", "remaining_time": "0:08:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1304, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 9.25187913006618e-06, "epoch": 0.9154089154089154, "percentage": 91.57, "elapsed_time": "1:31:51", "remaining_time": "0:08:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1305, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 9.108487457631881e-06, "epoch": 0.9161109161109161, "percentage": 91.64, "elapsed_time": "1:31:55", "remaining_time": "0:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1306, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 8.965968353830092e-06, "epoch": 0.9168129168129168, "percentage": 91.71, "elapsed_time": "1:31:59", "remaining_time": "0:08:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1307, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 8.82432964284613e-06, "epoch": 0.9175149175149175, "percentage": 91.78, "elapsed_time": "1:32:03", "remaining_time": "0:08:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1308, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 8.68357910053244e-06, "epoch": 0.9182169182169182, "percentage": 91.85, "elapsed_time": "1:32:07", "remaining_time": "0:08:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1309, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 8.54372445398172e-06, "epoch": 0.918918918918919, "percentage": 91.92, "elapsed_time": "1:32:11", "remaining_time": "0:08:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1310, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 8.404773381102702e-06, "epoch": 0.9196209196209196, "percentage": 91.99, "elapsed_time": "1:32:16", "remaining_time": "0:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1311, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 8.266733510198643e-06, "epoch": 0.9203229203229203, "percentage": 92.06, "elapsed_time": "1:32:20", "remaining_time": "0:07:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1312, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 8.129612419548536e-06, "epoch": 0.9210249210249211, "percentage": 92.13, "elapsed_time": "1:32:24", "remaining_time": "0:07:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1313, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 7.993417636991077e-06, "epoch": 0.9217269217269217, "percentage": 92.21, "elapsed_time": "1:32:28", "remaining_time": "0:07:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1314, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 7.858156639511373e-06, "epoch": 0.9224289224289224, "percentage": 92.28, "elapsed_time": "1:32:32", "remaining_time": "0:07:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1315, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 7.723836852830477e-06, "epoch": 0.9231309231309232, "percentage": 92.35, "elapsed_time": "1:32:36", "remaining_time": "0:07:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1316, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 7.590465650997731e-06, "epoch": 0.9238329238329238, "percentage": 92.42, "elapsed_time": "1:32:40", "remaining_time": "0:07:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1317, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 7.458050355985914e-06, "epoch": 0.9245349245349246, "percentage": 92.49, "elapsed_time": "1:32:45", "remaining_time": "0:07:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1318, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 7.32659823728928e-06, "epoch": 0.9252369252369252, "percentage": 92.56, "elapsed_time": "1:32:49", "remaining_time": "0:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1319, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 7.196116511524472e-06, "epoch": 0.9259389259389259, "percentage": 92.63, "elapsed_time": "1:32:53", "remaining_time": "0:07:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1320, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 7.066612342034335e-06, "epoch": 0.9266409266409267, "percentage": 92.7, "elapsed_time": "1:32:57", "remaining_time": "0:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1321, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 6.938092838494651e-06, "epoch": 0.9273429273429273, "percentage": 92.77, "elapsed_time": "1:33:01", "remaining_time": "0:07:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1322, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 6.810565056523835e-06, "epoch": 0.928044928044928, "percentage": 92.84, "elapsed_time": "1:33:05", "remaining_time": "0:07:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1323, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 6.6840359972955585e-06, "epoch": 0.9287469287469288, "percentage": 92.91, "elapsed_time": "1:33:10", "remaining_time": "0:07:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1324, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 6.558512607154426e-06, "epoch": 0.9294489294489294, "percentage": 92.98, "elapsed_time": "1:33:14", "remaining_time": "0:07:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1325, "total_steps": 1424, "loss": 0.0011, "accuracy": 1.0, "learning_rate": 6.4340017772346075e-06, "epoch": 0.9301509301509302, "percentage": 93.05, "elapsed_time": "1:33:18", "remaining_time": "0:06:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1326, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 6.310510343081513e-06, "epoch": 0.9308529308529309, "percentage": 93.12, "elapsed_time": "1:33:22", "remaining_time": "0:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1327, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 6.188045084276546e-06, "epoch": 0.9315549315549315, "percentage": 93.19, "elapsed_time": "1:33:26", "remaining_time": "0:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1328, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 6.0666127240649095e-06, "epoch": 0.9322569322569323, "percentage": 93.26, "elapsed_time": "1:33:30", "remaining_time": "0:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1329, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 5.946219928986463e-06, "epoch": 0.932958932958933, "percentage": 93.33, "elapsed_time": "1:33:34", "remaining_time": "0:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1330, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 5.82687330850982e-06, "epoch": 0.9336609336609336, "percentage": 93.4, "elapsed_time": "1:33:39", "remaining_time": "0:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1331, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 5.708579414669377e-06, "epoch": 0.9343629343629344, "percentage": 93.47, "elapsed_time": "1:33:43", "remaining_time": "0:06:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1332, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 5.59134474170573e-06, "epoch": 0.935064935064935, "percentage": 93.54, "elapsed_time": "1:33:47", "remaining_time": "0:06:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1333, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 5.475175725709085e-06, "epoch": 0.9357669357669358, "percentage": 93.61, "elapsed_time": "1:33:51", "remaining_time": "0:06:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1334, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 5.360078744265891e-06, "epoch": 0.9364689364689365, "percentage": 93.68, "elapsed_time": "1:33:55", "remaining_time": "0:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1335, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 5.246060116108807e-06, "epoch": 0.9371709371709371, "percentage": 93.75, "elapsed_time": "1:33:59", "remaining_time": "0:06:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1336, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 5.133126100769699e-06, "epoch": 0.9378729378729379, "percentage": 93.82, "elapsed_time": "1:34:04", "remaining_time": "0:06:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1337, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 5.021282898236112e-06, "epoch": 0.9385749385749386, "percentage": 93.89, "elapsed_time": "1:34:08", "remaining_time": "0:06:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1338, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.910536648610779e-06, "epoch": 0.9392769392769392, "percentage": 93.96, "elapsed_time": "1:34:12", "remaining_time": "0:06:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1339, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.800893431774644e-06, "epoch": 0.93997893997894, "percentage": 94.03, "elapsed_time": "1:34:16", "remaining_time": "0:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1340, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 4.692359267052982e-06, "epoch": 0.9406809406809407, "percentage": 94.1, "elapsed_time": "1:34:20", "remaining_time": "0:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1341, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.584940112885035e-06, "epoch": 0.9413829413829414, "percentage": 94.17, "elapsed_time": "1:34:25", "remaining_time": "0:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1342, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.478641866496808e-06, "epoch": 0.9420849420849421, "percentage": 94.24, "elapsed_time": "1:34:29", "remaining_time": "0:05:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1343, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.373470363577407e-06, "epoch": 0.9427869427869427, "percentage": 94.31, "elapsed_time": "1:34:33", "remaining_time": "0:05:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1344, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.269431377958582e-06, "epoch": 0.9434889434889435, "percentage": 94.38, "elapsed_time": "1:34:37", "remaining_time": "0:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1345, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.166530621297806e-06, "epoch": 0.9441909441909442, "percentage": 94.45, "elapsed_time": "1:34:41", "remaining_time": "0:05:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1346, "total_steps": 1424, "loss": 0.0005, "accuracy": 1.0, "learning_rate": 4.064773742764677e-06, "epoch": 0.9448929448929448, "percentage": 94.52, "elapsed_time": "1:34:45", "remaining_time": "0:05:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1347, "total_steps": 1424, "loss": 0.0338, "accuracy": 1.0, "learning_rate": 3.964166328730805e-06, "epoch": 0.9455949455949456, "percentage": 94.59, "elapsed_time": "1:34:50", "remaining_time": "0:05:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1348, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.864713902463106e-06, "epoch": 0.9462969462969463, "percentage": 94.66, "elapsed_time": "1:34:54", "remaining_time": "0:05:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1349, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.7664219238205853e-06, "epoch": 0.946998946998947, "percentage": 94.73, "elapsed_time": "1:34:58", "remaining_time": "0:05:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1350, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.6692957889546164e-06, "epoch": 0.9477009477009477, "percentage": 94.8, "elapsed_time": "1:35:02", "remaining_time": "0:05:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1351, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 3.573340830012647e-06, "epoch": 0.9484029484029484, "percentage": 94.87, "elapsed_time": "1:35:06", "remaining_time": "0:05:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1352, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.4785623148455357e-06, "epoch": 0.9491049491049491, "percentage": 94.94, "elapsed_time": "1:35:10", "remaining_time": "0:05:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1353, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.3849654467182704e-06, "epoch": 0.9498069498069498, "percentage": 95.01, "elapsed_time": "1:35:15", "remaining_time": "0:04:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1354, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.292555364024403e-06, "epoch": 0.9505089505089505, "percentage": 95.08, "elapsed_time": "1:35:19", "remaining_time": "0:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1355, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 3.201337140003882e-06, "epoch": 0.9512109512109512, "percentage": 95.15, "elapsed_time": "1:35:23", "remaining_time": "0:04:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1356, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.1113157824645705e-06, "epoch": 0.9519129519129519, "percentage": 95.22, "elapsed_time": "1:35:27", "remaining_time": "0:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1357, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.0224962335073144e-06, "epoch": 0.9526149526149527, "percentage": 95.29, "elapsed_time": "1:35:31", "remaining_time": "0:04:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1358, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.9348833692546268e-06, "epoch": 0.9533169533169533, "percentage": 95.37, "elapsed_time": "1:35:35", "remaining_time": "0:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1359, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.848481999582994e-06, "epoch": 0.954018954018954, "percentage": 95.44, "elapsed_time": "1:35:40", "remaining_time": "0:04:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1360, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.763296867858807e-06, "epoch": 0.9547209547209548, "percentage": 95.51, "elapsed_time": "1:35:44", "remaining_time": "0:04:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1361, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 2.679332650677969e-06, "epoch": 0.9554229554229554, "percentage": 95.58, "elapsed_time": "1:35:48", "remaining_time": "0:04:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1362, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.5965939576091444e-06, "epoch": 0.9561249561249561, "percentage": 95.65, "elapsed_time": "1:35:52", "remaining_time": "0:04:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1363, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.5150853309406934e-06, "epoch": 0.9568269568269568, "percentage": 95.72, "elapsed_time": "1:35:56", "remaining_time": "0:04:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1364, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 2.434811245431329e-06, "epoch": 0.9575289575289575, "percentage": 95.79, "elapsed_time": "1:36:00", "remaining_time": "0:04:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1365, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.355776108064412e-06, "epoch": 0.9582309582309583, "percentage": 95.86, "elapsed_time": "1:36:04", "remaining_time": "0:04:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1366, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 2.277984257806064e-06, "epoch": 0.9589329589329589, "percentage": 95.93, "elapsed_time": "1:36:09", "remaining_time": "0:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1367, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 2.2014399653669036e-06, "epoch": 0.9596349596349596, "percentage": 96.0, "elapsed_time": "1:36:13", "remaining_time": "0:04:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1368, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.1261474329676517e-06, "epoch": 0.9603369603369604, "percentage": 96.07, "elapsed_time": "1:36:17", "remaining_time": "0:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1369, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 2.0521107941083654e-06, "epoch": 0.961038961038961, "percentage": 96.14, "elapsed_time": "1:36:21", "remaining_time": "0:03:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1370, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.979334113341578e-06, "epoch": 0.9617409617409617, "percentage": 96.21, "elapsed_time": "1:36:25", "remaining_time": "0:03:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1371, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.9078213860491097e-06, "epoch": 0.9624429624429625, "percentage": 96.28, "elapsed_time": "1:36:29", "remaining_time": "0:03:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1372, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.8375765382227453e-06, "epoch": 0.9631449631449631, "percentage": 96.35, "elapsed_time": "1:36:33", "remaining_time": "0:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1373, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.7686034262486925e-06, "epoch": 0.9638469638469639, "percentage": 96.42, "elapsed_time": "1:36:38", "remaining_time": "0:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1374, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.7009058366958787e-06, "epoch": 0.9645489645489645, "percentage": 96.49, "elapsed_time": "1:36:42", "remaining_time": "0:03:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1375, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.6344874861080682e-06, "epoch": 0.9652509652509652, "percentage": 96.56, "elapsed_time": "1:36:46", "remaining_time": "0:03:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1376, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 1.5693520207998132e-06, "epoch": 0.965952965952966, "percentage": 96.63, "elapsed_time": "1:36:50", "remaining_time": "0:03:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1377, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.5055030166563016e-06, "epoch": 0.9666549666549666, "percentage": 96.7, "elapsed_time": "1:36:54", "remaining_time": "0:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1378, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.4429439789370089e-06, "epoch": 0.9673569673569674, "percentage": 96.77, "elapsed_time": "1:36:58", "remaining_time": "0:03:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1379, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.3816783420833017e-06, "epoch": 0.9680589680589681, "percentage": 96.84, "elapsed_time": "1:37:02", "remaining_time": "0:03:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1380, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.3217094695298508e-06, "epoch": 0.9687609687609687, "percentage": 96.91, "elapsed_time": "1:37:07", "remaining_time": "0:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1381, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.263040653520016e-06, "epoch": 0.9694629694629695, "percentage": 96.98, "elapsed_time": "1:37:11", "remaining_time": "0:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1382, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.2056751149250679e-06, "epoch": 0.9701649701649702, "percentage": 97.05, "elapsed_time": "1:37:15", "remaining_time": "0:02:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1383, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.1496160030674104e-06, "epoch": 0.9708669708669708, "percentage": 97.12, "elapsed_time": "1:37:19", "remaining_time": "0:02:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1384, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.0948663955476308e-06, "epoch": 0.9715689715689716, "percentage": 97.19, "elapsed_time": "1:37:23", "remaining_time": "0:02:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1385, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.0414292980755935e-06, "epoch": 0.9722709722709723, "percentage": 97.26, "elapsed_time": "1:37:28", "remaining_time": "0:02:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1386, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 9.893076443054085e-07, "epoch": 0.972972972972973, "percentage": 97.33, "elapsed_time": "1:37:32", "remaining_time": "0:02:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1387, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 9.385042956743443e-07, "epoch": 0.9736749736749737, "percentage": 97.4, "elapsed_time": "1:37:36", "remaining_time": "0:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1388, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 8.890220412458051e-07, "epoch": 0.9743769743769743, "percentage": 97.47, "elapsed_time": "1:37:40", "remaining_time": "0:02:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1389, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 8.408635975561439e-07, "epoch": 0.9750789750789751, "percentage": 97.54, "elapsed_time": "1:37:44", "remaining_time": "0:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1390, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 7.94031608465584e-07, "epoch": 0.9757809757809758, "percentage": 97.61, "elapsed_time": "1:37:48", "remaining_time": "0:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1391, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 7.485286450130249e-07, "epoch": 0.9764829764829764, "percentage": 97.68, "elapsed_time": "1:37:53", "remaining_time": "0:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1392, "total_steps": 1424, "loss": 0.0013, "accuracy": 1.0, "learning_rate": 7.043572052749351e-07, "epoch": 0.9771849771849772, "percentage": 97.75, "elapsed_time": "1:37:57", "remaining_time": "0:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1393, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 6.615197142281737e-07, "epoch": 0.9778869778869779, "percentage": 97.82, "elapsed_time": "1:38:01", "remaining_time": "0:02:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1394, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 6.200185236168985e-07, "epoch": 0.9785889785889786, "percentage": 97.89, "elapsed_time": "1:38:05", "remaining_time": "0:02:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1395, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 5.798559118234185e-07, "epoch": 0.9792909792909793, "percentage": 97.96, "elapsed_time": "1:38:09", "remaining_time": "0:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1396, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 5.410340837431479e-07, "epoch": 0.97999297999298, "percentage": 98.03, "elapsed_time": "1:38:13", "remaining_time": "0:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1397, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 5.035551706635352e-07, "epoch": 0.9806949806949807, "percentage": 98.1, "elapsed_time": "1:38:17", "remaining_time": "0:01:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1398, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.6742123014705895e-07, "epoch": 0.9813969813969814, "percentage": 98.17, "elapsed_time": "1:38:22", "remaining_time": "0:01:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1399, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 4.3263424591828644e-07, "epoch": 0.982098982098982, "percentage": 98.24, "elapsed_time": "1:38:26", "remaining_time": "0:01:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1400, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.9919612775494824e-07, "epoch": 0.9828009828009828, "percentage": 98.31, "elapsed_time": "1:38:30", "remaining_time": "0:01:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1401, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.6710871138310834e-07, "epoch": 0.9835029835029835, "percentage": 98.38, "elapsed_time": "1:38:41", "remaining_time": "0:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1402, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.3637375837637116e-07, "epoch": 0.9842049842049843, "percentage": 98.46, "elapsed_time": "1:38:45", "remaining_time": "0:01:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1403, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 3.0699295605918796e-07, "epoch": 0.9849069849069849, "percentage": 98.53, "elapsed_time": "1:38:49", "remaining_time": "0:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1404, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 2.789679174142046e-07, "epoch": 0.9856089856089856, "percentage": 98.6, "elapsed_time": "1:38:53", "remaining_time": "0:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1405, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.523001809937351e-07, "epoch": 0.9863109863109863, "percentage": 98.67, "elapsed_time": "1:38:57", "remaining_time": "0:01:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1406, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 2.2699121083526567e-07, "epoch": 0.987012987012987, "percentage": 98.74, "elapsed_time": "1:39:01", "remaining_time": "0:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1407, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.0304239638111052e-07, "epoch": 0.9877149877149877, "percentage": 98.81, "elapsed_time": "1:39:05", "remaining_time": "0:01:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1408, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.8045505240211085e-07, "epoch": 0.9884169884169884, "percentage": 98.88, "elapsed_time": "1:39:10", "remaining_time": "0:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1409, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.5923041892546387e-07, "epoch": 0.9891189891189891, "percentage": 98.95, "elapsed_time": "1:39:14", "remaining_time": "0:01:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1410, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 1.3936966116665055e-07, "epoch": 0.9898209898209899, "percentage": 99.02, "elapsed_time": "1:39:18", "remaining_time": "0:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1411, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.2087386946545723e-07, "epoch": 0.9905229905229905, "percentage": 99.09, "elapsed_time": "1:39:22", "remaining_time": "0:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1412, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.0374405922611564e-07, "epoch": 0.9912249912249912, "percentage": 99.16, "elapsed_time": "1:39:26", "remaining_time": "0:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1413, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 8.79811708615723e-08, "epoch": 0.991926991926992, "percentage": 99.23, "elapsed_time": "1:39:30", "remaining_time": "0:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1414, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 7.358606974184355e-08, "epoch": 0.9926289926289926, "percentage": 99.3, "elapsed_time": "1:39:35", "remaining_time": "0:00:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1415, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 6.055954614652204e-08, "epoch": 0.9933309933309933, "percentage": 99.37, "elapsed_time": "1:39:39", "remaining_time": "0:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1416, "total_steps": 1424, "loss": 0.0004, "accuracy": 1.0, "learning_rate": 4.890231522137424e-08, "epoch": 0.994032994032994, "percentage": 99.44, "elapsed_time": "1:39:43", "remaining_time": "0:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1417, "total_steps": 1424, "loss": 0.0001, "accuracy": 1.0, "learning_rate": 3.8615016939103454e-08, "epoch": 0.9947349947349947, "percentage": 99.51, "elapsed_time": "1:39:47", "remaining_time": "0:00:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1418, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.9698216064189796e-08, "epoch": 0.9954369954369955, "percentage": 99.58, "elapsed_time": "1:39:51", "remaining_time": "0:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1419, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 2.2152402121901446e-08, "epoch": 0.9961389961389961, "percentage": 99.65, "elapsed_time": "1:39:55", "remaining_time": "0:00:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1420, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.5977989371413286e-08, "epoch": 0.9968409968409968, "percentage": 99.72, "elapsed_time": "1:40:00", "remaining_time": "0:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1421, "total_steps": 1424, "loss": 0.0003, "accuracy": 1.0, "learning_rate": 1.1175316783071778e-08, "epoch": 0.9975429975429976, "percentage": 99.79, "elapsed_time": "1:40:04", "remaining_time": "0:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1422, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 7.744648019775646e-09, "epoch": 0.9982449982449982, "percentage": 99.86, "elapsed_time": "1:40:08", "remaining_time": "0:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1423, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 5.686171422511089e-09, "epoch": 0.9989469989469989, "percentage": 99.93, "elapsed_time": "1:40:12", "remaining_time": "0:00:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1424, "total_steps": 1424, "loss": 0.0002, "accuracy": 1.0, "learning_rate": 5e-09, "epoch": 0.9996489996489997, "percentage": 100.0, "elapsed_time": "1:40:16", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1424, "total_steps": 1424, "epoch": 0.9996489996489997, "percentage": 100.0, "elapsed_time": "1:40:22", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}