{ "best_metric": 0.981159271079996, "best_model_checkpoint": "./output//42_roberta-large_nace_5__5e-6_0.01_0.06_07-21-22_10-40/checkpoint-12000", "epoch": 4.418262150220913, "global_step": 12000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.74, "learning_rate": 4.535840188014101e-06, "loss": 0.1726, "step": 2000 }, { "epoch": 0.74, "eval_accuracy": 0.9712155725823152, "eval_f1": 0.9751469526657729, "eval_loss": 0.08084136247634888, "eval_roc_auc": 0.9750559610355007, "eval_runtime": 143.2301, "eval_samples_per_second": 33.715, "step": 2000 }, { "epoch": 1.47, "learning_rate": 3.7524481002741874e-06, "loss": 0.0668, "step": 4000 }, { "epoch": 1.47, "eval_accuracy": 0.9726651480637813, "eval_f1": 0.9771228359439407, "eval_loss": 0.08218056708574295, "eval_roc_auc": 0.9770191055094254, "eval_runtime": 143.2878, "eval_samples_per_second": 33.701, "step": 4000 }, { "epoch": 2.21, "learning_rate": 2.969056012534274e-06, "loss": 0.0501, "step": 6000 }, { "epoch": 2.21, "eval_accuracy": 0.9749430523917996, "eval_f1": 0.9794069192751236, "eval_loss": 0.07129524648189545, "eval_roc_auc": 0.9792922833616305, "eval_runtime": 143.1874, "eval_samples_per_second": 33.725, "step": 6000 }, { "epoch": 2.95, "learning_rate": 2.18566392479436e-06, "loss": 0.0377, "step": 8000 }, { "epoch": 2.95, "eval_accuracy": 0.9757713812383516, "eval_f1": 0.9797813080255828, "eval_loss": 0.08654613047838211, "eval_roc_auc": 0.9797172685997191, "eval_runtime": 143.3834, "eval_samples_per_second": 33.679, "step": 8000 }, { "epoch": 3.68, "learning_rate": 1.4022718370544457e-06, "loss": 0.0254, "step": 10000 }, { "epoch": 3.68, "eval_accuracy": 0.9743218057568854, "eval_f1": 0.9794111591517397, "eval_loss": 0.09397488832473755, "eval_roc_auc": 0.979291082596074, "eval_runtime": 143.2996, "eval_samples_per_second": 33.699, "step": 10000 }, { "epoch": 4.42, "learning_rate": 6.18879749314532e-07, "loss": 0.0196, "step": 12000 }, { "epoch": 4.42, "eval_accuracy": 0.9763926278732656, "eval_f1": 0.981159271079996, "eval_loss": 0.09825791418552399, "eval_roc_auc": 0.981051940958186, "eval_runtime": 143.2702, "eval_samples_per_second": 33.706, "step": 12000 } ], "max_steps": 13580, "num_train_epochs": 5, "total_flos": 6.9866971594752e+16, "trial_name": null, "trial_params": null }