{ "best_metric": null, "best_model_checkpoint": null, "epoch": 10.526315789473685, "global_step": 400, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.66, "eval_accuracy": 0.5721175930179145, "eval_f1": 0.34372003835091086, "eval_loss": 1.351142406463623, "eval_precision": 0.3301104972375691, "eval_recall": 0.3585, "eval_runtime": 3.6101, "eval_samples_per_second": 14.958, "eval_steps_per_second": 1.108, "step": 25 }, { "epoch": 1.32, "eval_accuracy": 0.7614836931557188, "eval_f1": 0.7229437229437228, "eval_loss": 0.905920684337616, "eval_precision": 0.6964782205746061, "eval_recall": 0.7515, "eval_runtime": 3.5063, "eval_samples_per_second": 15.401, "eval_steps_per_second": 1.141, "step": 50 }, { "epoch": 1.97, "eval_accuracy": 0.7796279283417548, "eval_f1": 0.7946449916327994, "eval_loss": 0.7163704633712769, "eval_precision": 0.7613376087952359, "eval_recall": 0.831, "eval_runtime": 3.5828, "eval_samples_per_second": 15.072, "eval_steps_per_second": 1.116, "step": 75 }, { "epoch": 2.63, "eval_accuracy": 0.799265043638034, "eval_f1": 0.8249158249158249, "eval_loss": 0.6392571926116943, "eval_precision": 0.7947173308619092, "eval_recall": 0.8575, "eval_runtime": 3.5968, "eval_samples_per_second": 15.013, "eval_steps_per_second": 1.112, "step": 100 }, { "epoch": 3.29, "eval_accuracy": 0.8104042259990814, "eval_f1": 0.8409859835669407, "eval_loss": 0.5755508542060852, "eval_precision": 0.813844714686623, "eval_recall": 0.87, "eval_runtime": 3.5975, "eval_samples_per_second": 15.011, "eval_steps_per_second": 1.112, "step": 125 }, { "epoch": 3.95, "eval_accuracy": 0.8323380799265043, "eval_f1": 0.8506134231416886, "eval_loss": 0.5508233308792114, "eval_precision": 0.8196569309225776, "eval_recall": 0.884, "eval_runtime": 3.6045, "eval_samples_per_second": 14.981, "eval_steps_per_second": 1.11, "step": 150 }, { "epoch": 4.61, "eval_accuracy": 0.8327974276527331, "eval_f1": 0.8600435097897026, "eval_loss": 0.5458412170410156, "eval_precision": 0.8324754328497894, "eval_recall": 0.8895, "eval_runtime": 3.5309, "eval_samples_per_second": 15.294, "eval_steps_per_second": 1.133, "step": 175 }, { "epoch": 5.26, "eval_accuracy": 0.826596233348645, "eval_f1": 0.8491160087188181, "eval_loss": 0.5740342736244202, "eval_precision": 0.8233912635039925, "eval_recall": 0.8765, "eval_runtime": 3.622, "eval_samples_per_second": 14.909, "eval_steps_per_second": 1.104, "step": 200 }, { "epoch": 5.92, "eval_accuracy": 0.8361276986678916, "eval_f1": 0.8709914320685433, "eval_loss": 0.5719187259674072, "eval_precision": 0.8532374100719424, "eval_recall": 0.8895, "eval_runtime": 3.5659, "eval_samples_per_second": 15.143, "eval_steps_per_second": 1.122, "step": 225 }, { "epoch": 6.58, "eval_accuracy": 0.8263665594855305, "eval_f1": 0.8736131210805596, "eval_loss": 0.5435599684715271, "eval_precision": 0.8438956197576887, "eval_recall": 0.9055, "eval_runtime": 3.5266, "eval_samples_per_second": 15.312, "eval_steps_per_second": 1.134, "step": 250 }, { "epoch": 7.24, "eval_accuracy": 0.8290078089113458, "eval_f1": 0.8783914728682171, "eval_loss": 0.5714461207389832, "eval_precision": 0.8519736842105263, "eval_recall": 0.9065, "eval_runtime": 3.6124, "eval_samples_per_second": 14.948, "eval_steps_per_second": 1.107, "step": 275 }, { "epoch": 7.89, "eval_accuracy": 0.8280891134588884, "eval_f1": 0.8791048406713695, "eval_loss": 0.5853330492973328, "eval_precision": 0.8559924206537186, "eval_recall": 0.9035, "eval_runtime": 3.6008, "eval_samples_per_second": 14.997, "eval_steps_per_second": 1.111, "step": 300 }, { "epoch": 8.55, "eval_accuracy": 0.8389986219568213, "eval_f1": 0.8807785888077859, "eval_loss": 0.570177435874939, "eval_precision": 0.8578199052132701, "eval_recall": 0.905, "eval_runtime": 3.5637, "eval_samples_per_second": 15.153, "eval_steps_per_second": 1.122, "step": 325 }, { "epoch": 9.21, "eval_accuracy": 0.8418695452457511, "eval_f1": 0.8775261748234722, "eval_loss": 0.5666728019714355, "eval_precision": 0.8552444233507357, "eval_recall": 0.901, "eval_runtime": 3.5809, "eval_samples_per_second": 15.08, "eval_steps_per_second": 1.117, "step": 350 }, { "epoch": 9.87, "eval_accuracy": 0.8338309600367478, "eval_f1": 0.8786773644541697, "eval_loss": 0.5793057084083557, "eval_precision": 0.8551822053951728, "eval_recall": 0.9035, "eval_runtime": 3.5472, "eval_samples_per_second": 15.223, "eval_steps_per_second": 1.128, "step": 375 }, { "epoch": 10.53, "eval_accuracy": 0.833371612310519, "eval_f1": 0.8794946550048591, "eval_loss": 0.5784164071083069, "eval_precision": 0.8553875236294896, "eval_recall": 0.905, "eval_runtime": 3.5919, "eval_samples_per_second": 15.034, "eval_steps_per_second": 1.114, "step": 400 }, { "epoch": 10.53, "step": 400, "total_flos": 416496442306560.0, "train_loss": 0.50620361328125, "train_runtime": 250.4274, "train_samples_per_second": 6.389, "train_steps_per_second": 1.597 } ], "max_steps": 400, "num_train_epochs": 11, "total_flos": 416496442306560.0, "trial_name": null, "trial_params": null }