{ "best_metric": null, "best_model_checkpoint": null, "epoch": 50.0, "eval_steps": 500, "global_step": 1800, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.7152777777777778, "eval_auc": 0.7881944444444445, "eval_balanced_acc": 0.7152777777777778, "eval_f1": 0.7320261437908496, "eval_fn": 16, "eval_fp": 25, "eval_gmean": 0.71254196324337, "eval_loss": 0.660514771938324, "eval_matthews_correlation": 0.43395920975133495, "eval_precision": 0.691358024691358, "eval_recall": 0.7777777777777778, "eval_roc_auc": 0.7881944444444445, "eval_runtime": 1.7448, "eval_samples_per_second": 82.531, "eval_specificity": 0.6527777777777778, "eval_steps_per_second": 0.573, "eval_tn": 47, "eval_tp": 56, "step": 36 }, { "epoch": 2.0, "eval_accuracy": 0.7291666666666666, "eval_auc": 0.8784722222222222, "eval_balanced_acc": 0.7291666666666666, "eval_f1": 0.6285714285714286, "eval_fn": 39, "eval_fp": 0, "eval_gmean": 0.67700320038633, "eval_loss": 0.5545561909675598, "eval_matthews_correlation": 0.5452497568062706, "eval_precision": 1.0, "eval_recall": 0.4583333333333333, "eval_roc_auc": 0.8784722222222222, "eval_runtime": 1.564, "eval_samples_per_second": 92.072, "eval_specificity": 1.0, "eval_steps_per_second": 0.639, "eval_tn": 72, "eval_tp": 33, "step": 72 }, { "epoch": 3.0, "eval_accuracy": 0.8055555555555556, "eval_auc": 0.8809799382716048, "eval_balanced_acc": 0.8055555555555556, "eval_f1": 0.7704918032786885, "eval_fn": 25, "eval_fp": 3, "eval_gmean": 0.7909353347168805, "eval_loss": 0.41891196370124817, "eval_matthews_correlation": 0.6418059625907361, "eval_precision": 0.94, "eval_recall": 0.6527777777777778, "eval_roc_auc": 0.8809799382716048, "eval_runtime": 1.5621, "eval_samples_per_second": 92.185, "eval_specificity": 0.9583333333333334, "eval_steps_per_second": 0.64, "eval_tn": 69, "eval_tp": 47, "step": 108 }, { "epoch": 4.0, "eval_accuracy": 0.875, "eval_auc": 0.9261188271604939, "eval_balanced_acc": 0.875, "eval_f1": 0.8695652173913043, "eval_fn": 12, "eval_fp": 6, "eval_gmean": 0.8740073734751262, "eval_loss": 0.3357275724411011, "eval_matthews_correlation": 0.7526178090063818, "eval_precision": 0.9090909090909091, "eval_recall": 0.8333333333333334, "eval_roc_auc": 0.9261188271604939, "eval_runtime": 1.5641, "eval_samples_per_second": 92.065, "eval_specificity": 0.9166666666666666, "eval_steps_per_second": 0.639, "eval_tn": 66, "eval_tp": 60, "step": 144 }, { "epoch": 5.0, "eval_accuracy": 0.8611111111111112, "eval_auc": 0.91820987654321, "eval_balanced_acc": 0.8611111111111112, "eval_f1": 0.8529411764705882, "eval_fn": 14, "eval_fp": 6, "eval_gmean": 0.8593171276810011, "eval_loss": 0.3432258367538452, "eval_matthews_correlation": 0.7267220926874316, "eval_precision": 0.90625, "eval_recall": 0.8055555555555556, "eval_roc_auc": 0.91820987654321, "eval_runtime": 1.6068, "eval_samples_per_second": 89.618, "eval_specificity": 0.9166666666666666, "eval_steps_per_second": 0.622, "eval_tn": 66, "eval_tp": 58, "step": 180 }, { "epoch": 6.0, "eval_accuracy": 0.8541666666666666, "eval_auc": 0.9330632716049384, "eval_balanced_acc": 0.8541666666666667, "eval_f1": 0.8372093023255814, "eval_fn": 18, "eval_fp": 3, "eval_gmean": 0.8477912478906585, "eval_loss": 0.34070253372192383, "eval_matthews_correlation": 0.7242243488319184, "eval_precision": 0.9473684210526315, "eval_recall": 0.75, "eval_roc_auc": 0.9330632716049384, "eval_runtime": 1.5703, "eval_samples_per_second": 91.705, "eval_specificity": 0.9583333333333334, "eval_steps_per_second": 0.637, "eval_tn": 69, "eval_tp": 54, "step": 216 }, { "epoch": 7.0, "eval_accuracy": 0.8611111111111112, "eval_auc": 0.9386574074074074, "eval_balanced_acc": 0.8611111111111112, "eval_f1": 0.8591549295774648, "eval_fn": 11, "eval_fp": 9, "eval_gmean": 0.8609990966571593, "eval_loss": 0.36071789264678955, "eval_matthews_correlation": 0.7225010186897469, "eval_precision": 0.8714285714285714, "eval_recall": 0.8472222222222222, "eval_roc_auc": 0.9386574074074074, "eval_runtime": 1.5692, "eval_samples_per_second": 91.766, "eval_specificity": 0.875, "eval_steps_per_second": 0.637, "eval_tn": 63, "eval_tp": 61, "step": 252 }, { "epoch": 8.0, "eval_accuracy": 0.8680555555555556, "eval_auc": 0.9415509259259259, "eval_balanced_acc": 0.8680555555555556, "eval_f1": 0.8527131782945736, "eval_fn": 17, "eval_fp": 2, "eval_gmean": 0.8617828920826983, "eval_loss": 0.3144780695438385, "eval_matthews_correlation": 0.7526253036880721, "eval_precision": 0.9649122807017544, "eval_recall": 0.7638888888888888, "eval_roc_auc": 0.9415509259259259, "eval_runtime": 1.564, "eval_samples_per_second": 92.069, "eval_specificity": 0.9722222222222222, "eval_steps_per_second": 0.639, "eval_tn": 70, "eval_tp": 55, "step": 288 }, { "epoch": 9.0, "eval_accuracy": 0.8888888888888888, "eval_auc": 0.9461805555555556, "eval_balanced_acc": 0.8888888888888888, "eval_f1": 0.875, "eval_fn": 16, "eval_fp": 0, "eval_gmean": 0.8819171036881969, "eval_loss": 0.29493772983551025, "eval_matthews_correlation": 0.7977240352174656, "eval_precision": 1.0, "eval_recall": 0.7777777777777778, "eval_roc_auc": 0.9461805555555556, "eval_runtime": 1.5731, "eval_samples_per_second": 91.538, "eval_specificity": 1.0, "eval_steps_per_second": 0.636, "eval_tn": 72, "eval_tp": 56, "step": 324 }, { "epoch": 10.0, "eval_accuracy": 0.8888888888888888, "eval_auc": 0.9157021604938271, "eval_balanced_acc": 0.8888888888888888, "eval_f1": 0.8787878787878788, "eval_fn": 14, "eval_fp": 2, "eval_gmean": 0.8849740178929996, "eval_loss": 0.28407514095306396, "eval_matthews_correlation": 0.7888106377466154, "eval_precision": 0.9666666666666667, "eval_recall": 0.8055555555555556, "eval_roc_auc": 0.9157021604938271, "eval_runtime": 1.5699, "eval_samples_per_second": 91.725, "eval_specificity": 0.9722222222222222, "eval_steps_per_second": 0.637, "eval_tn": 70, "eval_tp": 58, "step": 360 }, { "epoch": 11.0, "eval_accuracy": 0.8888888888888888, "eval_auc": 0.929398148148148, "eval_balanced_acc": 0.8888888888888888, "eval_f1": 0.8873239436619719, "eval_fn": 9, "eval_fp": 7, "eval_gmean": 0.8887803753208976, "eval_loss": 0.33784234523773193, "eval_matthews_correlation": 0.7780780201274198, "eval_precision": 0.9, "eval_recall": 0.875, "eval_roc_auc": 0.929398148148148, "eval_runtime": 1.5762, "eval_samples_per_second": 91.359, "eval_specificity": 0.9027777777777778, "eval_steps_per_second": 0.634, "eval_tn": 65, "eval_tp": 63, "step": 396 }, { "epoch": 12.0, "eval_accuracy": 0.875, "eval_auc": 0.9430941358024691, "eval_balanced_acc": 0.875, "eval_f1": 0.8676470588235294, "eval_fn": 13, "eval_fp": 5, "eval_gmean": 0.8732345505343416, "eval_loss": 0.30290982127189636, "eval_matthews_correlation": 0.754672942406179, "eval_precision": 0.921875, "eval_recall": 0.8194444444444444, "eval_roc_auc": 0.9430941358024691, "eval_runtime": 1.5674, "eval_samples_per_second": 91.874, "eval_specificity": 0.9305555555555556, "eval_steps_per_second": 0.638, "eval_tn": 67, "eval_tp": 59, "step": 432 }, { "epoch": 13.0, "eval_accuracy": 0.875, "eval_auc": 0.9290123456790124, "eval_balanced_acc": 0.875, "eval_f1": 0.8732394366197183, "eval_fn": 10, "eval_fp": 8, "eval_gmean": 0.8748897637790901, "eval_loss": 0.33074280619621277, "eval_matthews_correlation": 0.7502895194085833, "eval_precision": 0.8857142857142857, "eval_recall": 0.8611111111111112, "eval_roc_auc": 0.9290123456790124, "eval_runtime": 1.5785, "eval_samples_per_second": 91.228, "eval_specificity": 0.8888888888888888, "eval_steps_per_second": 0.634, "eval_tn": 64, "eval_tp": 62, "step": 468 }, { "epoch": 13.88888888888889, "grad_norm": 1.0406557321548462, "learning_rate": 0.00038011695906432747, "loss": 0.3831, "step": 500 }, { "epoch": 14.0, "eval_accuracy": 0.8819444444444444, "eval_auc": 0.9479166666666667, "eval_balanced_acc": 0.8819444444444444, "eval_f1": 0.8794326241134752, "eval_fn": 10, "eval_fp": 7, "eval_gmean": 0.8816983471168822, "eval_loss": 0.31016406416893005, "eval_matthews_correlation": 0.7645528515426074, "eval_precision": 0.8985507246376812, "eval_recall": 0.8611111111111112, "eval_roc_auc": 0.9479166666666667, "eval_runtime": 1.5778, "eval_samples_per_second": 91.264, "eval_specificity": 0.9027777777777778, "eval_steps_per_second": 0.634, "eval_tn": 65, "eval_tp": 62, "step": 504 }, { "epoch": 15.0, "eval_accuracy": 0.9097222222222222, "eval_auc": 0.9479166666666666, "eval_balanced_acc": 0.9097222222222223, "eval_f1": 0.9051094890510949, "eval_fn": 10, "eval_fp": 3, "eval_gmean": 0.9084225236537685, "eval_loss": 0.26771771907806396, "eval_matthews_correlation": 0.8233448771672452, "eval_precision": 0.9538461538461539, "eval_recall": 0.8611111111111112, "eval_roc_auc": 0.9479166666666666, "eval_runtime": 1.5734, "eval_samples_per_second": 91.52, "eval_specificity": 0.9583333333333334, "eval_steps_per_second": 0.636, "eval_tn": 69, "eval_tp": 62, "step": 540 }, { "epoch": 16.0, "eval_accuracy": 0.8888888888888888, "eval_auc": 0.9598765432098766, "eval_balanced_acc": 0.8888888888888888, "eval_f1": 0.875, "eval_fn": 16, "eval_fp": 0, "eval_gmean": 0.8819171036881969, "eval_loss": 0.28312918543815613, "eval_matthews_correlation": 0.7977240352174656, "eval_precision": 1.0, "eval_recall": 0.7777777777777778, "eval_roc_auc": 0.9598765432098766, "eval_runtime": 1.5683, "eval_samples_per_second": 91.821, "eval_specificity": 1.0, "eval_steps_per_second": 0.638, "eval_tn": 72, "eval_tp": 56, "step": 576 }, { "epoch": 17.0, "eval_accuracy": 0.9027777777777778, "eval_auc": 0.9525462962962963, "eval_balanced_acc": 0.9027777777777778, "eval_f1": 0.8939393939393939, "eval_fn": 13, "eval_fp": 1, "eval_gmean": 0.8989233958491337, "eval_loss": 0.27800989151000977, "eval_matthews_correlation": 0.816982446237566, "eval_precision": 0.9833333333333333, "eval_recall": 0.8194444444444444, "eval_roc_auc": 0.9525462962962963, "eval_runtime": 1.5821, "eval_samples_per_second": 91.016, "eval_specificity": 0.9861111111111112, "eval_steps_per_second": 0.632, "eval_tn": 71, "eval_tp": 59, "step": 612 }, { "epoch": 18.0, "eval_accuracy": 0.9027777777777778, "eval_auc": 0.957175925925926, "eval_balanced_acc": 0.9027777777777777, "eval_f1": 0.9014084507042254, "eval_fn": 8, "eval_fp": 6, "eval_gmean": 0.90267093384844, "eval_loss": 0.2676469385623932, "eval_matthews_correlation": 0.8058665208462562, "eval_precision": 0.9142857142857143, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.957175925925926, "eval_runtime": 1.6038, "eval_samples_per_second": 89.787, "eval_specificity": 0.9166666666666666, "eval_steps_per_second": 0.624, "eval_tn": 66, "eval_tp": 64, "step": 648 }, { "epoch": 19.0, "eval_accuracy": 0.9097222222222222, "eval_auc": 0.961033950617284, "eval_balanced_acc": 0.9097222222222223, "eval_f1": 0.9022556390977443, "eval_fn": 12, "eval_fp": 1, "eval_gmean": 0.9065093817822623, "eval_loss": 0.2535494863986969, "eval_matthews_correlation": 0.8291785292561664, "eval_precision": 0.9836065573770492, "eval_recall": 0.8333333333333334, "eval_roc_auc": 0.961033950617284, "eval_runtime": 1.5679, "eval_samples_per_second": 91.842, "eval_specificity": 0.9861111111111112, "eval_steps_per_second": 0.638, "eval_tn": 71, "eval_tp": 60, "step": 684 }, { "epoch": 20.0, "eval_accuracy": 0.8958333333333334, "eval_auc": 0.964891975308642, "eval_balanced_acc": 0.8958333333333334, "eval_f1": 0.8888888888888888, "eval_fn": 12, "eval_fp": 3, "eval_gmean": 0.8936504412303007, "eval_loss": 0.2748485803604126, "eval_matthews_correlation": 0.7979249985750352, "eval_precision": 0.9523809523809523, "eval_recall": 0.8333333333333334, "eval_roc_auc": 0.964891975308642, "eval_runtime": 1.5824, "eval_samples_per_second": 91.003, "eval_specificity": 0.9583333333333334, "eval_steps_per_second": 0.632, "eval_tn": 69, "eval_tp": 60, "step": 720 }, { "epoch": 21.0, "eval_accuracy": 0.8819444444444444, "eval_auc": 0.9456018518518517, "eval_balanced_acc": 0.8819444444444444, "eval_f1": 0.8874172185430463, "eval_fn": 5, "eval_fp": 12, "eval_gmean": 0.8806037491192977, "eval_loss": 0.36086082458496094, "eval_matthews_correlation": 0.7675248854948896, "eval_precision": 0.8481012658227848, "eval_recall": 0.9305555555555556, "eval_roc_auc": 0.9456018518518517, "eval_runtime": 1.5692, "eval_samples_per_second": 91.769, "eval_specificity": 0.8333333333333334, "eval_steps_per_second": 0.637, "eval_tn": 60, "eval_tp": 67, "step": 756 }, { "epoch": 22.0, "eval_accuracy": 0.8888888888888888, "eval_auc": 0.9533179012345679, "eval_balanced_acc": 0.8888888888888888, "eval_f1": 0.8873239436619719, "eval_fn": 9, "eval_fp": 7, "eval_gmean": 0.8887803753208976, "eval_loss": 0.32595178484916687, "eval_matthews_correlation": 0.7780780201274198, "eval_precision": 0.9, "eval_recall": 0.875, "eval_roc_auc": 0.9533179012345679, "eval_runtime": 1.5845, "eval_samples_per_second": 90.883, "eval_specificity": 0.9027777777777778, "eval_steps_per_second": 0.631, "eval_tn": 65, "eval_tp": 63, "step": 792 }, { "epoch": 23.0, "eval_accuracy": 0.9027777777777778, "eval_auc": 0.9672067901234568, "eval_balanced_acc": 0.9027777777777778, "eval_f1": 0.9, "eval_fn": 9, "eval_fp": 5, "eval_gmean": 0.9023503261544882, "eval_loss": 0.25206753611564636, "eval_matthews_correlation": 0.806801581908253, "eval_precision": 0.9264705882352942, "eval_recall": 0.875, "eval_roc_auc": 0.9672067901234568, "eval_runtime": 1.5931, "eval_samples_per_second": 90.391, "eval_specificity": 0.9305555555555556, "eval_steps_per_second": 0.628, "eval_tn": 67, "eval_tp": 63, "step": 828 }, { "epoch": 24.0, "eval_accuracy": 0.9166666666666666, "eval_auc": 0.9457947530864197, "eval_balanced_acc": 0.9166666666666667, "eval_f1": 0.9117647058823529, "eval_fn": 10, "eval_fp": 2, "eval_gmean": 0.9149816162222558, "eval_loss": 0.24512597918510437, "eval_matthews_correlation": 0.8385254915624211, "eval_precision": 0.96875, "eval_recall": 0.8611111111111112, "eval_roc_auc": 0.9457947530864197, "eval_runtime": 1.5739, "eval_samples_per_second": 91.49, "eval_specificity": 0.9722222222222222, "eval_steps_per_second": 0.635, "eval_tn": 70, "eval_tp": 62, "step": 864 }, { "epoch": 25.0, "eval_accuracy": 0.9097222222222222, "eval_auc": 0.9637345679012346, "eval_balanced_acc": 0.9097222222222223, "eval_f1": 0.9051094890510949, "eval_fn": 10, "eval_fp": 3, "eval_gmean": 0.9084225236537685, "eval_loss": 0.2579743564128876, "eval_matthews_correlation": 0.8233448771672452, "eval_precision": 0.9538461538461539, "eval_recall": 0.8611111111111112, "eval_roc_auc": 0.9637345679012346, "eval_runtime": 1.5981, "eval_samples_per_second": 90.107, "eval_specificity": 0.9583333333333334, "eval_steps_per_second": 0.626, "eval_tn": 69, "eval_tp": 62, "step": 900 }, { "epoch": 26.0, "eval_accuracy": 0.9166666666666666, "eval_auc": 0.9591049382716049, "eval_balanced_acc": 0.9166666666666667, "eval_f1": 0.9130434782608695, "eval_fn": 9, "eval_fp": 3, "eval_gmean": 0.9157192073264963, "eval_loss": 0.23186571896076202, "eval_matthews_correlation": 0.8362420100070908, "eval_precision": 0.9545454545454546, "eval_recall": 0.875, "eval_roc_auc": 0.9591049382716049, "eval_runtime": 1.5707, "eval_samples_per_second": 91.676, "eval_specificity": 0.9583333333333334, "eval_steps_per_second": 0.637, "eval_tn": 69, "eval_tp": 63, "step": 936 }, { "epoch": 27.0, "eval_accuracy": 0.9097222222222222, "eval_auc": 0.961033950617284, "eval_balanced_acc": 0.9097222222222222, "eval_f1": 0.9037037037037037, "eval_fn": 11, "eval_fp": 2, "eval_gmean": 0.9075727362613634, "eval_loss": 0.24382635951042175, "eval_matthews_correlation": 0.8259223669460891, "eval_precision": 0.9682539682539683, "eval_recall": 0.8472222222222222, "eval_roc_auc": 0.961033950617284, "eval_runtime": 1.5701, "eval_samples_per_second": 91.714, "eval_specificity": 0.9722222222222222, "eval_steps_per_second": 0.637, "eval_tn": 70, "eval_tp": 61, "step": 972 }, { "epoch": 27.77777777777778, "grad_norm": 0.2868950664997101, "learning_rate": 0.00023391812865497074, "loss": 0.1759, "step": 1000 }, { "epoch": 28.0, "eval_accuracy": 0.9236111111111112, "eval_auc": 0.9716435185185186, "eval_balanced_acc": 0.9236111111111112, "eval_f1": 0.9185185185185185, "eval_fn": 10, "eval_fp": 1, "eval_gmean": 0.9214940230776874, "eval_loss": 0.21144364774227142, "eval_matthews_correlation": 0.8539197353171429, "eval_precision": 0.9841269841269841, "eval_recall": 0.8611111111111112, "eval_roc_auc": 0.9716435185185186, "eval_runtime": 1.5758, "eval_samples_per_second": 91.382, "eval_specificity": 0.9861111111111112, "eval_steps_per_second": 0.635, "eval_tn": 71, "eval_tp": 62, "step": 1008 }, { "epoch": 29.0, "eval_accuracy": 0.9236111111111112, "eval_auc": 0.9670138888888891, "eval_balanced_acc": 0.9236111111111112, "eval_f1": 0.9230769230769231, "eval_fn": 6, "eval_fp": 5, "eval_gmean": 0.9235850038081277, "eval_loss": 0.2606896162033081, "eval_matthews_correlation": 0.8473039491526416, "eval_precision": 0.9295774647887324, "eval_recall": 0.9166666666666666, "eval_roc_auc": 0.9670138888888891, "eval_runtime": 1.609, "eval_samples_per_second": 89.498, "eval_specificity": 0.9305555555555556, "eval_steps_per_second": 0.622, "eval_tn": 67, "eval_tp": 66, "step": 1044 }, { "epoch": 30.0, "eval_accuracy": 0.9236111111111112, "eval_auc": 0.9658564814814816, "eval_balanced_acc": 0.9236111111111112, "eval_f1": 0.920863309352518, "eval_fn": 8, "eval_fp": 3, "eval_gmean": 0.9229582069908973, "eval_loss": 0.24626360833644867, "eval_matthews_correlation": 0.8492725185804906, "eval_precision": 0.9552238805970149, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.9658564814814816, "eval_runtime": 1.5802, "eval_samples_per_second": 91.126, "eval_specificity": 0.9583333333333334, "eval_steps_per_second": 0.633, "eval_tn": 69, "eval_tp": 64, "step": 1080 }, { "epoch": 31.0, "eval_accuracy": 0.9097222222222222, "eval_auc": 0.9635416666666667, "eval_balanced_acc": 0.9097222222222223, "eval_f1": 0.9051094890510949, "eval_fn": 10, "eval_fp": 3, "eval_gmean": 0.9084225236537685, "eval_loss": 0.2524122893810272, "eval_matthews_correlation": 0.8233448771672452, "eval_precision": 0.9538461538461539, "eval_recall": 0.8611111111111112, "eval_roc_auc": 0.9635416666666667, "eval_runtime": 1.606, "eval_samples_per_second": 89.664, "eval_specificity": 0.9583333333333334, "eval_steps_per_second": 0.623, "eval_tn": 69, "eval_tp": 62, "step": 1116 }, { "epoch": 32.0, "eval_accuracy": 0.9236111111111112, "eval_auc": 0.9363425925925926, "eval_balanced_acc": 0.9236111111111112, "eval_f1": 0.9172932330827067, "eval_fn": 11, "eval_fp": 0, "eval_gmean": 0.9204467514322717, "eval_loss": 0.2489766776561737, "eval_matthews_correlation": 0.8572862760106127, "eval_precision": 1.0, "eval_recall": 0.8472222222222222, "eval_roc_auc": 0.9363425925925926, "eval_runtime": 1.6096, "eval_samples_per_second": 89.462, "eval_specificity": 1.0, "eval_steps_per_second": 0.621, "eval_tn": 72, "eval_tp": 61, "step": 1152 }, { "epoch": 33.0, "eval_accuracy": 0.9305555555555556, "eval_auc": 0.9567901234567903, "eval_balanced_acc": 0.9305555555555556, "eval_f1": 0.927536231884058, "eval_fn": 8, "eval_fp": 2, "eval_gmean": 0.9296222517045284, "eval_loss": 0.26165008544921875, "eval_matthews_correlation": 0.8641167436739938, "eval_precision": 0.9696969696969697, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.9567901234567903, "eval_runtime": 1.6127, "eval_samples_per_second": 89.292, "eval_specificity": 0.9722222222222222, "eval_steps_per_second": 0.62, "eval_tn": 70, "eval_tp": 64, "step": 1188 }, { "epoch": 34.0, "eval_accuracy": 0.9444444444444444, "eval_auc": 0.9633487654320988, "eval_balanced_acc": 0.9444444444444444, "eval_f1": 0.9411764705882353, "eval_fn": 8, "eval_fp": 0, "eval_gmean": 0.9428090415820634, "eval_loss": 0.20786191523075104, "eval_matthews_correlation": 0.8944271909999159, "eval_precision": 1.0, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.9633487654320988, "eval_runtime": 1.574, "eval_samples_per_second": 91.488, "eval_specificity": 1.0, "eval_steps_per_second": 0.635, "eval_tn": 72, "eval_tp": 64, "step": 1224 }, { "epoch": 35.0, "eval_accuracy": 0.9166666666666666, "eval_auc": 0.9575617283950617, "eval_balanced_acc": 0.9166666666666667, "eval_f1": 0.9090909090909091, "eval_fn": 12, "eval_fp": 0, "eval_gmean": 0.9128709291752769, "eval_loss": 0.23990610241889954, "eval_matthews_correlation": 0.8451542547285166, "eval_precision": 1.0, "eval_recall": 0.8333333333333334, "eval_roc_auc": 0.9575617283950617, "eval_runtime": 1.5748, "eval_samples_per_second": 91.441, "eval_specificity": 1.0, "eval_steps_per_second": 0.635, "eval_tn": 72, "eval_tp": 60, "step": 1260 }, { "epoch": 36.0, "eval_accuracy": 0.9236111111111112, "eval_auc": 0.9538966049382716, "eval_balanced_acc": 0.9236111111111112, "eval_f1": 0.9185185185185185, "eval_fn": 10, "eval_fp": 1, "eval_gmean": 0.9214940230776874, "eval_loss": 0.23596133291721344, "eval_matthews_correlation": 0.8539197353171429, "eval_precision": 0.9841269841269841, "eval_recall": 0.8611111111111112, "eval_roc_auc": 0.9538966049382716, "eval_runtime": 1.5725, "eval_samples_per_second": 91.573, "eval_specificity": 0.9861111111111112, "eval_steps_per_second": 0.636, "eval_tn": 71, "eval_tp": 62, "step": 1296 }, { "epoch": 37.0, "eval_accuracy": 0.9305555555555556, "eval_auc": 0.9683641975308642, "eval_balanced_acc": 0.9305555555555556, "eval_f1": 0.927536231884058, "eval_fn": 8, "eval_fp": 2, "eval_gmean": 0.9296222517045284, "eval_loss": 0.24645011126995087, "eval_matthews_correlation": 0.8641167436739938, "eval_precision": 0.9696969696969697, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.9683641975308642, "eval_runtime": 1.5741, "eval_samples_per_second": 91.483, "eval_specificity": 0.9722222222222222, "eval_steps_per_second": 0.635, "eval_tn": 70, "eval_tp": 64, "step": 1332 }, { "epoch": 38.0, "eval_accuracy": 0.9375, "eval_auc": 0.9710648148148149, "eval_balanced_acc": 0.9375, "eval_f1": 0.9343065693430657, "eval_fn": 8, "eval_fp": 1, "eval_gmean": 0.9362388636862621, "eval_loss": 0.20392011106014252, "eval_matthews_correlation": 0.8791648688396009, "eval_precision": 0.9846153846153847, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.9710648148148149, "eval_runtime": 1.5784, "eval_samples_per_second": 91.233, "eval_specificity": 0.9861111111111112, "eval_steps_per_second": 0.634, "eval_tn": 71, "eval_tp": 64, "step": 1368 }, { "epoch": 39.0, "eval_accuracy": 0.9375, "eval_auc": 0.9737654320987655, "eval_balanced_acc": 0.9375, "eval_f1": 0.9343065693430657, "eval_fn": 8, "eval_fp": 1, "eval_gmean": 0.9362388636862621, "eval_loss": 0.1912021040916443, "eval_matthews_correlation": 0.8791648688396009, "eval_precision": 0.9846153846153847, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.9737654320987655, "eval_runtime": 1.5696, "eval_samples_per_second": 91.745, "eval_specificity": 0.9861111111111112, "eval_steps_per_second": 0.637, "eval_tn": 71, "eval_tp": 64, "step": 1404 }, { "epoch": 40.0, "eval_accuracy": 0.9444444444444444, "eval_auc": 0.970679012345679, "eval_balanced_acc": 0.9444444444444444, "eval_f1": 0.9411764705882353, "eval_fn": 8, "eval_fp": 0, "eval_gmean": 0.9428090415820634, "eval_loss": 0.20200136303901672, "eval_matthews_correlation": 0.8944271909999159, "eval_precision": 1.0, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.970679012345679, "eval_runtime": 1.6039, "eval_samples_per_second": 89.78, "eval_specificity": 1.0, "eval_steps_per_second": 0.623, "eval_tn": 72, "eval_tp": 64, "step": 1440 }, { "epoch": 41.0, "eval_accuracy": 0.9444444444444444, "eval_auc": 0.9758873456790124, "eval_balanced_acc": 0.9444444444444444, "eval_f1": 0.9411764705882353, "eval_fn": 8, "eval_fp": 0, "eval_gmean": 0.9428090415820634, "eval_loss": 0.1961589753627777, "eval_matthews_correlation": 0.8944271909999159, "eval_precision": 1.0, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.9758873456790124, "eval_runtime": 1.5711, "eval_samples_per_second": 91.653, "eval_specificity": 1.0, "eval_steps_per_second": 0.636, "eval_tn": 72, "eval_tp": 64, "step": 1476 }, { "epoch": 41.666666666666664, "grad_norm": 0.13324905931949615, "learning_rate": 8.771929824561403e-05, "loss": 0.1136, "step": 1500 }, { "epoch": 42.0, "eval_accuracy": 0.9444444444444444, "eval_auc": 0.9751157407407407, "eval_balanced_acc": 0.9444444444444444, "eval_f1": 0.9411764705882353, "eval_fn": 8, "eval_fp": 0, "eval_gmean": 0.9428090415820634, "eval_loss": 0.1993894726037979, "eval_matthews_correlation": 0.8944271909999159, "eval_precision": 1.0, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.9751157407407407, "eval_runtime": 1.5781, "eval_samples_per_second": 91.25, "eval_specificity": 1.0, "eval_steps_per_second": 0.634, "eval_tn": 72, "eval_tp": 64, "step": 1512 }, { "epoch": 43.0, "eval_accuracy": 0.9375, "eval_auc": 0.9810956790123457, "eval_balanced_acc": 0.9375, "eval_f1": 0.9343065693430657, "eval_fn": 8, "eval_fp": 1, "eval_gmean": 0.9362388636862621, "eval_loss": 0.1959426999092102, "eval_matthews_correlation": 0.8791648688396009, "eval_precision": 0.9846153846153847, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.9810956790123457, "eval_runtime": 1.5846, "eval_samples_per_second": 90.874, "eval_specificity": 0.9861111111111112, "eval_steps_per_second": 0.631, "eval_tn": 71, "eval_tp": 64, "step": 1548 }, { "epoch": 44.0, "eval_accuracy": 0.9375, "eval_auc": 0.9824459876543209, "eval_balanced_acc": 0.9375, "eval_f1": 0.9343065693430657, "eval_fn": 8, "eval_fp": 1, "eval_gmean": 0.9362388636862621, "eval_loss": 0.19525253772735596, "eval_matthews_correlation": 0.8791648688396009, "eval_precision": 0.9846153846153847, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.9824459876543209, "eval_runtime": 1.5729, "eval_samples_per_second": 91.553, "eval_specificity": 0.9861111111111112, "eval_steps_per_second": 0.636, "eval_tn": 71, "eval_tp": 64, "step": 1584 }, { "epoch": 45.0, "eval_accuracy": 0.9444444444444444, "eval_auc": 0.9836033950617284, "eval_balanced_acc": 0.9444444444444444, "eval_f1": 0.9411764705882353, "eval_fn": 8, "eval_fp": 0, "eval_gmean": 0.9428090415820634, "eval_loss": 0.19979047775268555, "eval_matthews_correlation": 0.8944271909999159, "eval_precision": 1.0, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.9836033950617284, "eval_runtime": 1.5771, "eval_samples_per_second": 91.309, "eval_specificity": 1.0, "eval_steps_per_second": 0.634, "eval_tn": 72, "eval_tp": 64, "step": 1620 }, { "epoch": 46.0, "eval_accuracy": 0.9375, "eval_auc": 0.9818672839506173, "eval_balanced_acc": 0.9375, "eval_f1": 0.9343065693430657, "eval_fn": 8, "eval_fp": 1, "eval_gmean": 0.9362388636862621, "eval_loss": 0.19916905462741852, "eval_matthews_correlation": 0.8791648688396009, "eval_precision": 0.9846153846153847, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.9818672839506173, "eval_runtime": 1.5731, "eval_samples_per_second": 91.542, "eval_specificity": 0.9861111111111112, "eval_steps_per_second": 0.636, "eval_tn": 71, "eval_tp": 64, "step": 1656 }, { "epoch": 47.0, "eval_accuracy": 0.9444444444444444, "eval_auc": 0.9820601851851852, "eval_balanced_acc": 0.9444444444444444, "eval_f1": 0.9411764705882353, "eval_fn": 8, "eval_fp": 0, "eval_gmean": 0.9428090415820634, "eval_loss": 0.20321370661258698, "eval_matthews_correlation": 0.8944271909999159, "eval_precision": 1.0, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.9820601851851852, "eval_runtime": 1.5764, "eval_samples_per_second": 91.349, "eval_specificity": 1.0, "eval_steps_per_second": 0.634, "eval_tn": 72, "eval_tp": 64, "step": 1692 }, { "epoch": 48.0, "eval_accuracy": 0.9444444444444444, "eval_auc": 0.9809027777777778, "eval_balanced_acc": 0.9444444444444444, "eval_f1": 0.9411764705882353, "eval_fn": 8, "eval_fp": 0, "eval_gmean": 0.9428090415820634, "eval_loss": 0.2023700326681137, "eval_matthews_correlation": 0.8944271909999159, "eval_precision": 1.0, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.9809027777777778, "eval_runtime": 1.5713, "eval_samples_per_second": 91.644, "eval_specificity": 1.0, "eval_steps_per_second": 0.636, "eval_tn": 72, "eval_tp": 64, "step": 1728 }, { "epoch": 49.0, "eval_accuracy": 0.9444444444444444, "eval_auc": 0.9803240740740742, "eval_balanced_acc": 0.9444444444444444, "eval_f1": 0.9411764705882353, "eval_fn": 8, "eval_fp": 0, "eval_gmean": 0.9428090415820634, "eval_loss": 0.20228758454322815, "eval_matthews_correlation": 0.8944271909999159, "eval_precision": 1.0, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.9803240740740742, "eval_runtime": 1.5796, "eval_samples_per_second": 91.16, "eval_specificity": 1.0, "eval_steps_per_second": 0.633, "eval_tn": 72, "eval_tp": 64, "step": 1764 }, { "epoch": 50.0, "eval_accuracy": 0.9375, "eval_auc": 0.9797453703703703, "eval_balanced_acc": 0.9375, "eval_f1": 0.9343065693430657, "eval_fn": 8, "eval_fp": 1, "eval_gmean": 0.9362388636862621, "eval_loss": 0.20149865746498108, "eval_matthews_correlation": 0.8791648688396009, "eval_precision": 0.9846153846153847, "eval_recall": 0.8888888888888888, "eval_roc_auc": 0.9797453703703703, "eval_runtime": 1.5697, "eval_samples_per_second": 91.74, "eval_specificity": 0.9861111111111112, "eval_steps_per_second": 0.637, "eval_tn": 71, "eval_tp": 64, "step": 1800 } ], "logging_steps": 500, "max_steps": 1800, "num_input_tokens_seen": 0, "num_train_epochs": 50, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 7568362736557056.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }