|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 50.0, |
|
"eval_steps": 500, |
|
"global_step": 1800, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.7152777777777778, |
|
"eval_auc": 0.7881944444444445, |
|
"eval_balanced_acc": 0.7152777777777778, |
|
"eval_f1": 0.7320261437908496, |
|
"eval_fn": 16, |
|
"eval_fp": 25, |
|
"eval_gmean": 0.71254196324337, |
|
"eval_loss": 0.660514771938324, |
|
"eval_matthews_correlation": 0.43395920975133495, |
|
"eval_precision": 0.691358024691358, |
|
"eval_recall": 0.7777777777777778, |
|
"eval_roc_auc": 0.7881944444444445, |
|
"eval_runtime": 1.7448, |
|
"eval_samples_per_second": 82.531, |
|
"eval_specificity": 0.6527777777777778, |
|
"eval_steps_per_second": 0.573, |
|
"eval_tn": 47, |
|
"eval_tp": 56, |
|
"step": 36 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.7291666666666666, |
|
"eval_auc": 0.8784722222222222, |
|
"eval_balanced_acc": 0.7291666666666666, |
|
"eval_f1": 0.6285714285714286, |
|
"eval_fn": 39, |
|
"eval_fp": 0, |
|
"eval_gmean": 0.67700320038633, |
|
"eval_loss": 0.5545561909675598, |
|
"eval_matthews_correlation": 0.5452497568062706, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.4583333333333333, |
|
"eval_roc_auc": 0.8784722222222222, |
|
"eval_runtime": 1.564, |
|
"eval_samples_per_second": 92.072, |
|
"eval_specificity": 1.0, |
|
"eval_steps_per_second": 0.639, |
|
"eval_tn": 72, |
|
"eval_tp": 33, |
|
"step": 72 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.8055555555555556, |
|
"eval_auc": 0.8809799382716048, |
|
"eval_balanced_acc": 0.8055555555555556, |
|
"eval_f1": 0.7704918032786885, |
|
"eval_fn": 25, |
|
"eval_fp": 3, |
|
"eval_gmean": 0.7909353347168805, |
|
"eval_loss": 0.41891196370124817, |
|
"eval_matthews_correlation": 0.6418059625907361, |
|
"eval_precision": 0.94, |
|
"eval_recall": 0.6527777777777778, |
|
"eval_roc_auc": 0.8809799382716048, |
|
"eval_runtime": 1.5621, |
|
"eval_samples_per_second": 92.185, |
|
"eval_specificity": 0.9583333333333334, |
|
"eval_steps_per_second": 0.64, |
|
"eval_tn": 69, |
|
"eval_tp": 47, |
|
"step": 108 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.875, |
|
"eval_auc": 0.9261188271604939, |
|
"eval_balanced_acc": 0.875, |
|
"eval_f1": 0.8695652173913043, |
|
"eval_fn": 12, |
|
"eval_fp": 6, |
|
"eval_gmean": 0.8740073734751262, |
|
"eval_loss": 0.3357275724411011, |
|
"eval_matthews_correlation": 0.7526178090063818, |
|
"eval_precision": 0.9090909090909091, |
|
"eval_recall": 0.8333333333333334, |
|
"eval_roc_auc": 0.9261188271604939, |
|
"eval_runtime": 1.5641, |
|
"eval_samples_per_second": 92.065, |
|
"eval_specificity": 0.9166666666666666, |
|
"eval_steps_per_second": 0.639, |
|
"eval_tn": 66, |
|
"eval_tp": 60, |
|
"step": 144 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.8611111111111112, |
|
"eval_auc": 0.91820987654321, |
|
"eval_balanced_acc": 0.8611111111111112, |
|
"eval_f1": 0.8529411764705882, |
|
"eval_fn": 14, |
|
"eval_fp": 6, |
|
"eval_gmean": 0.8593171276810011, |
|
"eval_loss": 0.3432258367538452, |
|
"eval_matthews_correlation": 0.7267220926874316, |
|
"eval_precision": 0.90625, |
|
"eval_recall": 0.8055555555555556, |
|
"eval_roc_auc": 0.91820987654321, |
|
"eval_runtime": 1.6068, |
|
"eval_samples_per_second": 89.618, |
|
"eval_specificity": 0.9166666666666666, |
|
"eval_steps_per_second": 0.622, |
|
"eval_tn": 66, |
|
"eval_tp": 58, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.8541666666666666, |
|
"eval_auc": 0.9330632716049384, |
|
"eval_balanced_acc": 0.8541666666666667, |
|
"eval_f1": 0.8372093023255814, |
|
"eval_fn": 18, |
|
"eval_fp": 3, |
|
"eval_gmean": 0.8477912478906585, |
|
"eval_loss": 0.34070253372192383, |
|
"eval_matthews_correlation": 0.7242243488319184, |
|
"eval_precision": 0.9473684210526315, |
|
"eval_recall": 0.75, |
|
"eval_roc_auc": 0.9330632716049384, |
|
"eval_runtime": 1.5703, |
|
"eval_samples_per_second": 91.705, |
|
"eval_specificity": 0.9583333333333334, |
|
"eval_steps_per_second": 0.637, |
|
"eval_tn": 69, |
|
"eval_tp": 54, |
|
"step": 216 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.8611111111111112, |
|
"eval_auc": 0.9386574074074074, |
|
"eval_balanced_acc": 0.8611111111111112, |
|
"eval_f1": 0.8591549295774648, |
|
"eval_fn": 11, |
|
"eval_fp": 9, |
|
"eval_gmean": 0.8609990966571593, |
|
"eval_loss": 0.36071789264678955, |
|
"eval_matthews_correlation": 0.7225010186897469, |
|
"eval_precision": 0.8714285714285714, |
|
"eval_recall": 0.8472222222222222, |
|
"eval_roc_auc": 0.9386574074074074, |
|
"eval_runtime": 1.5692, |
|
"eval_samples_per_second": 91.766, |
|
"eval_specificity": 0.875, |
|
"eval_steps_per_second": 0.637, |
|
"eval_tn": 63, |
|
"eval_tp": 61, |
|
"step": 252 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.8680555555555556, |
|
"eval_auc": 0.9415509259259259, |
|
"eval_balanced_acc": 0.8680555555555556, |
|
"eval_f1": 0.8527131782945736, |
|
"eval_fn": 17, |
|
"eval_fp": 2, |
|
"eval_gmean": 0.8617828920826983, |
|
"eval_loss": 0.3144780695438385, |
|
"eval_matthews_correlation": 0.7526253036880721, |
|
"eval_precision": 0.9649122807017544, |
|
"eval_recall": 0.7638888888888888, |
|
"eval_roc_auc": 0.9415509259259259, |
|
"eval_runtime": 1.564, |
|
"eval_samples_per_second": 92.069, |
|
"eval_specificity": 0.9722222222222222, |
|
"eval_steps_per_second": 0.639, |
|
"eval_tn": 70, |
|
"eval_tp": 55, |
|
"step": 288 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.8888888888888888, |
|
"eval_auc": 0.9461805555555556, |
|
"eval_balanced_acc": 0.8888888888888888, |
|
"eval_f1": 0.875, |
|
"eval_fn": 16, |
|
"eval_fp": 0, |
|
"eval_gmean": 0.8819171036881969, |
|
"eval_loss": 0.29493772983551025, |
|
"eval_matthews_correlation": 0.7977240352174656, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.7777777777777778, |
|
"eval_roc_auc": 0.9461805555555556, |
|
"eval_runtime": 1.5731, |
|
"eval_samples_per_second": 91.538, |
|
"eval_specificity": 1.0, |
|
"eval_steps_per_second": 0.636, |
|
"eval_tn": 72, |
|
"eval_tp": 56, |
|
"step": 324 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.8888888888888888, |
|
"eval_auc": 0.9157021604938271, |
|
"eval_balanced_acc": 0.8888888888888888, |
|
"eval_f1": 0.8787878787878788, |
|
"eval_fn": 14, |
|
"eval_fp": 2, |
|
"eval_gmean": 0.8849740178929996, |
|
"eval_loss": 0.28407514095306396, |
|
"eval_matthews_correlation": 0.7888106377466154, |
|
"eval_precision": 0.9666666666666667, |
|
"eval_recall": 0.8055555555555556, |
|
"eval_roc_auc": 0.9157021604938271, |
|
"eval_runtime": 1.5699, |
|
"eval_samples_per_second": 91.725, |
|
"eval_specificity": 0.9722222222222222, |
|
"eval_steps_per_second": 0.637, |
|
"eval_tn": 70, |
|
"eval_tp": 58, |
|
"step": 360 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_accuracy": 0.8888888888888888, |
|
"eval_auc": 0.929398148148148, |
|
"eval_balanced_acc": 0.8888888888888888, |
|
"eval_f1": 0.8873239436619719, |
|
"eval_fn": 9, |
|
"eval_fp": 7, |
|
"eval_gmean": 0.8887803753208976, |
|
"eval_loss": 0.33784234523773193, |
|
"eval_matthews_correlation": 0.7780780201274198, |
|
"eval_precision": 0.9, |
|
"eval_recall": 0.875, |
|
"eval_roc_auc": 0.929398148148148, |
|
"eval_runtime": 1.5762, |
|
"eval_samples_per_second": 91.359, |
|
"eval_specificity": 0.9027777777777778, |
|
"eval_steps_per_second": 0.634, |
|
"eval_tn": 65, |
|
"eval_tp": 63, |
|
"step": 396 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_accuracy": 0.875, |
|
"eval_auc": 0.9430941358024691, |
|
"eval_balanced_acc": 0.875, |
|
"eval_f1": 0.8676470588235294, |
|
"eval_fn": 13, |
|
"eval_fp": 5, |
|
"eval_gmean": 0.8732345505343416, |
|
"eval_loss": 0.30290982127189636, |
|
"eval_matthews_correlation": 0.754672942406179, |
|
"eval_precision": 0.921875, |
|
"eval_recall": 0.8194444444444444, |
|
"eval_roc_auc": 0.9430941358024691, |
|
"eval_runtime": 1.5674, |
|
"eval_samples_per_second": 91.874, |
|
"eval_specificity": 0.9305555555555556, |
|
"eval_steps_per_second": 0.638, |
|
"eval_tn": 67, |
|
"eval_tp": 59, |
|
"step": 432 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_accuracy": 0.875, |
|
"eval_auc": 0.9290123456790124, |
|
"eval_balanced_acc": 0.875, |
|
"eval_f1": 0.8732394366197183, |
|
"eval_fn": 10, |
|
"eval_fp": 8, |
|
"eval_gmean": 0.8748897637790901, |
|
"eval_loss": 0.33074280619621277, |
|
"eval_matthews_correlation": 0.7502895194085833, |
|
"eval_precision": 0.8857142857142857, |
|
"eval_recall": 0.8611111111111112, |
|
"eval_roc_auc": 0.9290123456790124, |
|
"eval_runtime": 1.5785, |
|
"eval_samples_per_second": 91.228, |
|
"eval_specificity": 0.8888888888888888, |
|
"eval_steps_per_second": 0.634, |
|
"eval_tn": 64, |
|
"eval_tp": 62, |
|
"step": 468 |
|
}, |
|
{ |
|
"epoch": 13.88888888888889, |
|
"grad_norm": 1.0406557321548462, |
|
"learning_rate": 0.00038011695906432747, |
|
"loss": 0.3831, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_accuracy": 0.8819444444444444, |
|
"eval_auc": 0.9479166666666667, |
|
"eval_balanced_acc": 0.8819444444444444, |
|
"eval_f1": 0.8794326241134752, |
|
"eval_fn": 10, |
|
"eval_fp": 7, |
|
"eval_gmean": 0.8816983471168822, |
|
"eval_loss": 0.31016406416893005, |
|
"eval_matthews_correlation": 0.7645528515426074, |
|
"eval_precision": 0.8985507246376812, |
|
"eval_recall": 0.8611111111111112, |
|
"eval_roc_auc": 0.9479166666666667, |
|
"eval_runtime": 1.5778, |
|
"eval_samples_per_second": 91.264, |
|
"eval_specificity": 0.9027777777777778, |
|
"eval_steps_per_second": 0.634, |
|
"eval_tn": 65, |
|
"eval_tp": 62, |
|
"step": 504 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_accuracy": 0.9097222222222222, |
|
"eval_auc": 0.9479166666666666, |
|
"eval_balanced_acc": 0.9097222222222223, |
|
"eval_f1": 0.9051094890510949, |
|
"eval_fn": 10, |
|
"eval_fp": 3, |
|
"eval_gmean": 0.9084225236537685, |
|
"eval_loss": 0.26771771907806396, |
|
"eval_matthews_correlation": 0.8233448771672452, |
|
"eval_precision": 0.9538461538461539, |
|
"eval_recall": 0.8611111111111112, |
|
"eval_roc_auc": 0.9479166666666666, |
|
"eval_runtime": 1.5734, |
|
"eval_samples_per_second": 91.52, |
|
"eval_specificity": 0.9583333333333334, |
|
"eval_steps_per_second": 0.636, |
|
"eval_tn": 69, |
|
"eval_tp": 62, |
|
"step": 540 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_accuracy": 0.8888888888888888, |
|
"eval_auc": 0.9598765432098766, |
|
"eval_balanced_acc": 0.8888888888888888, |
|
"eval_f1": 0.875, |
|
"eval_fn": 16, |
|
"eval_fp": 0, |
|
"eval_gmean": 0.8819171036881969, |
|
"eval_loss": 0.28312918543815613, |
|
"eval_matthews_correlation": 0.7977240352174656, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.7777777777777778, |
|
"eval_roc_auc": 0.9598765432098766, |
|
"eval_runtime": 1.5683, |
|
"eval_samples_per_second": 91.821, |
|
"eval_specificity": 1.0, |
|
"eval_steps_per_second": 0.638, |
|
"eval_tn": 72, |
|
"eval_tp": 56, |
|
"step": 576 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_accuracy": 0.9027777777777778, |
|
"eval_auc": 0.9525462962962963, |
|
"eval_balanced_acc": 0.9027777777777778, |
|
"eval_f1": 0.8939393939393939, |
|
"eval_fn": 13, |
|
"eval_fp": 1, |
|
"eval_gmean": 0.8989233958491337, |
|
"eval_loss": 0.27800989151000977, |
|
"eval_matthews_correlation": 0.816982446237566, |
|
"eval_precision": 0.9833333333333333, |
|
"eval_recall": 0.8194444444444444, |
|
"eval_roc_auc": 0.9525462962962963, |
|
"eval_runtime": 1.5821, |
|
"eval_samples_per_second": 91.016, |
|
"eval_specificity": 0.9861111111111112, |
|
"eval_steps_per_second": 0.632, |
|
"eval_tn": 71, |
|
"eval_tp": 59, |
|
"step": 612 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_accuracy": 0.9027777777777778, |
|
"eval_auc": 0.957175925925926, |
|
"eval_balanced_acc": 0.9027777777777777, |
|
"eval_f1": 0.9014084507042254, |
|
"eval_fn": 8, |
|
"eval_fp": 6, |
|
"eval_gmean": 0.90267093384844, |
|
"eval_loss": 0.2676469385623932, |
|
"eval_matthews_correlation": 0.8058665208462562, |
|
"eval_precision": 0.9142857142857143, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.957175925925926, |
|
"eval_runtime": 1.6038, |
|
"eval_samples_per_second": 89.787, |
|
"eval_specificity": 0.9166666666666666, |
|
"eval_steps_per_second": 0.624, |
|
"eval_tn": 66, |
|
"eval_tp": 64, |
|
"step": 648 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_accuracy": 0.9097222222222222, |
|
"eval_auc": 0.961033950617284, |
|
"eval_balanced_acc": 0.9097222222222223, |
|
"eval_f1": 0.9022556390977443, |
|
"eval_fn": 12, |
|
"eval_fp": 1, |
|
"eval_gmean": 0.9065093817822623, |
|
"eval_loss": 0.2535494863986969, |
|
"eval_matthews_correlation": 0.8291785292561664, |
|
"eval_precision": 0.9836065573770492, |
|
"eval_recall": 0.8333333333333334, |
|
"eval_roc_auc": 0.961033950617284, |
|
"eval_runtime": 1.5679, |
|
"eval_samples_per_second": 91.842, |
|
"eval_specificity": 0.9861111111111112, |
|
"eval_steps_per_second": 0.638, |
|
"eval_tn": 71, |
|
"eval_tp": 60, |
|
"step": 684 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_accuracy": 0.8958333333333334, |
|
"eval_auc": 0.964891975308642, |
|
"eval_balanced_acc": 0.8958333333333334, |
|
"eval_f1": 0.8888888888888888, |
|
"eval_fn": 12, |
|
"eval_fp": 3, |
|
"eval_gmean": 0.8936504412303007, |
|
"eval_loss": 0.2748485803604126, |
|
"eval_matthews_correlation": 0.7979249985750352, |
|
"eval_precision": 0.9523809523809523, |
|
"eval_recall": 0.8333333333333334, |
|
"eval_roc_auc": 0.964891975308642, |
|
"eval_runtime": 1.5824, |
|
"eval_samples_per_second": 91.003, |
|
"eval_specificity": 0.9583333333333334, |
|
"eval_steps_per_second": 0.632, |
|
"eval_tn": 69, |
|
"eval_tp": 60, |
|
"step": 720 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_accuracy": 0.8819444444444444, |
|
"eval_auc": 0.9456018518518517, |
|
"eval_balanced_acc": 0.8819444444444444, |
|
"eval_f1": 0.8874172185430463, |
|
"eval_fn": 5, |
|
"eval_fp": 12, |
|
"eval_gmean": 0.8806037491192977, |
|
"eval_loss": 0.36086082458496094, |
|
"eval_matthews_correlation": 0.7675248854948896, |
|
"eval_precision": 0.8481012658227848, |
|
"eval_recall": 0.9305555555555556, |
|
"eval_roc_auc": 0.9456018518518517, |
|
"eval_runtime": 1.5692, |
|
"eval_samples_per_second": 91.769, |
|
"eval_specificity": 0.8333333333333334, |
|
"eval_steps_per_second": 0.637, |
|
"eval_tn": 60, |
|
"eval_tp": 67, |
|
"step": 756 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_accuracy": 0.8888888888888888, |
|
"eval_auc": 0.9533179012345679, |
|
"eval_balanced_acc": 0.8888888888888888, |
|
"eval_f1": 0.8873239436619719, |
|
"eval_fn": 9, |
|
"eval_fp": 7, |
|
"eval_gmean": 0.8887803753208976, |
|
"eval_loss": 0.32595178484916687, |
|
"eval_matthews_correlation": 0.7780780201274198, |
|
"eval_precision": 0.9, |
|
"eval_recall": 0.875, |
|
"eval_roc_auc": 0.9533179012345679, |
|
"eval_runtime": 1.5845, |
|
"eval_samples_per_second": 90.883, |
|
"eval_specificity": 0.9027777777777778, |
|
"eval_steps_per_second": 0.631, |
|
"eval_tn": 65, |
|
"eval_tp": 63, |
|
"step": 792 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_accuracy": 0.9027777777777778, |
|
"eval_auc": 0.9672067901234568, |
|
"eval_balanced_acc": 0.9027777777777778, |
|
"eval_f1": 0.9, |
|
"eval_fn": 9, |
|
"eval_fp": 5, |
|
"eval_gmean": 0.9023503261544882, |
|
"eval_loss": 0.25206753611564636, |
|
"eval_matthews_correlation": 0.806801581908253, |
|
"eval_precision": 0.9264705882352942, |
|
"eval_recall": 0.875, |
|
"eval_roc_auc": 0.9672067901234568, |
|
"eval_runtime": 1.5931, |
|
"eval_samples_per_second": 90.391, |
|
"eval_specificity": 0.9305555555555556, |
|
"eval_steps_per_second": 0.628, |
|
"eval_tn": 67, |
|
"eval_tp": 63, |
|
"step": 828 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_accuracy": 0.9166666666666666, |
|
"eval_auc": 0.9457947530864197, |
|
"eval_balanced_acc": 0.9166666666666667, |
|
"eval_f1": 0.9117647058823529, |
|
"eval_fn": 10, |
|
"eval_fp": 2, |
|
"eval_gmean": 0.9149816162222558, |
|
"eval_loss": 0.24512597918510437, |
|
"eval_matthews_correlation": 0.8385254915624211, |
|
"eval_precision": 0.96875, |
|
"eval_recall": 0.8611111111111112, |
|
"eval_roc_auc": 0.9457947530864197, |
|
"eval_runtime": 1.5739, |
|
"eval_samples_per_second": 91.49, |
|
"eval_specificity": 0.9722222222222222, |
|
"eval_steps_per_second": 0.635, |
|
"eval_tn": 70, |
|
"eval_tp": 62, |
|
"step": 864 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_accuracy": 0.9097222222222222, |
|
"eval_auc": 0.9637345679012346, |
|
"eval_balanced_acc": 0.9097222222222223, |
|
"eval_f1": 0.9051094890510949, |
|
"eval_fn": 10, |
|
"eval_fp": 3, |
|
"eval_gmean": 0.9084225236537685, |
|
"eval_loss": 0.2579743564128876, |
|
"eval_matthews_correlation": 0.8233448771672452, |
|
"eval_precision": 0.9538461538461539, |
|
"eval_recall": 0.8611111111111112, |
|
"eval_roc_auc": 0.9637345679012346, |
|
"eval_runtime": 1.5981, |
|
"eval_samples_per_second": 90.107, |
|
"eval_specificity": 0.9583333333333334, |
|
"eval_steps_per_second": 0.626, |
|
"eval_tn": 69, |
|
"eval_tp": 62, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_accuracy": 0.9166666666666666, |
|
"eval_auc": 0.9591049382716049, |
|
"eval_balanced_acc": 0.9166666666666667, |
|
"eval_f1": 0.9130434782608695, |
|
"eval_fn": 9, |
|
"eval_fp": 3, |
|
"eval_gmean": 0.9157192073264963, |
|
"eval_loss": 0.23186571896076202, |
|
"eval_matthews_correlation": 0.8362420100070908, |
|
"eval_precision": 0.9545454545454546, |
|
"eval_recall": 0.875, |
|
"eval_roc_auc": 0.9591049382716049, |
|
"eval_runtime": 1.5707, |
|
"eval_samples_per_second": 91.676, |
|
"eval_specificity": 0.9583333333333334, |
|
"eval_steps_per_second": 0.637, |
|
"eval_tn": 69, |
|
"eval_tp": 63, |
|
"step": 936 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_accuracy": 0.9097222222222222, |
|
"eval_auc": 0.961033950617284, |
|
"eval_balanced_acc": 0.9097222222222222, |
|
"eval_f1": 0.9037037037037037, |
|
"eval_fn": 11, |
|
"eval_fp": 2, |
|
"eval_gmean": 0.9075727362613634, |
|
"eval_loss": 0.24382635951042175, |
|
"eval_matthews_correlation": 0.8259223669460891, |
|
"eval_precision": 0.9682539682539683, |
|
"eval_recall": 0.8472222222222222, |
|
"eval_roc_auc": 0.961033950617284, |
|
"eval_runtime": 1.5701, |
|
"eval_samples_per_second": 91.714, |
|
"eval_specificity": 0.9722222222222222, |
|
"eval_steps_per_second": 0.637, |
|
"eval_tn": 70, |
|
"eval_tp": 61, |
|
"step": 972 |
|
}, |
|
{ |
|
"epoch": 27.77777777777778, |
|
"grad_norm": 0.2868950664997101, |
|
"learning_rate": 0.00023391812865497074, |
|
"loss": 0.1759, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_accuracy": 0.9236111111111112, |
|
"eval_auc": 0.9716435185185186, |
|
"eval_balanced_acc": 0.9236111111111112, |
|
"eval_f1": 0.9185185185185185, |
|
"eval_fn": 10, |
|
"eval_fp": 1, |
|
"eval_gmean": 0.9214940230776874, |
|
"eval_loss": 0.21144364774227142, |
|
"eval_matthews_correlation": 0.8539197353171429, |
|
"eval_precision": 0.9841269841269841, |
|
"eval_recall": 0.8611111111111112, |
|
"eval_roc_auc": 0.9716435185185186, |
|
"eval_runtime": 1.5758, |
|
"eval_samples_per_second": 91.382, |
|
"eval_specificity": 0.9861111111111112, |
|
"eval_steps_per_second": 0.635, |
|
"eval_tn": 71, |
|
"eval_tp": 62, |
|
"step": 1008 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_accuracy": 0.9236111111111112, |
|
"eval_auc": 0.9670138888888891, |
|
"eval_balanced_acc": 0.9236111111111112, |
|
"eval_f1": 0.9230769230769231, |
|
"eval_fn": 6, |
|
"eval_fp": 5, |
|
"eval_gmean": 0.9235850038081277, |
|
"eval_loss": 0.2606896162033081, |
|
"eval_matthews_correlation": 0.8473039491526416, |
|
"eval_precision": 0.9295774647887324, |
|
"eval_recall": 0.9166666666666666, |
|
"eval_roc_auc": 0.9670138888888891, |
|
"eval_runtime": 1.609, |
|
"eval_samples_per_second": 89.498, |
|
"eval_specificity": 0.9305555555555556, |
|
"eval_steps_per_second": 0.622, |
|
"eval_tn": 67, |
|
"eval_tp": 66, |
|
"step": 1044 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_accuracy": 0.9236111111111112, |
|
"eval_auc": 0.9658564814814816, |
|
"eval_balanced_acc": 0.9236111111111112, |
|
"eval_f1": 0.920863309352518, |
|
"eval_fn": 8, |
|
"eval_fp": 3, |
|
"eval_gmean": 0.9229582069908973, |
|
"eval_loss": 0.24626360833644867, |
|
"eval_matthews_correlation": 0.8492725185804906, |
|
"eval_precision": 0.9552238805970149, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.9658564814814816, |
|
"eval_runtime": 1.5802, |
|
"eval_samples_per_second": 91.126, |
|
"eval_specificity": 0.9583333333333334, |
|
"eval_steps_per_second": 0.633, |
|
"eval_tn": 69, |
|
"eval_tp": 64, |
|
"step": 1080 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_accuracy": 0.9097222222222222, |
|
"eval_auc": 0.9635416666666667, |
|
"eval_balanced_acc": 0.9097222222222223, |
|
"eval_f1": 0.9051094890510949, |
|
"eval_fn": 10, |
|
"eval_fp": 3, |
|
"eval_gmean": 0.9084225236537685, |
|
"eval_loss": 0.2524122893810272, |
|
"eval_matthews_correlation": 0.8233448771672452, |
|
"eval_precision": 0.9538461538461539, |
|
"eval_recall": 0.8611111111111112, |
|
"eval_roc_auc": 0.9635416666666667, |
|
"eval_runtime": 1.606, |
|
"eval_samples_per_second": 89.664, |
|
"eval_specificity": 0.9583333333333334, |
|
"eval_steps_per_second": 0.623, |
|
"eval_tn": 69, |
|
"eval_tp": 62, |
|
"step": 1116 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_accuracy": 0.9236111111111112, |
|
"eval_auc": 0.9363425925925926, |
|
"eval_balanced_acc": 0.9236111111111112, |
|
"eval_f1": 0.9172932330827067, |
|
"eval_fn": 11, |
|
"eval_fp": 0, |
|
"eval_gmean": 0.9204467514322717, |
|
"eval_loss": 0.2489766776561737, |
|
"eval_matthews_correlation": 0.8572862760106127, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.8472222222222222, |
|
"eval_roc_auc": 0.9363425925925926, |
|
"eval_runtime": 1.6096, |
|
"eval_samples_per_second": 89.462, |
|
"eval_specificity": 1.0, |
|
"eval_steps_per_second": 0.621, |
|
"eval_tn": 72, |
|
"eval_tp": 61, |
|
"step": 1152 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_accuracy": 0.9305555555555556, |
|
"eval_auc": 0.9567901234567903, |
|
"eval_balanced_acc": 0.9305555555555556, |
|
"eval_f1": 0.927536231884058, |
|
"eval_fn": 8, |
|
"eval_fp": 2, |
|
"eval_gmean": 0.9296222517045284, |
|
"eval_loss": 0.26165008544921875, |
|
"eval_matthews_correlation": 0.8641167436739938, |
|
"eval_precision": 0.9696969696969697, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.9567901234567903, |
|
"eval_runtime": 1.6127, |
|
"eval_samples_per_second": 89.292, |
|
"eval_specificity": 0.9722222222222222, |
|
"eval_steps_per_second": 0.62, |
|
"eval_tn": 70, |
|
"eval_tp": 64, |
|
"step": 1188 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_accuracy": 0.9444444444444444, |
|
"eval_auc": 0.9633487654320988, |
|
"eval_balanced_acc": 0.9444444444444444, |
|
"eval_f1": 0.9411764705882353, |
|
"eval_fn": 8, |
|
"eval_fp": 0, |
|
"eval_gmean": 0.9428090415820634, |
|
"eval_loss": 0.20786191523075104, |
|
"eval_matthews_correlation": 0.8944271909999159, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.9633487654320988, |
|
"eval_runtime": 1.574, |
|
"eval_samples_per_second": 91.488, |
|
"eval_specificity": 1.0, |
|
"eval_steps_per_second": 0.635, |
|
"eval_tn": 72, |
|
"eval_tp": 64, |
|
"step": 1224 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_accuracy": 0.9166666666666666, |
|
"eval_auc": 0.9575617283950617, |
|
"eval_balanced_acc": 0.9166666666666667, |
|
"eval_f1": 0.9090909090909091, |
|
"eval_fn": 12, |
|
"eval_fp": 0, |
|
"eval_gmean": 0.9128709291752769, |
|
"eval_loss": 0.23990610241889954, |
|
"eval_matthews_correlation": 0.8451542547285166, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.8333333333333334, |
|
"eval_roc_auc": 0.9575617283950617, |
|
"eval_runtime": 1.5748, |
|
"eval_samples_per_second": 91.441, |
|
"eval_specificity": 1.0, |
|
"eval_steps_per_second": 0.635, |
|
"eval_tn": 72, |
|
"eval_tp": 60, |
|
"step": 1260 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_accuracy": 0.9236111111111112, |
|
"eval_auc": 0.9538966049382716, |
|
"eval_balanced_acc": 0.9236111111111112, |
|
"eval_f1": 0.9185185185185185, |
|
"eval_fn": 10, |
|
"eval_fp": 1, |
|
"eval_gmean": 0.9214940230776874, |
|
"eval_loss": 0.23596133291721344, |
|
"eval_matthews_correlation": 0.8539197353171429, |
|
"eval_precision": 0.9841269841269841, |
|
"eval_recall": 0.8611111111111112, |
|
"eval_roc_auc": 0.9538966049382716, |
|
"eval_runtime": 1.5725, |
|
"eval_samples_per_second": 91.573, |
|
"eval_specificity": 0.9861111111111112, |
|
"eval_steps_per_second": 0.636, |
|
"eval_tn": 71, |
|
"eval_tp": 62, |
|
"step": 1296 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_accuracy": 0.9305555555555556, |
|
"eval_auc": 0.9683641975308642, |
|
"eval_balanced_acc": 0.9305555555555556, |
|
"eval_f1": 0.927536231884058, |
|
"eval_fn": 8, |
|
"eval_fp": 2, |
|
"eval_gmean": 0.9296222517045284, |
|
"eval_loss": 0.24645011126995087, |
|
"eval_matthews_correlation": 0.8641167436739938, |
|
"eval_precision": 0.9696969696969697, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.9683641975308642, |
|
"eval_runtime": 1.5741, |
|
"eval_samples_per_second": 91.483, |
|
"eval_specificity": 0.9722222222222222, |
|
"eval_steps_per_second": 0.635, |
|
"eval_tn": 70, |
|
"eval_tp": 64, |
|
"step": 1332 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_accuracy": 0.9375, |
|
"eval_auc": 0.9710648148148149, |
|
"eval_balanced_acc": 0.9375, |
|
"eval_f1": 0.9343065693430657, |
|
"eval_fn": 8, |
|
"eval_fp": 1, |
|
"eval_gmean": 0.9362388636862621, |
|
"eval_loss": 0.20392011106014252, |
|
"eval_matthews_correlation": 0.8791648688396009, |
|
"eval_precision": 0.9846153846153847, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.9710648148148149, |
|
"eval_runtime": 1.5784, |
|
"eval_samples_per_second": 91.233, |
|
"eval_specificity": 0.9861111111111112, |
|
"eval_steps_per_second": 0.634, |
|
"eval_tn": 71, |
|
"eval_tp": 64, |
|
"step": 1368 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_accuracy": 0.9375, |
|
"eval_auc": 0.9737654320987655, |
|
"eval_balanced_acc": 0.9375, |
|
"eval_f1": 0.9343065693430657, |
|
"eval_fn": 8, |
|
"eval_fp": 1, |
|
"eval_gmean": 0.9362388636862621, |
|
"eval_loss": 0.1912021040916443, |
|
"eval_matthews_correlation": 0.8791648688396009, |
|
"eval_precision": 0.9846153846153847, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.9737654320987655, |
|
"eval_runtime": 1.5696, |
|
"eval_samples_per_second": 91.745, |
|
"eval_specificity": 0.9861111111111112, |
|
"eval_steps_per_second": 0.637, |
|
"eval_tn": 71, |
|
"eval_tp": 64, |
|
"step": 1404 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_accuracy": 0.9444444444444444, |
|
"eval_auc": 0.970679012345679, |
|
"eval_balanced_acc": 0.9444444444444444, |
|
"eval_f1": 0.9411764705882353, |
|
"eval_fn": 8, |
|
"eval_fp": 0, |
|
"eval_gmean": 0.9428090415820634, |
|
"eval_loss": 0.20200136303901672, |
|
"eval_matthews_correlation": 0.8944271909999159, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.970679012345679, |
|
"eval_runtime": 1.6039, |
|
"eval_samples_per_second": 89.78, |
|
"eval_specificity": 1.0, |
|
"eval_steps_per_second": 0.623, |
|
"eval_tn": 72, |
|
"eval_tp": 64, |
|
"step": 1440 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_accuracy": 0.9444444444444444, |
|
"eval_auc": 0.9758873456790124, |
|
"eval_balanced_acc": 0.9444444444444444, |
|
"eval_f1": 0.9411764705882353, |
|
"eval_fn": 8, |
|
"eval_fp": 0, |
|
"eval_gmean": 0.9428090415820634, |
|
"eval_loss": 0.1961589753627777, |
|
"eval_matthews_correlation": 0.8944271909999159, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.9758873456790124, |
|
"eval_runtime": 1.5711, |
|
"eval_samples_per_second": 91.653, |
|
"eval_specificity": 1.0, |
|
"eval_steps_per_second": 0.636, |
|
"eval_tn": 72, |
|
"eval_tp": 64, |
|
"step": 1476 |
|
}, |
|
{ |
|
"epoch": 41.666666666666664, |
|
"grad_norm": 0.13324905931949615, |
|
"learning_rate": 8.771929824561403e-05, |
|
"loss": 0.1136, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_accuracy": 0.9444444444444444, |
|
"eval_auc": 0.9751157407407407, |
|
"eval_balanced_acc": 0.9444444444444444, |
|
"eval_f1": 0.9411764705882353, |
|
"eval_fn": 8, |
|
"eval_fp": 0, |
|
"eval_gmean": 0.9428090415820634, |
|
"eval_loss": 0.1993894726037979, |
|
"eval_matthews_correlation": 0.8944271909999159, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.9751157407407407, |
|
"eval_runtime": 1.5781, |
|
"eval_samples_per_second": 91.25, |
|
"eval_specificity": 1.0, |
|
"eval_steps_per_second": 0.634, |
|
"eval_tn": 72, |
|
"eval_tp": 64, |
|
"step": 1512 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_accuracy": 0.9375, |
|
"eval_auc": 0.9810956790123457, |
|
"eval_balanced_acc": 0.9375, |
|
"eval_f1": 0.9343065693430657, |
|
"eval_fn": 8, |
|
"eval_fp": 1, |
|
"eval_gmean": 0.9362388636862621, |
|
"eval_loss": 0.1959426999092102, |
|
"eval_matthews_correlation": 0.8791648688396009, |
|
"eval_precision": 0.9846153846153847, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.9810956790123457, |
|
"eval_runtime": 1.5846, |
|
"eval_samples_per_second": 90.874, |
|
"eval_specificity": 0.9861111111111112, |
|
"eval_steps_per_second": 0.631, |
|
"eval_tn": 71, |
|
"eval_tp": 64, |
|
"step": 1548 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_accuracy": 0.9375, |
|
"eval_auc": 0.9824459876543209, |
|
"eval_balanced_acc": 0.9375, |
|
"eval_f1": 0.9343065693430657, |
|
"eval_fn": 8, |
|
"eval_fp": 1, |
|
"eval_gmean": 0.9362388636862621, |
|
"eval_loss": 0.19525253772735596, |
|
"eval_matthews_correlation": 0.8791648688396009, |
|
"eval_precision": 0.9846153846153847, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.9824459876543209, |
|
"eval_runtime": 1.5729, |
|
"eval_samples_per_second": 91.553, |
|
"eval_specificity": 0.9861111111111112, |
|
"eval_steps_per_second": 0.636, |
|
"eval_tn": 71, |
|
"eval_tp": 64, |
|
"step": 1584 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_accuracy": 0.9444444444444444, |
|
"eval_auc": 0.9836033950617284, |
|
"eval_balanced_acc": 0.9444444444444444, |
|
"eval_f1": 0.9411764705882353, |
|
"eval_fn": 8, |
|
"eval_fp": 0, |
|
"eval_gmean": 0.9428090415820634, |
|
"eval_loss": 0.19979047775268555, |
|
"eval_matthews_correlation": 0.8944271909999159, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.9836033950617284, |
|
"eval_runtime": 1.5771, |
|
"eval_samples_per_second": 91.309, |
|
"eval_specificity": 1.0, |
|
"eval_steps_per_second": 0.634, |
|
"eval_tn": 72, |
|
"eval_tp": 64, |
|
"step": 1620 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_accuracy": 0.9375, |
|
"eval_auc": 0.9818672839506173, |
|
"eval_balanced_acc": 0.9375, |
|
"eval_f1": 0.9343065693430657, |
|
"eval_fn": 8, |
|
"eval_fp": 1, |
|
"eval_gmean": 0.9362388636862621, |
|
"eval_loss": 0.19916905462741852, |
|
"eval_matthews_correlation": 0.8791648688396009, |
|
"eval_precision": 0.9846153846153847, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.9818672839506173, |
|
"eval_runtime": 1.5731, |
|
"eval_samples_per_second": 91.542, |
|
"eval_specificity": 0.9861111111111112, |
|
"eval_steps_per_second": 0.636, |
|
"eval_tn": 71, |
|
"eval_tp": 64, |
|
"step": 1656 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_accuracy": 0.9444444444444444, |
|
"eval_auc": 0.9820601851851852, |
|
"eval_balanced_acc": 0.9444444444444444, |
|
"eval_f1": 0.9411764705882353, |
|
"eval_fn": 8, |
|
"eval_fp": 0, |
|
"eval_gmean": 0.9428090415820634, |
|
"eval_loss": 0.20321370661258698, |
|
"eval_matthews_correlation": 0.8944271909999159, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.9820601851851852, |
|
"eval_runtime": 1.5764, |
|
"eval_samples_per_second": 91.349, |
|
"eval_specificity": 1.0, |
|
"eval_steps_per_second": 0.634, |
|
"eval_tn": 72, |
|
"eval_tp": 64, |
|
"step": 1692 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_accuracy": 0.9444444444444444, |
|
"eval_auc": 0.9809027777777778, |
|
"eval_balanced_acc": 0.9444444444444444, |
|
"eval_f1": 0.9411764705882353, |
|
"eval_fn": 8, |
|
"eval_fp": 0, |
|
"eval_gmean": 0.9428090415820634, |
|
"eval_loss": 0.2023700326681137, |
|
"eval_matthews_correlation": 0.8944271909999159, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.9809027777777778, |
|
"eval_runtime": 1.5713, |
|
"eval_samples_per_second": 91.644, |
|
"eval_specificity": 1.0, |
|
"eval_steps_per_second": 0.636, |
|
"eval_tn": 72, |
|
"eval_tp": 64, |
|
"step": 1728 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_accuracy": 0.9444444444444444, |
|
"eval_auc": 0.9803240740740742, |
|
"eval_balanced_acc": 0.9444444444444444, |
|
"eval_f1": 0.9411764705882353, |
|
"eval_fn": 8, |
|
"eval_fp": 0, |
|
"eval_gmean": 0.9428090415820634, |
|
"eval_loss": 0.20228758454322815, |
|
"eval_matthews_correlation": 0.8944271909999159, |
|
"eval_precision": 1.0, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.9803240740740742, |
|
"eval_runtime": 1.5796, |
|
"eval_samples_per_second": 91.16, |
|
"eval_specificity": 1.0, |
|
"eval_steps_per_second": 0.633, |
|
"eval_tn": 72, |
|
"eval_tp": 64, |
|
"step": 1764 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_accuracy": 0.9375, |
|
"eval_auc": 0.9797453703703703, |
|
"eval_balanced_acc": 0.9375, |
|
"eval_f1": 0.9343065693430657, |
|
"eval_fn": 8, |
|
"eval_fp": 1, |
|
"eval_gmean": 0.9362388636862621, |
|
"eval_loss": 0.20149865746498108, |
|
"eval_matthews_correlation": 0.8791648688396009, |
|
"eval_precision": 0.9846153846153847, |
|
"eval_recall": 0.8888888888888888, |
|
"eval_roc_auc": 0.9797453703703703, |
|
"eval_runtime": 1.5697, |
|
"eval_samples_per_second": 91.74, |
|
"eval_specificity": 0.9861111111111112, |
|
"eval_steps_per_second": 0.637, |
|
"eval_tn": 71, |
|
"eval_tp": 64, |
|
"step": 1800 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 1800, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 50, |
|
"save_steps": 500, |
|
"stateful_callbacks": { |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": true |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 7568362736557056.0, |
|
"train_batch_size": 16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|