xBitterT5-720 / trainer_state.json
ndhieunguyen's picture
Upload 12 files
7865125 verified
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 50.0,
"eval_steps": 500,
"global_step": 1800,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.7152777777777778,
"eval_auc": 0.7881944444444445,
"eval_balanced_acc": 0.7152777777777778,
"eval_f1": 0.7320261437908496,
"eval_fn": 16,
"eval_fp": 25,
"eval_gmean": 0.71254196324337,
"eval_loss": 0.660514771938324,
"eval_matthews_correlation": 0.43395920975133495,
"eval_precision": 0.691358024691358,
"eval_recall": 0.7777777777777778,
"eval_roc_auc": 0.7881944444444445,
"eval_runtime": 1.7448,
"eval_samples_per_second": 82.531,
"eval_specificity": 0.6527777777777778,
"eval_steps_per_second": 0.573,
"eval_tn": 47,
"eval_tp": 56,
"step": 36
},
{
"epoch": 2.0,
"eval_accuracy": 0.7291666666666666,
"eval_auc": 0.8784722222222222,
"eval_balanced_acc": 0.7291666666666666,
"eval_f1": 0.6285714285714286,
"eval_fn": 39,
"eval_fp": 0,
"eval_gmean": 0.67700320038633,
"eval_loss": 0.5545561909675598,
"eval_matthews_correlation": 0.5452497568062706,
"eval_precision": 1.0,
"eval_recall": 0.4583333333333333,
"eval_roc_auc": 0.8784722222222222,
"eval_runtime": 1.564,
"eval_samples_per_second": 92.072,
"eval_specificity": 1.0,
"eval_steps_per_second": 0.639,
"eval_tn": 72,
"eval_tp": 33,
"step": 72
},
{
"epoch": 3.0,
"eval_accuracy": 0.8055555555555556,
"eval_auc": 0.8809799382716048,
"eval_balanced_acc": 0.8055555555555556,
"eval_f1": 0.7704918032786885,
"eval_fn": 25,
"eval_fp": 3,
"eval_gmean": 0.7909353347168805,
"eval_loss": 0.41891196370124817,
"eval_matthews_correlation": 0.6418059625907361,
"eval_precision": 0.94,
"eval_recall": 0.6527777777777778,
"eval_roc_auc": 0.8809799382716048,
"eval_runtime": 1.5621,
"eval_samples_per_second": 92.185,
"eval_specificity": 0.9583333333333334,
"eval_steps_per_second": 0.64,
"eval_tn": 69,
"eval_tp": 47,
"step": 108
},
{
"epoch": 4.0,
"eval_accuracy": 0.875,
"eval_auc": 0.9261188271604939,
"eval_balanced_acc": 0.875,
"eval_f1": 0.8695652173913043,
"eval_fn": 12,
"eval_fp": 6,
"eval_gmean": 0.8740073734751262,
"eval_loss": 0.3357275724411011,
"eval_matthews_correlation": 0.7526178090063818,
"eval_precision": 0.9090909090909091,
"eval_recall": 0.8333333333333334,
"eval_roc_auc": 0.9261188271604939,
"eval_runtime": 1.5641,
"eval_samples_per_second": 92.065,
"eval_specificity": 0.9166666666666666,
"eval_steps_per_second": 0.639,
"eval_tn": 66,
"eval_tp": 60,
"step": 144
},
{
"epoch": 5.0,
"eval_accuracy": 0.8611111111111112,
"eval_auc": 0.91820987654321,
"eval_balanced_acc": 0.8611111111111112,
"eval_f1": 0.8529411764705882,
"eval_fn": 14,
"eval_fp": 6,
"eval_gmean": 0.8593171276810011,
"eval_loss": 0.3432258367538452,
"eval_matthews_correlation": 0.7267220926874316,
"eval_precision": 0.90625,
"eval_recall": 0.8055555555555556,
"eval_roc_auc": 0.91820987654321,
"eval_runtime": 1.6068,
"eval_samples_per_second": 89.618,
"eval_specificity": 0.9166666666666666,
"eval_steps_per_second": 0.622,
"eval_tn": 66,
"eval_tp": 58,
"step": 180
},
{
"epoch": 6.0,
"eval_accuracy": 0.8541666666666666,
"eval_auc": 0.9330632716049384,
"eval_balanced_acc": 0.8541666666666667,
"eval_f1": 0.8372093023255814,
"eval_fn": 18,
"eval_fp": 3,
"eval_gmean": 0.8477912478906585,
"eval_loss": 0.34070253372192383,
"eval_matthews_correlation": 0.7242243488319184,
"eval_precision": 0.9473684210526315,
"eval_recall": 0.75,
"eval_roc_auc": 0.9330632716049384,
"eval_runtime": 1.5703,
"eval_samples_per_second": 91.705,
"eval_specificity": 0.9583333333333334,
"eval_steps_per_second": 0.637,
"eval_tn": 69,
"eval_tp": 54,
"step": 216
},
{
"epoch": 7.0,
"eval_accuracy": 0.8611111111111112,
"eval_auc": 0.9386574074074074,
"eval_balanced_acc": 0.8611111111111112,
"eval_f1": 0.8591549295774648,
"eval_fn": 11,
"eval_fp": 9,
"eval_gmean": 0.8609990966571593,
"eval_loss": 0.36071789264678955,
"eval_matthews_correlation": 0.7225010186897469,
"eval_precision": 0.8714285714285714,
"eval_recall": 0.8472222222222222,
"eval_roc_auc": 0.9386574074074074,
"eval_runtime": 1.5692,
"eval_samples_per_second": 91.766,
"eval_specificity": 0.875,
"eval_steps_per_second": 0.637,
"eval_tn": 63,
"eval_tp": 61,
"step": 252
},
{
"epoch": 8.0,
"eval_accuracy": 0.8680555555555556,
"eval_auc": 0.9415509259259259,
"eval_balanced_acc": 0.8680555555555556,
"eval_f1": 0.8527131782945736,
"eval_fn": 17,
"eval_fp": 2,
"eval_gmean": 0.8617828920826983,
"eval_loss": 0.3144780695438385,
"eval_matthews_correlation": 0.7526253036880721,
"eval_precision": 0.9649122807017544,
"eval_recall": 0.7638888888888888,
"eval_roc_auc": 0.9415509259259259,
"eval_runtime": 1.564,
"eval_samples_per_second": 92.069,
"eval_specificity": 0.9722222222222222,
"eval_steps_per_second": 0.639,
"eval_tn": 70,
"eval_tp": 55,
"step": 288
},
{
"epoch": 9.0,
"eval_accuracy": 0.8888888888888888,
"eval_auc": 0.9461805555555556,
"eval_balanced_acc": 0.8888888888888888,
"eval_f1": 0.875,
"eval_fn": 16,
"eval_fp": 0,
"eval_gmean": 0.8819171036881969,
"eval_loss": 0.29493772983551025,
"eval_matthews_correlation": 0.7977240352174656,
"eval_precision": 1.0,
"eval_recall": 0.7777777777777778,
"eval_roc_auc": 0.9461805555555556,
"eval_runtime": 1.5731,
"eval_samples_per_second": 91.538,
"eval_specificity": 1.0,
"eval_steps_per_second": 0.636,
"eval_tn": 72,
"eval_tp": 56,
"step": 324
},
{
"epoch": 10.0,
"eval_accuracy": 0.8888888888888888,
"eval_auc": 0.9157021604938271,
"eval_balanced_acc": 0.8888888888888888,
"eval_f1": 0.8787878787878788,
"eval_fn": 14,
"eval_fp": 2,
"eval_gmean": 0.8849740178929996,
"eval_loss": 0.28407514095306396,
"eval_matthews_correlation": 0.7888106377466154,
"eval_precision": 0.9666666666666667,
"eval_recall": 0.8055555555555556,
"eval_roc_auc": 0.9157021604938271,
"eval_runtime": 1.5699,
"eval_samples_per_second": 91.725,
"eval_specificity": 0.9722222222222222,
"eval_steps_per_second": 0.637,
"eval_tn": 70,
"eval_tp": 58,
"step": 360
},
{
"epoch": 11.0,
"eval_accuracy": 0.8888888888888888,
"eval_auc": 0.929398148148148,
"eval_balanced_acc": 0.8888888888888888,
"eval_f1": 0.8873239436619719,
"eval_fn": 9,
"eval_fp": 7,
"eval_gmean": 0.8887803753208976,
"eval_loss": 0.33784234523773193,
"eval_matthews_correlation": 0.7780780201274198,
"eval_precision": 0.9,
"eval_recall": 0.875,
"eval_roc_auc": 0.929398148148148,
"eval_runtime": 1.5762,
"eval_samples_per_second": 91.359,
"eval_specificity": 0.9027777777777778,
"eval_steps_per_second": 0.634,
"eval_tn": 65,
"eval_tp": 63,
"step": 396
},
{
"epoch": 12.0,
"eval_accuracy": 0.875,
"eval_auc": 0.9430941358024691,
"eval_balanced_acc": 0.875,
"eval_f1": 0.8676470588235294,
"eval_fn": 13,
"eval_fp": 5,
"eval_gmean": 0.8732345505343416,
"eval_loss": 0.30290982127189636,
"eval_matthews_correlation": 0.754672942406179,
"eval_precision": 0.921875,
"eval_recall": 0.8194444444444444,
"eval_roc_auc": 0.9430941358024691,
"eval_runtime": 1.5674,
"eval_samples_per_second": 91.874,
"eval_specificity": 0.9305555555555556,
"eval_steps_per_second": 0.638,
"eval_tn": 67,
"eval_tp": 59,
"step": 432
},
{
"epoch": 13.0,
"eval_accuracy": 0.875,
"eval_auc": 0.9290123456790124,
"eval_balanced_acc": 0.875,
"eval_f1": 0.8732394366197183,
"eval_fn": 10,
"eval_fp": 8,
"eval_gmean": 0.8748897637790901,
"eval_loss": 0.33074280619621277,
"eval_matthews_correlation": 0.7502895194085833,
"eval_precision": 0.8857142857142857,
"eval_recall": 0.8611111111111112,
"eval_roc_auc": 0.9290123456790124,
"eval_runtime": 1.5785,
"eval_samples_per_second": 91.228,
"eval_specificity": 0.8888888888888888,
"eval_steps_per_second": 0.634,
"eval_tn": 64,
"eval_tp": 62,
"step": 468
},
{
"epoch": 13.88888888888889,
"grad_norm": 1.0406557321548462,
"learning_rate": 0.00038011695906432747,
"loss": 0.3831,
"step": 500
},
{
"epoch": 14.0,
"eval_accuracy": 0.8819444444444444,
"eval_auc": 0.9479166666666667,
"eval_balanced_acc": 0.8819444444444444,
"eval_f1": 0.8794326241134752,
"eval_fn": 10,
"eval_fp": 7,
"eval_gmean": 0.8816983471168822,
"eval_loss": 0.31016406416893005,
"eval_matthews_correlation": 0.7645528515426074,
"eval_precision": 0.8985507246376812,
"eval_recall": 0.8611111111111112,
"eval_roc_auc": 0.9479166666666667,
"eval_runtime": 1.5778,
"eval_samples_per_second": 91.264,
"eval_specificity": 0.9027777777777778,
"eval_steps_per_second": 0.634,
"eval_tn": 65,
"eval_tp": 62,
"step": 504
},
{
"epoch": 15.0,
"eval_accuracy": 0.9097222222222222,
"eval_auc": 0.9479166666666666,
"eval_balanced_acc": 0.9097222222222223,
"eval_f1": 0.9051094890510949,
"eval_fn": 10,
"eval_fp": 3,
"eval_gmean": 0.9084225236537685,
"eval_loss": 0.26771771907806396,
"eval_matthews_correlation": 0.8233448771672452,
"eval_precision": 0.9538461538461539,
"eval_recall": 0.8611111111111112,
"eval_roc_auc": 0.9479166666666666,
"eval_runtime": 1.5734,
"eval_samples_per_second": 91.52,
"eval_specificity": 0.9583333333333334,
"eval_steps_per_second": 0.636,
"eval_tn": 69,
"eval_tp": 62,
"step": 540
},
{
"epoch": 16.0,
"eval_accuracy": 0.8888888888888888,
"eval_auc": 0.9598765432098766,
"eval_balanced_acc": 0.8888888888888888,
"eval_f1": 0.875,
"eval_fn": 16,
"eval_fp": 0,
"eval_gmean": 0.8819171036881969,
"eval_loss": 0.28312918543815613,
"eval_matthews_correlation": 0.7977240352174656,
"eval_precision": 1.0,
"eval_recall": 0.7777777777777778,
"eval_roc_auc": 0.9598765432098766,
"eval_runtime": 1.5683,
"eval_samples_per_second": 91.821,
"eval_specificity": 1.0,
"eval_steps_per_second": 0.638,
"eval_tn": 72,
"eval_tp": 56,
"step": 576
},
{
"epoch": 17.0,
"eval_accuracy": 0.9027777777777778,
"eval_auc": 0.9525462962962963,
"eval_balanced_acc": 0.9027777777777778,
"eval_f1": 0.8939393939393939,
"eval_fn": 13,
"eval_fp": 1,
"eval_gmean": 0.8989233958491337,
"eval_loss": 0.27800989151000977,
"eval_matthews_correlation": 0.816982446237566,
"eval_precision": 0.9833333333333333,
"eval_recall": 0.8194444444444444,
"eval_roc_auc": 0.9525462962962963,
"eval_runtime": 1.5821,
"eval_samples_per_second": 91.016,
"eval_specificity": 0.9861111111111112,
"eval_steps_per_second": 0.632,
"eval_tn": 71,
"eval_tp": 59,
"step": 612
},
{
"epoch": 18.0,
"eval_accuracy": 0.9027777777777778,
"eval_auc": 0.957175925925926,
"eval_balanced_acc": 0.9027777777777777,
"eval_f1": 0.9014084507042254,
"eval_fn": 8,
"eval_fp": 6,
"eval_gmean": 0.90267093384844,
"eval_loss": 0.2676469385623932,
"eval_matthews_correlation": 0.8058665208462562,
"eval_precision": 0.9142857142857143,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.957175925925926,
"eval_runtime": 1.6038,
"eval_samples_per_second": 89.787,
"eval_specificity": 0.9166666666666666,
"eval_steps_per_second": 0.624,
"eval_tn": 66,
"eval_tp": 64,
"step": 648
},
{
"epoch": 19.0,
"eval_accuracy": 0.9097222222222222,
"eval_auc": 0.961033950617284,
"eval_balanced_acc": 0.9097222222222223,
"eval_f1": 0.9022556390977443,
"eval_fn": 12,
"eval_fp": 1,
"eval_gmean": 0.9065093817822623,
"eval_loss": 0.2535494863986969,
"eval_matthews_correlation": 0.8291785292561664,
"eval_precision": 0.9836065573770492,
"eval_recall": 0.8333333333333334,
"eval_roc_auc": 0.961033950617284,
"eval_runtime": 1.5679,
"eval_samples_per_second": 91.842,
"eval_specificity": 0.9861111111111112,
"eval_steps_per_second": 0.638,
"eval_tn": 71,
"eval_tp": 60,
"step": 684
},
{
"epoch": 20.0,
"eval_accuracy": 0.8958333333333334,
"eval_auc": 0.964891975308642,
"eval_balanced_acc": 0.8958333333333334,
"eval_f1": 0.8888888888888888,
"eval_fn": 12,
"eval_fp": 3,
"eval_gmean": 0.8936504412303007,
"eval_loss": 0.2748485803604126,
"eval_matthews_correlation": 0.7979249985750352,
"eval_precision": 0.9523809523809523,
"eval_recall": 0.8333333333333334,
"eval_roc_auc": 0.964891975308642,
"eval_runtime": 1.5824,
"eval_samples_per_second": 91.003,
"eval_specificity": 0.9583333333333334,
"eval_steps_per_second": 0.632,
"eval_tn": 69,
"eval_tp": 60,
"step": 720
},
{
"epoch": 21.0,
"eval_accuracy": 0.8819444444444444,
"eval_auc": 0.9456018518518517,
"eval_balanced_acc": 0.8819444444444444,
"eval_f1": 0.8874172185430463,
"eval_fn": 5,
"eval_fp": 12,
"eval_gmean": 0.8806037491192977,
"eval_loss": 0.36086082458496094,
"eval_matthews_correlation": 0.7675248854948896,
"eval_precision": 0.8481012658227848,
"eval_recall": 0.9305555555555556,
"eval_roc_auc": 0.9456018518518517,
"eval_runtime": 1.5692,
"eval_samples_per_second": 91.769,
"eval_specificity": 0.8333333333333334,
"eval_steps_per_second": 0.637,
"eval_tn": 60,
"eval_tp": 67,
"step": 756
},
{
"epoch": 22.0,
"eval_accuracy": 0.8888888888888888,
"eval_auc": 0.9533179012345679,
"eval_balanced_acc": 0.8888888888888888,
"eval_f1": 0.8873239436619719,
"eval_fn": 9,
"eval_fp": 7,
"eval_gmean": 0.8887803753208976,
"eval_loss": 0.32595178484916687,
"eval_matthews_correlation": 0.7780780201274198,
"eval_precision": 0.9,
"eval_recall": 0.875,
"eval_roc_auc": 0.9533179012345679,
"eval_runtime": 1.5845,
"eval_samples_per_second": 90.883,
"eval_specificity": 0.9027777777777778,
"eval_steps_per_second": 0.631,
"eval_tn": 65,
"eval_tp": 63,
"step": 792
},
{
"epoch": 23.0,
"eval_accuracy": 0.9027777777777778,
"eval_auc": 0.9672067901234568,
"eval_balanced_acc": 0.9027777777777778,
"eval_f1": 0.9,
"eval_fn": 9,
"eval_fp": 5,
"eval_gmean": 0.9023503261544882,
"eval_loss": 0.25206753611564636,
"eval_matthews_correlation": 0.806801581908253,
"eval_precision": 0.9264705882352942,
"eval_recall": 0.875,
"eval_roc_auc": 0.9672067901234568,
"eval_runtime": 1.5931,
"eval_samples_per_second": 90.391,
"eval_specificity": 0.9305555555555556,
"eval_steps_per_second": 0.628,
"eval_tn": 67,
"eval_tp": 63,
"step": 828
},
{
"epoch": 24.0,
"eval_accuracy": 0.9166666666666666,
"eval_auc": 0.9457947530864197,
"eval_balanced_acc": 0.9166666666666667,
"eval_f1": 0.9117647058823529,
"eval_fn": 10,
"eval_fp": 2,
"eval_gmean": 0.9149816162222558,
"eval_loss": 0.24512597918510437,
"eval_matthews_correlation": 0.8385254915624211,
"eval_precision": 0.96875,
"eval_recall": 0.8611111111111112,
"eval_roc_auc": 0.9457947530864197,
"eval_runtime": 1.5739,
"eval_samples_per_second": 91.49,
"eval_specificity": 0.9722222222222222,
"eval_steps_per_second": 0.635,
"eval_tn": 70,
"eval_tp": 62,
"step": 864
},
{
"epoch": 25.0,
"eval_accuracy": 0.9097222222222222,
"eval_auc": 0.9637345679012346,
"eval_balanced_acc": 0.9097222222222223,
"eval_f1": 0.9051094890510949,
"eval_fn": 10,
"eval_fp": 3,
"eval_gmean": 0.9084225236537685,
"eval_loss": 0.2579743564128876,
"eval_matthews_correlation": 0.8233448771672452,
"eval_precision": 0.9538461538461539,
"eval_recall": 0.8611111111111112,
"eval_roc_auc": 0.9637345679012346,
"eval_runtime": 1.5981,
"eval_samples_per_second": 90.107,
"eval_specificity": 0.9583333333333334,
"eval_steps_per_second": 0.626,
"eval_tn": 69,
"eval_tp": 62,
"step": 900
},
{
"epoch": 26.0,
"eval_accuracy": 0.9166666666666666,
"eval_auc": 0.9591049382716049,
"eval_balanced_acc": 0.9166666666666667,
"eval_f1": 0.9130434782608695,
"eval_fn": 9,
"eval_fp": 3,
"eval_gmean": 0.9157192073264963,
"eval_loss": 0.23186571896076202,
"eval_matthews_correlation": 0.8362420100070908,
"eval_precision": 0.9545454545454546,
"eval_recall": 0.875,
"eval_roc_auc": 0.9591049382716049,
"eval_runtime": 1.5707,
"eval_samples_per_second": 91.676,
"eval_specificity": 0.9583333333333334,
"eval_steps_per_second": 0.637,
"eval_tn": 69,
"eval_tp": 63,
"step": 936
},
{
"epoch": 27.0,
"eval_accuracy": 0.9097222222222222,
"eval_auc": 0.961033950617284,
"eval_balanced_acc": 0.9097222222222222,
"eval_f1": 0.9037037037037037,
"eval_fn": 11,
"eval_fp": 2,
"eval_gmean": 0.9075727362613634,
"eval_loss": 0.24382635951042175,
"eval_matthews_correlation": 0.8259223669460891,
"eval_precision": 0.9682539682539683,
"eval_recall": 0.8472222222222222,
"eval_roc_auc": 0.961033950617284,
"eval_runtime": 1.5701,
"eval_samples_per_second": 91.714,
"eval_specificity": 0.9722222222222222,
"eval_steps_per_second": 0.637,
"eval_tn": 70,
"eval_tp": 61,
"step": 972
},
{
"epoch": 27.77777777777778,
"grad_norm": 0.2868950664997101,
"learning_rate": 0.00023391812865497074,
"loss": 0.1759,
"step": 1000
},
{
"epoch": 28.0,
"eval_accuracy": 0.9236111111111112,
"eval_auc": 0.9716435185185186,
"eval_balanced_acc": 0.9236111111111112,
"eval_f1": 0.9185185185185185,
"eval_fn": 10,
"eval_fp": 1,
"eval_gmean": 0.9214940230776874,
"eval_loss": 0.21144364774227142,
"eval_matthews_correlation": 0.8539197353171429,
"eval_precision": 0.9841269841269841,
"eval_recall": 0.8611111111111112,
"eval_roc_auc": 0.9716435185185186,
"eval_runtime": 1.5758,
"eval_samples_per_second": 91.382,
"eval_specificity": 0.9861111111111112,
"eval_steps_per_second": 0.635,
"eval_tn": 71,
"eval_tp": 62,
"step": 1008
},
{
"epoch": 29.0,
"eval_accuracy": 0.9236111111111112,
"eval_auc": 0.9670138888888891,
"eval_balanced_acc": 0.9236111111111112,
"eval_f1": 0.9230769230769231,
"eval_fn": 6,
"eval_fp": 5,
"eval_gmean": 0.9235850038081277,
"eval_loss": 0.2606896162033081,
"eval_matthews_correlation": 0.8473039491526416,
"eval_precision": 0.9295774647887324,
"eval_recall": 0.9166666666666666,
"eval_roc_auc": 0.9670138888888891,
"eval_runtime": 1.609,
"eval_samples_per_second": 89.498,
"eval_specificity": 0.9305555555555556,
"eval_steps_per_second": 0.622,
"eval_tn": 67,
"eval_tp": 66,
"step": 1044
},
{
"epoch": 30.0,
"eval_accuracy": 0.9236111111111112,
"eval_auc": 0.9658564814814816,
"eval_balanced_acc": 0.9236111111111112,
"eval_f1": 0.920863309352518,
"eval_fn": 8,
"eval_fp": 3,
"eval_gmean": 0.9229582069908973,
"eval_loss": 0.24626360833644867,
"eval_matthews_correlation": 0.8492725185804906,
"eval_precision": 0.9552238805970149,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.9658564814814816,
"eval_runtime": 1.5802,
"eval_samples_per_second": 91.126,
"eval_specificity": 0.9583333333333334,
"eval_steps_per_second": 0.633,
"eval_tn": 69,
"eval_tp": 64,
"step": 1080
},
{
"epoch": 31.0,
"eval_accuracy": 0.9097222222222222,
"eval_auc": 0.9635416666666667,
"eval_balanced_acc": 0.9097222222222223,
"eval_f1": 0.9051094890510949,
"eval_fn": 10,
"eval_fp": 3,
"eval_gmean": 0.9084225236537685,
"eval_loss": 0.2524122893810272,
"eval_matthews_correlation": 0.8233448771672452,
"eval_precision": 0.9538461538461539,
"eval_recall": 0.8611111111111112,
"eval_roc_auc": 0.9635416666666667,
"eval_runtime": 1.606,
"eval_samples_per_second": 89.664,
"eval_specificity": 0.9583333333333334,
"eval_steps_per_second": 0.623,
"eval_tn": 69,
"eval_tp": 62,
"step": 1116
},
{
"epoch": 32.0,
"eval_accuracy": 0.9236111111111112,
"eval_auc": 0.9363425925925926,
"eval_balanced_acc": 0.9236111111111112,
"eval_f1": 0.9172932330827067,
"eval_fn": 11,
"eval_fp": 0,
"eval_gmean": 0.9204467514322717,
"eval_loss": 0.2489766776561737,
"eval_matthews_correlation": 0.8572862760106127,
"eval_precision": 1.0,
"eval_recall": 0.8472222222222222,
"eval_roc_auc": 0.9363425925925926,
"eval_runtime": 1.6096,
"eval_samples_per_second": 89.462,
"eval_specificity": 1.0,
"eval_steps_per_second": 0.621,
"eval_tn": 72,
"eval_tp": 61,
"step": 1152
},
{
"epoch": 33.0,
"eval_accuracy": 0.9305555555555556,
"eval_auc": 0.9567901234567903,
"eval_balanced_acc": 0.9305555555555556,
"eval_f1": 0.927536231884058,
"eval_fn": 8,
"eval_fp": 2,
"eval_gmean": 0.9296222517045284,
"eval_loss": 0.26165008544921875,
"eval_matthews_correlation": 0.8641167436739938,
"eval_precision": 0.9696969696969697,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.9567901234567903,
"eval_runtime": 1.6127,
"eval_samples_per_second": 89.292,
"eval_specificity": 0.9722222222222222,
"eval_steps_per_second": 0.62,
"eval_tn": 70,
"eval_tp": 64,
"step": 1188
},
{
"epoch": 34.0,
"eval_accuracy": 0.9444444444444444,
"eval_auc": 0.9633487654320988,
"eval_balanced_acc": 0.9444444444444444,
"eval_f1": 0.9411764705882353,
"eval_fn": 8,
"eval_fp": 0,
"eval_gmean": 0.9428090415820634,
"eval_loss": 0.20786191523075104,
"eval_matthews_correlation": 0.8944271909999159,
"eval_precision": 1.0,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.9633487654320988,
"eval_runtime": 1.574,
"eval_samples_per_second": 91.488,
"eval_specificity": 1.0,
"eval_steps_per_second": 0.635,
"eval_tn": 72,
"eval_tp": 64,
"step": 1224
},
{
"epoch": 35.0,
"eval_accuracy": 0.9166666666666666,
"eval_auc": 0.9575617283950617,
"eval_balanced_acc": 0.9166666666666667,
"eval_f1": 0.9090909090909091,
"eval_fn": 12,
"eval_fp": 0,
"eval_gmean": 0.9128709291752769,
"eval_loss": 0.23990610241889954,
"eval_matthews_correlation": 0.8451542547285166,
"eval_precision": 1.0,
"eval_recall": 0.8333333333333334,
"eval_roc_auc": 0.9575617283950617,
"eval_runtime": 1.5748,
"eval_samples_per_second": 91.441,
"eval_specificity": 1.0,
"eval_steps_per_second": 0.635,
"eval_tn": 72,
"eval_tp": 60,
"step": 1260
},
{
"epoch": 36.0,
"eval_accuracy": 0.9236111111111112,
"eval_auc": 0.9538966049382716,
"eval_balanced_acc": 0.9236111111111112,
"eval_f1": 0.9185185185185185,
"eval_fn": 10,
"eval_fp": 1,
"eval_gmean": 0.9214940230776874,
"eval_loss": 0.23596133291721344,
"eval_matthews_correlation": 0.8539197353171429,
"eval_precision": 0.9841269841269841,
"eval_recall": 0.8611111111111112,
"eval_roc_auc": 0.9538966049382716,
"eval_runtime": 1.5725,
"eval_samples_per_second": 91.573,
"eval_specificity": 0.9861111111111112,
"eval_steps_per_second": 0.636,
"eval_tn": 71,
"eval_tp": 62,
"step": 1296
},
{
"epoch": 37.0,
"eval_accuracy": 0.9305555555555556,
"eval_auc": 0.9683641975308642,
"eval_balanced_acc": 0.9305555555555556,
"eval_f1": 0.927536231884058,
"eval_fn": 8,
"eval_fp": 2,
"eval_gmean": 0.9296222517045284,
"eval_loss": 0.24645011126995087,
"eval_matthews_correlation": 0.8641167436739938,
"eval_precision": 0.9696969696969697,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.9683641975308642,
"eval_runtime": 1.5741,
"eval_samples_per_second": 91.483,
"eval_specificity": 0.9722222222222222,
"eval_steps_per_second": 0.635,
"eval_tn": 70,
"eval_tp": 64,
"step": 1332
},
{
"epoch": 38.0,
"eval_accuracy": 0.9375,
"eval_auc": 0.9710648148148149,
"eval_balanced_acc": 0.9375,
"eval_f1": 0.9343065693430657,
"eval_fn": 8,
"eval_fp": 1,
"eval_gmean": 0.9362388636862621,
"eval_loss": 0.20392011106014252,
"eval_matthews_correlation": 0.8791648688396009,
"eval_precision": 0.9846153846153847,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.9710648148148149,
"eval_runtime": 1.5784,
"eval_samples_per_second": 91.233,
"eval_specificity": 0.9861111111111112,
"eval_steps_per_second": 0.634,
"eval_tn": 71,
"eval_tp": 64,
"step": 1368
},
{
"epoch": 39.0,
"eval_accuracy": 0.9375,
"eval_auc": 0.9737654320987655,
"eval_balanced_acc": 0.9375,
"eval_f1": 0.9343065693430657,
"eval_fn": 8,
"eval_fp": 1,
"eval_gmean": 0.9362388636862621,
"eval_loss": 0.1912021040916443,
"eval_matthews_correlation": 0.8791648688396009,
"eval_precision": 0.9846153846153847,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.9737654320987655,
"eval_runtime": 1.5696,
"eval_samples_per_second": 91.745,
"eval_specificity": 0.9861111111111112,
"eval_steps_per_second": 0.637,
"eval_tn": 71,
"eval_tp": 64,
"step": 1404
},
{
"epoch": 40.0,
"eval_accuracy": 0.9444444444444444,
"eval_auc": 0.970679012345679,
"eval_balanced_acc": 0.9444444444444444,
"eval_f1": 0.9411764705882353,
"eval_fn": 8,
"eval_fp": 0,
"eval_gmean": 0.9428090415820634,
"eval_loss": 0.20200136303901672,
"eval_matthews_correlation": 0.8944271909999159,
"eval_precision": 1.0,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.970679012345679,
"eval_runtime": 1.6039,
"eval_samples_per_second": 89.78,
"eval_specificity": 1.0,
"eval_steps_per_second": 0.623,
"eval_tn": 72,
"eval_tp": 64,
"step": 1440
},
{
"epoch": 41.0,
"eval_accuracy": 0.9444444444444444,
"eval_auc": 0.9758873456790124,
"eval_balanced_acc": 0.9444444444444444,
"eval_f1": 0.9411764705882353,
"eval_fn": 8,
"eval_fp": 0,
"eval_gmean": 0.9428090415820634,
"eval_loss": 0.1961589753627777,
"eval_matthews_correlation": 0.8944271909999159,
"eval_precision": 1.0,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.9758873456790124,
"eval_runtime": 1.5711,
"eval_samples_per_second": 91.653,
"eval_specificity": 1.0,
"eval_steps_per_second": 0.636,
"eval_tn": 72,
"eval_tp": 64,
"step": 1476
},
{
"epoch": 41.666666666666664,
"grad_norm": 0.13324905931949615,
"learning_rate": 8.771929824561403e-05,
"loss": 0.1136,
"step": 1500
},
{
"epoch": 42.0,
"eval_accuracy": 0.9444444444444444,
"eval_auc": 0.9751157407407407,
"eval_balanced_acc": 0.9444444444444444,
"eval_f1": 0.9411764705882353,
"eval_fn": 8,
"eval_fp": 0,
"eval_gmean": 0.9428090415820634,
"eval_loss": 0.1993894726037979,
"eval_matthews_correlation": 0.8944271909999159,
"eval_precision": 1.0,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.9751157407407407,
"eval_runtime": 1.5781,
"eval_samples_per_second": 91.25,
"eval_specificity": 1.0,
"eval_steps_per_second": 0.634,
"eval_tn": 72,
"eval_tp": 64,
"step": 1512
},
{
"epoch": 43.0,
"eval_accuracy": 0.9375,
"eval_auc": 0.9810956790123457,
"eval_balanced_acc": 0.9375,
"eval_f1": 0.9343065693430657,
"eval_fn": 8,
"eval_fp": 1,
"eval_gmean": 0.9362388636862621,
"eval_loss": 0.1959426999092102,
"eval_matthews_correlation": 0.8791648688396009,
"eval_precision": 0.9846153846153847,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.9810956790123457,
"eval_runtime": 1.5846,
"eval_samples_per_second": 90.874,
"eval_specificity": 0.9861111111111112,
"eval_steps_per_second": 0.631,
"eval_tn": 71,
"eval_tp": 64,
"step": 1548
},
{
"epoch": 44.0,
"eval_accuracy": 0.9375,
"eval_auc": 0.9824459876543209,
"eval_balanced_acc": 0.9375,
"eval_f1": 0.9343065693430657,
"eval_fn": 8,
"eval_fp": 1,
"eval_gmean": 0.9362388636862621,
"eval_loss": 0.19525253772735596,
"eval_matthews_correlation": 0.8791648688396009,
"eval_precision": 0.9846153846153847,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.9824459876543209,
"eval_runtime": 1.5729,
"eval_samples_per_second": 91.553,
"eval_specificity": 0.9861111111111112,
"eval_steps_per_second": 0.636,
"eval_tn": 71,
"eval_tp": 64,
"step": 1584
},
{
"epoch": 45.0,
"eval_accuracy": 0.9444444444444444,
"eval_auc": 0.9836033950617284,
"eval_balanced_acc": 0.9444444444444444,
"eval_f1": 0.9411764705882353,
"eval_fn": 8,
"eval_fp": 0,
"eval_gmean": 0.9428090415820634,
"eval_loss": 0.19979047775268555,
"eval_matthews_correlation": 0.8944271909999159,
"eval_precision": 1.0,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.9836033950617284,
"eval_runtime": 1.5771,
"eval_samples_per_second": 91.309,
"eval_specificity": 1.0,
"eval_steps_per_second": 0.634,
"eval_tn": 72,
"eval_tp": 64,
"step": 1620
},
{
"epoch": 46.0,
"eval_accuracy": 0.9375,
"eval_auc": 0.9818672839506173,
"eval_balanced_acc": 0.9375,
"eval_f1": 0.9343065693430657,
"eval_fn": 8,
"eval_fp": 1,
"eval_gmean": 0.9362388636862621,
"eval_loss": 0.19916905462741852,
"eval_matthews_correlation": 0.8791648688396009,
"eval_precision": 0.9846153846153847,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.9818672839506173,
"eval_runtime": 1.5731,
"eval_samples_per_second": 91.542,
"eval_specificity": 0.9861111111111112,
"eval_steps_per_second": 0.636,
"eval_tn": 71,
"eval_tp": 64,
"step": 1656
},
{
"epoch": 47.0,
"eval_accuracy": 0.9444444444444444,
"eval_auc": 0.9820601851851852,
"eval_balanced_acc": 0.9444444444444444,
"eval_f1": 0.9411764705882353,
"eval_fn": 8,
"eval_fp": 0,
"eval_gmean": 0.9428090415820634,
"eval_loss": 0.20321370661258698,
"eval_matthews_correlation": 0.8944271909999159,
"eval_precision": 1.0,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.9820601851851852,
"eval_runtime": 1.5764,
"eval_samples_per_second": 91.349,
"eval_specificity": 1.0,
"eval_steps_per_second": 0.634,
"eval_tn": 72,
"eval_tp": 64,
"step": 1692
},
{
"epoch": 48.0,
"eval_accuracy": 0.9444444444444444,
"eval_auc": 0.9809027777777778,
"eval_balanced_acc": 0.9444444444444444,
"eval_f1": 0.9411764705882353,
"eval_fn": 8,
"eval_fp": 0,
"eval_gmean": 0.9428090415820634,
"eval_loss": 0.2023700326681137,
"eval_matthews_correlation": 0.8944271909999159,
"eval_precision": 1.0,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.9809027777777778,
"eval_runtime": 1.5713,
"eval_samples_per_second": 91.644,
"eval_specificity": 1.0,
"eval_steps_per_second": 0.636,
"eval_tn": 72,
"eval_tp": 64,
"step": 1728
},
{
"epoch": 49.0,
"eval_accuracy": 0.9444444444444444,
"eval_auc": 0.9803240740740742,
"eval_balanced_acc": 0.9444444444444444,
"eval_f1": 0.9411764705882353,
"eval_fn": 8,
"eval_fp": 0,
"eval_gmean": 0.9428090415820634,
"eval_loss": 0.20228758454322815,
"eval_matthews_correlation": 0.8944271909999159,
"eval_precision": 1.0,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.9803240740740742,
"eval_runtime": 1.5796,
"eval_samples_per_second": 91.16,
"eval_specificity": 1.0,
"eval_steps_per_second": 0.633,
"eval_tn": 72,
"eval_tp": 64,
"step": 1764
},
{
"epoch": 50.0,
"eval_accuracy": 0.9375,
"eval_auc": 0.9797453703703703,
"eval_balanced_acc": 0.9375,
"eval_f1": 0.9343065693430657,
"eval_fn": 8,
"eval_fp": 1,
"eval_gmean": 0.9362388636862621,
"eval_loss": 0.20149865746498108,
"eval_matthews_correlation": 0.8791648688396009,
"eval_precision": 0.9846153846153847,
"eval_recall": 0.8888888888888888,
"eval_roc_auc": 0.9797453703703703,
"eval_runtime": 1.5697,
"eval_samples_per_second": 91.74,
"eval_specificity": 0.9861111111111112,
"eval_steps_per_second": 0.637,
"eval_tn": 71,
"eval_tp": 64,
"step": 1800
}
],
"logging_steps": 500,
"max_steps": 1800,
"num_input_tokens_seen": 0,
"num_train_epochs": 50,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 7568362736557056.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}