{ "best_metric": 0.646713977167541, "best_model_checkpoint": "/content/drive/MyDrive/Colab Notebooks/ffossils/roberta-finetuned-v6/models/checkpoint-400", "epoch": 14.716981132075471, "global_step": 585, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.25, "learning_rate": 2.0000000000000003e-06, "loss": 2.785, "step": 10 }, { "epoch": 0.5, "learning_rate": 4.000000000000001e-06, "loss": 2.592, "step": 20 }, { "epoch": 0.63, "eval_AGE_f1": 0.0, "eval_AGE_number": 159, "eval_AGE_precision": 0.0, "eval_AGE_recall": 0.0, "eval_ALTI_f1": 0.0, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.0, "eval_ALTI_recall": 0.0, "eval_EMAIL_f1": 0.013565891472868219, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.006958250497017893, "eval_EMAIL_recall": 0.2692307692307692, "eval_GEOG_f1": 0.0, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.0, "eval_GEOG_recall": 0.0, "eval_REGION_f1": 0.0, "eval_REGION_number": 351, "eval_REGION_precision": 0.0, "eval_REGION_recall": 0.0, "eval_SITE_f1": 0.0, "eval_SITE_number": 330, "eval_SITE_precision": 0.0, "eval_SITE_recall": 0.0, "eval_TAXA_f1": 0.0, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.0, "eval_TAXA_recall": 0.0, "eval_accuracy_entity": 0.8152934266033001, "eval_accuracy_token": 0.8152934266033001, "eval_f1_entity": 0.022789506227365072, "eval_f1_token": 0.022789506227365072, "eval_loss": 2.0357258319854736, "eval_overall_accuracy": 0.8141186522133818, "eval_overall_f1": 0.004022988505747126, "eval_overall_precision": 0.0025371511417180137, "eval_overall_recall": 0.009708737864077669, "eval_precision_entity": 0.02199113535629049, "eval_precision_token": 0.02199113535629049, "eval_recall_entity": 0.02364802933088909, "eval_recall_token": 0.02364802933088909, "eval_runtime": 10.2464, "eval_samples_per_second": 18.446, "eval_steps_per_second": 2.342, "step": 25 }, { "epoch": 0.75, "learning_rate": 6e-06, "loss": 1.9963, "step": 30 }, { "epoch": 1.01, "learning_rate": 8.000000000000001e-06, "loss": 0.8245, "step": 40 }, { "epoch": 1.26, "learning_rate": 1e-05, "loss": 0.5512, "step": 50 }, { "epoch": 1.26, "eval_AGE_f1": 0.0, "eval_AGE_number": 159, "eval_AGE_precision": 0.0, "eval_AGE_recall": 0.0, "eval_ALTI_f1": 0.0, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.0, "eval_ALTI_recall": 0.0, "eval_EMAIL_f1": 0.0, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.0, "eval_EMAIL_recall": 0.0, "eval_GEOG_f1": 0.0, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.0, "eval_GEOG_recall": 0.0, "eval_REGION_f1": 0.0, "eval_REGION_number": 351, "eval_REGION_precision": 0.0, "eval_REGION_recall": 0.0, "eval_SITE_f1": 0.0, "eval_SITE_number": 330, "eval_SITE_precision": 0.0, "eval_SITE_recall": 0.0, "eval_TAXA_f1": 0.0, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.0, "eval_TAXA_recall": 0.0, "eval_accuracy_entity": 0.9028853171000872, "eval_accuracy_token": 0.9028853171000872, "eval_f1_entity": 0.0, "eval_f1_token": 0.0, "eval_loss": 0.4787032902240753, "eval_overall_accuracy": 0.9028853171000872, "eval_overall_f1": 0.0, "eval_overall_precision": 0.0, "eval_overall_recall": 0.0, "eval_precision_entity": 0.0, "eval_precision_token": 0.0, "eval_recall_entity": 0.0, "eval_recall_token": 0.0, "eval_runtime": 10.1567, "eval_samples_per_second": 18.608, "eval_steps_per_second": 2.363, "step": 50 }, { "epoch": 1.51, "learning_rate": 1.2e-05, "loss": 0.4716, "step": 60 }, { "epoch": 1.76, "learning_rate": 1.4e-05, "loss": 0.3759, "step": 70 }, { "epoch": 1.89, "eval_AGE_f1": 0.0, "eval_AGE_number": 159, "eval_AGE_precision": 0.0, "eval_AGE_recall": 0.0, "eval_ALTI_f1": 0.0, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.0, "eval_ALTI_recall": 0.0, "eval_EMAIL_f1": 0.0, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.0, "eval_EMAIL_recall": 0.0, "eval_GEOG_f1": 0.0, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.0, "eval_GEOG_recall": 0.0, "eval_REGION_f1": 0.0, "eval_REGION_number": 351, "eval_REGION_precision": 0.0, "eval_REGION_recall": 0.0, "eval_SITE_f1": 0.0, "eval_SITE_number": 330, "eval_SITE_precision": 0.0, "eval_SITE_recall": 0.0, "eval_TAXA_f1": 0.4575645756457565, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.44364937388193204, "eval_TAXA_recall": 0.4723809523809524, "eval_accuracy_entity": 0.9267723963617593, "eval_accuracy_token": 0.9267723963617593, "eval_f1_entity": 0.45445053510832684, "eval_f1_token": 0.45445053510832684, "eval_loss": 0.28952518105506897, "eval_overall_accuracy": 0.9190651643794165, "eval_overall_f1": 0.23732057416267943, "eval_overall_precision": 0.38271604938271603, "eval_overall_recall": 0.17198335644937587, "eval_precision_entity": 0.7888536474852741, "eval_precision_token": 0.7888536474852741, "eval_recall_entity": 0.3191567369385884, "eval_recall_token": 0.3191567369385884, "eval_runtime": 10.7946, "eval_samples_per_second": 17.509, "eval_steps_per_second": 2.223, "step": 75 }, { "epoch": 2.01, "learning_rate": 1.6000000000000003e-05, "loss": 0.3221, "step": 80 }, { "epoch": 2.26, "learning_rate": 1.8e-05, "loss": 0.2555, "step": 90 }, { "epoch": 2.52, "learning_rate": 2e-05, "loss": 0.2161, "step": 100 }, { "epoch": 2.52, "eval_AGE_f1": 0.36414565826330536, "eval_AGE_number": 159, "eval_AGE_precision": 0.3282828282828283, "eval_AGE_recall": 0.4088050314465409, "eval_ALTI_f1": 0.0, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.0, "eval_ALTI_recall": 0.0, "eval_EMAIL_f1": 0.0, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.0, "eval_EMAIL_recall": 0.0, "eval_GEOG_f1": 0.058823529411764705, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.04, "eval_GEOG_recall": 0.1111111111111111, "eval_REGION_f1": 0.25806451612903225, "eval_REGION_number": 351, "eval_REGION_precision": 0.1907356948228883, "eval_REGION_recall": 0.39886039886039887, "eval_SITE_f1": 0.028925619834710745, "eval_SITE_number": 330, "eval_SITE_precision": 0.045454545454545456, "eval_SITE_recall": 0.021212121212121213, "eval_TAXA_f1": 0.6412859560067682, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.5768645357686454, "eval_TAXA_recall": 0.7219047619047619, "eval_accuracy_entity": 0.943005642476994, "eval_accuracy_token": 0.943005642476994, "eval_f1_entity": 0.654824165915239, "eval_f1_token": 0.654824165915239, "eval_loss": 0.20675021409988403, "eval_overall_accuracy": 0.9366867802281911, "eval_overall_f1": 0.3688473520249221, "eval_overall_precision": 0.334841628959276, "eval_overall_recall": 0.4105409153952843, "eval_precision_entity": 0.6443655723158829, "eval_precision_token": 0.6443655723158829, "eval_recall_entity": 0.6656278643446379, "eval_recall_token": 0.6656278643446379, "eval_runtime": 11.4868, "eval_samples_per_second": 16.454, "eval_steps_per_second": 2.089, "step": 100 }, { "epoch": 2.77, "learning_rate": 1.9587628865979382e-05, "loss": 0.1805, "step": 110 }, { "epoch": 3.02, "learning_rate": 1.9175257731958766e-05, "loss": 0.1729, "step": 120 }, { "epoch": 3.14, "eval_AGE_f1": 0.47398843930635837, "eval_AGE_number": 159, "eval_AGE_precision": 0.4385026737967914, "eval_AGE_recall": 0.5157232704402516, "eval_ALTI_f1": 0.0, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.0, "eval_ALTI_recall": 0.0, "eval_EMAIL_f1": 0.0, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.0, "eval_EMAIL_recall": 0.0, "eval_GEOG_f1": 0.2758620689655173, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.2, "eval_GEOG_recall": 0.4444444444444444, "eval_REGION_f1": 0.3544813695871098, "eval_REGION_number": 351, "eval_REGION_precision": 0.27414330218068533, "eval_REGION_recall": 0.5014245014245015, "eval_SITE_f1": 0.14779874213836475, "eval_SITE_number": 330, "eval_SITE_precision": 0.15359477124183007, "eval_SITE_recall": 0.14242424242424243, "eval_TAXA_f1": 0.7314578005115089, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.6620370370370371, "eval_TAXA_recall": 0.8171428571428572, "eval_accuracy_entity": 0.9479539346042256, "eval_accuracy_token": 0.9479539346042256, "eval_f1_entity": 0.7052475850665739, "eval_f1_token": 0.7052475850665739, "eval_loss": 0.16586871445178986, "eval_overall_accuracy": 0.9440380199711647, "eval_overall_f1": 0.4548536209553159, "eval_overall_precision": 0.40931780366056575, "eval_overall_recall": 0.5117891816920943, "eval_precision_entity": 0.6713055003313453, "eval_precision_token": 0.6713055003313453, "eval_recall_entity": 0.7428047662694776, "eval_recall_token": 0.7428047662694776, "eval_runtime": 12.6888, "eval_samples_per_second": 14.895, "eval_steps_per_second": 1.891, "step": 125 }, { "epoch": 3.27, "learning_rate": 1.8762886597938147e-05, "loss": 0.1471, "step": 130 }, { "epoch": 3.52, "learning_rate": 1.8350515463917527e-05, "loss": 0.1384, "step": 140 }, { "epoch": 3.77, "learning_rate": 1.793814432989691e-05, "loss": 0.1233, "step": 150 }, { "epoch": 3.77, "eval_AGE_f1": 0.42245989304812837, "eval_AGE_number": 159, "eval_AGE_precision": 0.3674418604651163, "eval_AGE_recall": 0.4968553459119497, "eval_ALTI_f1": 0.0, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.0, "eval_ALTI_recall": 0.0, "eval_EMAIL_f1": 0.17543859649122806, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 1.0, "eval_EMAIL_recall": 0.09615384615384616, "eval_GEOG_f1": 0.3703703703703704, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.2777777777777778, "eval_GEOG_recall": 0.5555555555555556, "eval_REGION_f1": 0.43149946062567424, "eval_REGION_number": 351, "eval_REGION_precision": 0.3472222222222222, "eval_REGION_recall": 0.5698005698005698, "eval_SITE_f1": 0.2934472934472935, "eval_SITE_number": 330, "eval_SITE_precision": 0.2768817204301075, "eval_SITE_recall": 0.31212121212121213, "eval_TAXA_f1": 0.7345890410958905, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.6671850699844479, "eval_TAXA_recall": 0.8171428571428572, "eval_accuracy_entity": 0.9522080418646873, "eval_accuracy_token": 0.9522080418646873, "eval_f1_entity": 0.7402282947077135, "eval_f1_token": 0.7402282947077135, "eval_loss": 0.14876657724380493, "eval_overall_accuracy": 0.9501076876524092, "eval_overall_f1": 0.5018337408312958, "eval_overall_precision": 0.4486338797814208, "eval_overall_recall": 0.5693481276005548, "eval_precision_entity": 0.7006056637747585, "eval_precision_token": 0.7006056637747585, "eval_recall_entity": 0.7846012832263978, "eval_recall_token": 0.7846012832263978, "eval_runtime": 11.4316, "eval_samples_per_second": 16.533, "eval_steps_per_second": 2.099, "step": 150 }, { "epoch": 4.03, "learning_rate": 1.752577319587629e-05, "loss": 0.1231, "step": 160 }, { "epoch": 4.28, "learning_rate": 1.7113402061855672e-05, "loss": 0.1084, "step": 170 }, { "epoch": 4.4, "eval_AGE_f1": 0.6049046321525886, "eval_AGE_number": 159, "eval_AGE_precision": 0.5336538461538461, "eval_AGE_recall": 0.6981132075471698, "eval_ALTI_f1": 0.0, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.0, "eval_ALTI_recall": 0.0, "eval_EMAIL_f1": 0.5555555555555556, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 1.0, "eval_EMAIL_recall": 0.38461538461538464, "eval_GEOG_f1": 0.33333333333333326, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.23809523809523808, "eval_GEOG_recall": 0.5555555555555556, "eval_REGION_f1": 0.4647887323943662, "eval_REGION_number": 351, "eval_REGION_precision": 0.39520958083832336, "eval_REGION_recall": 0.5641025641025641, "eval_SITE_f1": 0.3371104815864023, "eval_SITE_number": 330, "eval_SITE_precision": 0.31648936170212766, "eval_SITE_recall": 0.3606060606060606, "eval_TAXA_f1": 0.776173285198556, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.7375643224699828, "eval_TAXA_recall": 0.819047619047619, "eval_accuracy_entity": 0.955144977839483, "eval_accuracy_token": 0.955144977839483, "eval_f1_entity": 0.7561658212349135, "eval_f1_token": 0.7561658212349135, "eval_loss": 0.137845978140831, "eval_overall_accuracy": 0.9533828162546056, "eval_overall_f1": 0.5576255131038838, "eval_overall_precision": 0.5118840579710144, "eval_overall_recall": 0.6123439667128987, "eval_precision_entity": 0.7230306071249373, "eval_precision_token": 0.7230306071249373, "eval_recall_entity": 0.7924839596700275, "eval_recall_token": 0.7924839596700275, "eval_runtime": 12.8578, "eval_samples_per_second": 14.699, "eval_steps_per_second": 1.867, "step": 175 }, { "epoch": 4.53, "learning_rate": 1.6701030927835052e-05, "loss": 0.1, "step": 180 }, { "epoch": 4.78, "learning_rate": 1.6288659793814433e-05, "loss": 0.1068, "step": 190 }, { "epoch": 5.03, "learning_rate": 1.5876288659793813e-05, "loss": 0.0984, "step": 200 }, { "epoch": 5.03, "eval_AGE_f1": 0.672316384180791, "eval_AGE_number": 159, "eval_AGE_precision": 0.6102564102564103, "eval_AGE_recall": 0.7484276729559748, "eval_ALTI_f1": 0.06060606060606061, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.058823529411764705, "eval_ALTI_recall": 0.0625, "eval_EMAIL_f1": 0.7826086956521738, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.9, "eval_EMAIL_recall": 0.6923076923076923, "eval_GEOG_f1": 0.42857142857142855, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.3157894736842105, "eval_GEOG_recall": 0.6666666666666666, "eval_REGION_f1": 0.44173140954495005, "eval_REGION_number": 351, "eval_REGION_precision": 0.3618181818181818, "eval_REGION_recall": 0.5669515669515669, "eval_SITE_f1": 0.4200792602377807, "eval_SITE_number": 330, "eval_SITE_precision": 0.37236533957845436, "eval_SITE_recall": 0.4818181818181818, "eval_TAXA_f1": 0.7944954128440367, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.7663716814159292, "eval_TAXA_recall": 0.8247619047619048, "eval_accuracy_entity": 0.9572097328278244, "eval_accuracy_token": 0.9572097328278244, "eval_f1_entity": 0.7708746230073245, "eval_f1_token": 0.7708746230073245, "eval_loss": 0.13383713364601135, "eval_overall_accuracy": 0.9555721685267261, "eval_overall_f1": 0.5855606758832566, "eval_overall_precision": 0.5256480970766685, "eval_overall_recall": 0.6608876560332871, "eval_precision_entity": 0.7273170731707317, "eval_precision_token": 0.7273170731707317, "eval_recall_entity": 0.8199816681943172, "eval_recall_token": 0.8199816681943172, "eval_runtime": 9.949, "eval_samples_per_second": 18.997, "eval_steps_per_second": 2.412, "step": 200 }, { "epoch": 5.28, "learning_rate": 1.5463917525773197e-05, "loss": 0.0887, "step": 210 }, { "epoch": 5.53, "learning_rate": 1.5051546391752578e-05, "loss": 0.0872, "step": 220 }, { "epoch": 5.66, "eval_AGE_f1": 0.6319018404907976, "eval_AGE_number": 159, "eval_AGE_precision": 0.6167664670658682, "eval_AGE_recall": 0.6477987421383647, "eval_ALTI_f1": 0.07407407407407407, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.09090909090909091, "eval_ALTI_recall": 0.0625, "eval_EMAIL_f1": 0.9622641509433962, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.9444444444444444, "eval_EMAIL_recall": 0.9807692307692307, "eval_GEOG_f1": 0.3870967741935484, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.2727272727272727, "eval_GEOG_recall": 0.6666666666666666, "eval_REGION_f1": 0.4956709956709957, "eval_REGION_number": 351, "eval_REGION_precision": 0.39965095986038396, "eval_REGION_recall": 0.6524216524216524, "eval_SITE_f1": 0.4276048714479026, "eval_SITE_number": 330, "eval_SITE_precision": 0.3863080684596577, "eval_SITE_recall": 0.47878787878787876, "eval_TAXA_f1": 0.7708703374777975, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.7221297836938436, "eval_TAXA_recall": 0.8266666666666667, "eval_accuracy_entity": 0.9552339758993253, "eval_accuracy_token": 0.9552339758993253, "eval_f1_entity": 0.7587956698240865, "eval_f1_token": 0.7587956698240865, "eval_loss": 0.14531326293945312, "eval_overall_accuracy": 0.9539702034495648, "eval_overall_f1": 0.598963098505642, "eval_overall_precision": 0.5345672291780076, "eval_overall_recall": 0.680998613037448, "eval_precision_entity": 0.7043491913958235, "eval_precision_token": 0.7043491913958235, "eval_recall_entity": 0.8223648029330889, "eval_recall_token": 0.8223648029330889, "eval_runtime": 10.0713, "eval_samples_per_second": 18.766, "eval_steps_per_second": 2.383, "step": 225 }, { "epoch": 5.79, "learning_rate": 1.4639175257731958e-05, "loss": 0.086, "step": 230 }, { "epoch": 6.04, "learning_rate": 1.4226804123711342e-05, "loss": 0.0789, "step": 240 }, { "epoch": 6.29, "learning_rate": 1.3814432989690723e-05, "loss": 0.0713, "step": 250 }, { "epoch": 6.29, "eval_AGE_f1": 0.6857142857142857, "eval_AGE_number": 159, "eval_AGE_precision": 0.6282722513089005, "eval_AGE_recall": 0.7547169811320755, "eval_ALTI_f1": 0.07142857142857144, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.08333333333333333, "eval_ALTI_recall": 0.0625, "eval_EMAIL_f1": 0.859504132231405, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.7536231884057971, "eval_EMAIL_recall": 1.0, "eval_GEOG_f1": 0.4, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.2857142857142857, "eval_GEOG_recall": 0.6666666666666666, "eval_REGION_f1": 0.49940262843488653, "eval_REGION_number": 351, "eval_REGION_precision": 0.43004115226337447, "eval_REGION_recall": 0.5954415954415955, "eval_SITE_f1": 0.4341736694677871, "eval_SITE_number": 330, "eval_SITE_precision": 0.4036458333333333, "eval_SITE_recall": 0.4696969696969697, "eval_TAXA_f1": 0.7922437673130194, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.7688172043010753, "eval_TAXA_recall": 0.8171428571428572, "eval_accuracy_entity": 0.9578683184706573, "eval_accuracy_token": 0.9578683184706573, "eval_f1_entity": 0.768325871301905, "eval_f1_token": 0.768325871301905, "eval_loss": 0.1395871937274933, "eval_overall_accuracy": 0.9568181413645183, "eval_overall_f1": 0.6146063863420803, "eval_overall_precision": 0.5647879140034864, "eval_overall_recall": 0.6740638002773925, "eval_precision_entity": 0.7371967654986523, "eval_precision_token": 0.7371967654986523, "eval_recall_entity": 0.8021998166819432, "eval_recall_token": 0.8021998166819432, "eval_runtime": 12.126, "eval_samples_per_second": 15.586, "eval_steps_per_second": 1.979, "step": 250 }, { "epoch": 6.54, "learning_rate": 1.3402061855670103e-05, "loss": 0.0761, "step": 260 }, { "epoch": 6.79, "learning_rate": 1.2989690721649485e-05, "loss": 0.0715, "step": 270 }, { "epoch": 6.92, "eval_AGE_f1": 0.7211267605633802, "eval_AGE_number": 159, "eval_AGE_precision": 0.6530612244897959, "eval_AGE_recall": 0.8050314465408805, "eval_ALTI_f1": 0.13333333333333333, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.14285714285714285, "eval_ALTI_recall": 0.125, "eval_EMAIL_f1": 0.8455284552845529, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.7323943661971831, "eval_EMAIL_recall": 1.0, "eval_GEOG_f1": 0.3870967741935484, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.2727272727272727, "eval_GEOG_recall": 0.6666666666666666, "eval_REGION_f1": 0.5431818181818181, "eval_REGION_number": 351, "eval_REGION_precision": 0.45179584120982985, "eval_REGION_recall": 0.6809116809116809, "eval_SITE_f1": 0.45517241379310347, "eval_SITE_number": 330, "eval_SITE_precision": 0.4177215189873418, "eval_SITE_recall": 0.5, "eval_TAXA_f1": 0.7958412098298677, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.7898686679174484, "eval_TAXA_recall": 0.8019047619047619, "eval_accuracy_entity": 0.9568893398123921, "eval_accuracy_token": 0.9568893398123921, "eval_f1_entity": 0.7651905252317198, "eval_f1_token": 0.7651905252317198, "eval_loss": 0.14375238120555878, "eval_overall_accuracy": 0.9557857638703476, "eval_overall_f1": 0.6327295440349782, "eval_overall_precision": 0.5755681818181818, "eval_overall_recall": 0.70249653259362, "eval_precision_entity": 0.7193803453283847, "eval_precision_token": 0.7193803453283847, "eval_recall_entity": 0.8172318973418882, "eval_recall_token": 0.8172318973418882, "eval_runtime": 12.8036, "eval_samples_per_second": 14.761, "eval_steps_per_second": 1.874, "step": 275 }, { "epoch": 7.04, "learning_rate": 1.2577319587628866e-05, "loss": 0.0779, "step": 280 }, { "epoch": 7.3, "learning_rate": 1.2164948453608248e-05, "loss": 0.0652, "step": 290 }, { "epoch": 7.55, "learning_rate": 1.175257731958763e-05, "loss": 0.0651, "step": 300 }, { "epoch": 7.55, "eval_AGE_f1": 0.7202380952380952, "eval_AGE_number": 159, "eval_AGE_precision": 0.6836158192090396, "eval_AGE_recall": 0.7610062893081762, "eval_ALTI_f1": 0.06896551724137931, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.07692307692307693, "eval_ALTI_recall": 0.0625, "eval_EMAIL_f1": 0.7428571428571429, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.5909090909090909, "eval_EMAIL_recall": 1.0, "eval_GEOG_f1": 0.42857142857142855, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.3157894736842105, "eval_GEOG_recall": 0.6666666666666666, "eval_REGION_f1": 0.5471478463329453, "eval_REGION_number": 351, "eval_REGION_precision": 0.4625984251968504, "eval_REGION_recall": 0.6695156695156695, "eval_SITE_f1": 0.4159544159544159, "eval_SITE_number": 330, "eval_SITE_precision": 0.3924731182795699, "eval_SITE_recall": 0.44242424242424244, "eval_TAXA_f1": 0.8036697247706422, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.7752212389380531, "eval_TAXA_recall": 0.8342857142857143, "eval_accuracy_entity": 0.9569427386482975, "eval_accuracy_token": 0.9569427386482975, "eval_f1_entity": 0.7655160390516038, "eval_f1_token": 0.7655160390516038, "eval_loss": 0.13883507251739502, "eval_overall_accuracy": 0.9559281607660953, "eval_overall_f1": 0.6275125628140703, "eval_overall_precision": 0.5734787600459242, "eval_overall_recall": 0.6927877947295423, "eval_precision_entity": 0.7297656639521356, "eval_precision_token": 0.7297656639521356, "eval_recall_entity": 0.8049495875343722, "eval_recall_token": 0.8049495875343722, "eval_runtime": 10.0268, "eval_samples_per_second": 18.85, "eval_steps_per_second": 2.394, "step": 300 }, { "epoch": 7.8, "learning_rate": 1.134020618556701e-05, "loss": 0.0616, "step": 310 }, { "epoch": 8.05, "learning_rate": 1.0927835051546391e-05, "loss": 0.0629, "step": 320 }, { "epoch": 8.18, "eval_AGE_f1": 0.702857142857143, "eval_AGE_number": 159, "eval_AGE_precision": 0.643979057591623, "eval_AGE_recall": 0.7735849056603774, "eval_ALTI_f1": 0.07692307692307693, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.1, "eval_ALTI_recall": 0.0625, "eval_EMAIL_f1": 0.787878787878788, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.65, "eval_EMAIL_recall": 1.0, "eval_GEOG_f1": 0.41379310344827586, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.3, "eval_GEOG_recall": 0.6666666666666666, "eval_REGION_f1": 0.5244040862656072, "eval_REGION_number": 351, "eval_REGION_precision": 0.4358490566037736, "eval_REGION_recall": 0.6581196581196581, "eval_SITE_f1": 0.39538239538239534, "eval_SITE_number": 330, "eval_SITE_precision": 0.3774104683195592, "eval_SITE_recall": 0.41515151515151516, "eval_TAXA_f1": 0.7945701357466064, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.756896551724138, "eval_TAXA_recall": 0.8361904761904762, "eval_accuracy_entity": 0.9557857638703476, "eval_accuracy_token": 0.9557857638703476, "eval_f1_entity": 0.7590018133149123, "eval_f1_token": 0.7590018133149123, "eval_loss": 0.14412528276443481, "eval_overall_accuracy": 0.9548245848240509, "eval_overall_f1": 0.6150497512437811, "eval_overall_precision": 0.5574971815107103, "eval_overall_recall": 0.6858529819694869, "eval_precision_entity": 0.7174338883447601, "eval_precision_token": 0.7174338883447601, "eval_recall_entity": 0.8056828597616865, "eval_recall_token": 0.8056828597616865, "eval_runtime": 10.4306, "eval_samples_per_second": 18.12, "eval_steps_per_second": 2.301, "step": 325 }, { "epoch": 8.3, "learning_rate": 1.0515463917525775e-05, "loss": 0.0556, "step": 330 }, { "epoch": 8.55, "learning_rate": 1.0103092783505156e-05, "loss": 0.0609, "step": 340 }, { "epoch": 8.81, "learning_rate": 9.690721649484536e-06, "loss": 0.0558, "step": 350 }, { "epoch": 8.81, "eval_AGE_f1": 0.6822157434402333, "eval_AGE_number": 159, "eval_AGE_precision": 0.6358695652173914, "eval_AGE_recall": 0.7358490566037735, "eval_ALTI_f1": 0.12121212121212122, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.11764705882352941, "eval_ALTI_recall": 0.125, "eval_EMAIL_f1": 0.7482014388489209, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.5977011494252874, "eval_EMAIL_recall": 1.0, "eval_GEOG_f1": 0.37500000000000006, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.2608695652173913, "eval_GEOG_recall": 0.6666666666666666, "eval_REGION_f1": 0.5439429928741093, "eval_REGION_number": 351, "eval_REGION_precision": 0.4663951120162933, "eval_REGION_recall": 0.6524216524216524, "eval_SITE_f1": 0.4425531914893617, "eval_SITE_number": 330, "eval_SITE_precision": 0.416, "eval_SITE_recall": 0.4727272727272727, "eval_TAXA_f1": 0.7924865831842576, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.7470489038785835, "eval_TAXA_recall": 0.8438095238095238, "eval_accuracy_entity": 0.9551983766753884, "eval_accuracy_token": 0.9551983766753884, "eval_f1_entity": 0.7571195044308698, "eval_f1_token": 0.7571195044308698, "eval_loss": 0.14811000227928162, "eval_overall_accuracy": 0.9542371976290916, "eval_overall_f1": 0.6257783312577834, "eval_overall_precision": 0.5677966101694916, "eval_overall_recall": 0.6969486823855756, "eval_precision_entity": 0.7133592736705577, "eval_precision_token": 0.7133592736705577, "eval_recall_entity": 0.8065994500458296, "eval_recall_token": 0.8065994500458296, "eval_runtime": 11.3308, "eval_samples_per_second": 16.68, "eval_steps_per_second": 2.118, "step": 350 }, { "epoch": 9.06, "learning_rate": 9.278350515463918e-06, "loss": 0.0597, "step": 360 }, { "epoch": 9.31, "learning_rate": 8.865979381443299e-06, "loss": 0.056, "step": 370 }, { "epoch": 9.43, "eval_AGE_f1": 0.7079646017699115, "eval_AGE_number": 159, "eval_AGE_precision": 0.6666666666666666, "eval_AGE_recall": 0.7547169811320755, "eval_ALTI_f1": 0.15384615384615385, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.2, "eval_ALTI_recall": 0.125, "eval_EMAIL_f1": 0.6666666666666666, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.5, "eval_EMAIL_recall": 1.0, "eval_GEOG_f1": 0.4, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.2857142857142857, "eval_GEOG_recall": 0.6666666666666666, "eval_REGION_f1": 0.5555555555555556, "eval_REGION_number": 351, "eval_REGION_precision": 0.4613935969868173, "eval_REGION_recall": 0.698005698005698, "eval_SITE_f1": 0.47632311977715874, "eval_SITE_number": 330, "eval_SITE_precision": 0.44072164948453607, "eval_SITE_recall": 0.5181818181818182, "eval_TAXA_f1": 0.8040109389243391, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.7709790209790209, "eval_TAXA_recall": 0.84, "eval_accuracy_entity": 0.9559993592139692, "eval_accuracy_token": 0.9559993592139692, "eval_f1_entity": 0.7634735597229263, "eval_f1_token": 0.7634735597229263, "eval_loss": 0.15191707015037537, "eval_overall_accuracy": 0.9548779836599562, "eval_overall_f1": 0.6385467980295567, "eval_overall_precision": 0.5741971207087486, "eval_overall_recall": 0.7191400832177531, "eval_precision_entity": 0.7079743067523109, "eval_precision_token": 0.7079743067523109, "eval_recall_entity": 0.8284142988084326, "eval_recall_token": 0.8284142988084326, "eval_runtime": 9.9604, "eval_samples_per_second": 18.975, "eval_steps_per_second": 2.41, "step": 375 }, { "epoch": 9.56, "learning_rate": 8.453608247422681e-06, "loss": 0.0579, "step": 380 }, { "epoch": 9.81, "learning_rate": 8.041237113402063e-06, "loss": 0.0499, "step": 390 }, { "epoch": 10.06, "learning_rate": 7.628865979381444e-06, "loss": 0.0529, "step": 400 }, { "epoch": 10.06, "eval_AGE_f1": 0.7025495750708216, "eval_AGE_number": 159, "eval_AGE_precision": 0.6391752577319587, "eval_AGE_recall": 0.779874213836478, "eval_ALTI_f1": 0.3225806451612903, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.3333333333333333, "eval_ALTI_recall": 0.3125, "eval_EMAIL_f1": 0.7819548872180451, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.6419753086419753, "eval_EMAIL_recall": 1.0, "eval_GEOG_f1": 0.4, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.2857142857142857, "eval_GEOG_recall": 0.6666666666666666, "eval_REGION_f1": 0.5511811023622047, "eval_REGION_number": 351, "eval_REGION_precision": 0.45539033457249073, "eval_REGION_recall": 0.698005698005698, "eval_SITE_f1": 0.4936530324400564, "eval_SITE_number": 330, "eval_SITE_precision": 0.46174142480211083, "eval_SITE_recall": 0.5303030303030303, "eval_TAXA_f1": 0.8047445255474452, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.7723292469352014, "eval_TAXA_recall": 0.84, "eval_accuracy_entity": 0.9571207347679821, "eval_accuracy_token": 0.9571207347679821, "eval_f1_entity": 0.7682700421940929, "eval_f1_token": 0.7682700421940929, "eval_loss": 0.154266357421875, "eval_overall_accuracy": 0.9559993592139692, "eval_overall_f1": 0.646713977167541, "eval_overall_precision": 0.5825458588104503, "eval_overall_recall": 0.7267683772538142, "eval_precision_entity": 0.7118060985144644, "eval_precision_token": 0.7118060985144644, "eval_recall_entity": 0.8344637946837764, "eval_recall_token": 0.8344637946837764, "eval_runtime": 10.1935, "eval_samples_per_second": 18.541, "eval_steps_per_second": 2.354, "step": 400 }, { "epoch": 10.31, "learning_rate": 7.216494845360825e-06, "loss": 0.0504, "step": 410 }, { "epoch": 10.57, "learning_rate": 6.804123711340207e-06, "loss": 0.0527, "step": 420 }, { "epoch": 10.69, "eval_AGE_f1": 0.6966292134831462, "eval_AGE_number": 159, "eval_AGE_precision": 0.6294416243654822, "eval_AGE_recall": 0.779874213836478, "eval_ALTI_f1": 0.2962962962962963, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.36363636363636365, "eval_ALTI_recall": 0.25, "eval_EMAIL_f1": 0.7938931297709924, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.6582278481012658, "eval_EMAIL_recall": 1.0, "eval_GEOG_f1": 0.37500000000000006, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.2608695652173913, "eval_GEOG_recall": 0.6666666666666666, "eval_REGION_f1": 0.5187878787878788, "eval_REGION_number": 351, "eval_REGION_precision": 0.45147679324894513, "eval_REGION_recall": 0.6096866096866097, "eval_SITE_f1": 0.36940836940836935, "eval_SITE_number": 330, "eval_SITE_precision": 0.3526170798898072, "eval_SITE_recall": 0.3878787878787879, "eval_TAXA_f1": 0.7914735866543096, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.7707581227436823, "eval_TAXA_recall": 0.8133333333333334, "eval_accuracy_entity": 0.9547355867642086, "eval_accuracy_token": 0.9547355867642086, "eval_f1_entity": 0.7530343007915568, "eval_f1_token": 0.7530343007915568, "eval_loss": 0.15111711621284485, "eval_overall_accuracy": 0.9537744077179118, "eval_overall_f1": 0.6076996500159084, "eval_overall_precision": 0.5614344503233392, "eval_overall_recall": 0.6622746185852982, "eval_precision_entity": 0.7237531699070161, "eval_precision_token": 0.7237531699070161, "eval_recall_entity": 0.7847846012832264, "eval_recall_token": 0.7847846012832264, "eval_runtime": 10.0406, "eval_samples_per_second": 18.824, "eval_steps_per_second": 2.39, "step": 425 }, { "epoch": 10.82, "learning_rate": 6.391752577319588e-06, "loss": 0.0483, "step": 430 }, { "epoch": 11.07, "learning_rate": 5.979381443298969e-06, "loss": 0.0487, "step": 440 }, { "epoch": 11.32, "learning_rate": 5.567010309278351e-06, "loss": 0.0508, "step": 450 }, { "epoch": 11.32, "eval_AGE_f1": 0.7130434782608696, "eval_AGE_number": 159, "eval_AGE_precision": 0.6612903225806451, "eval_AGE_recall": 0.7735849056603774, "eval_ALTI_f1": 0.21428571428571427, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.25, "eval_ALTI_recall": 0.1875, "eval_EMAIL_f1": 0.7428571428571429, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.5909090909090909, "eval_EMAIL_recall": 1.0, "eval_GEOG_f1": 0.4, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.2857142857142857, "eval_GEOG_recall": 0.6666666666666666, "eval_REGION_f1": 0.525030525030525, "eval_REGION_number": 351, "eval_REGION_precision": 0.4594017094017094, "eval_REGION_recall": 0.6125356125356125, "eval_SITE_f1": 0.38904899135446686, "eval_SITE_number": 330, "eval_SITE_precision": 0.3708791208791209, "eval_SITE_recall": 0.4090909090909091, "eval_TAXA_f1": 0.7802197802197802, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.7513227513227513, "eval_TAXA_recall": 0.8114285714285714, "eval_accuracy_entity": 0.9558925615421584, "eval_accuracy_token": 0.9558925615421584, "eval_f1_entity": 0.7576967438559136, "eval_f1_token": 0.7576967438559136, "eval_loss": 0.15142428874969482, "eval_overall_accuracy": 0.9549135828838932, "eval_overall_f1": 0.6099110546378654, "eval_overall_precision": 0.5627198124267292, "eval_overall_recall": 0.665742024965326, "eval_precision_entity": 0.734181568088033, "eval_precision_token": 0.734181568088033, "eval_recall_entity": 0.7827681026581118, "eval_recall_token": 0.7827681026581118, "eval_runtime": 9.85, "eval_samples_per_second": 19.188, "eval_steps_per_second": 2.437, "step": 450 }, { "epoch": 11.57, "learning_rate": 5.154639175257732e-06, "loss": 0.0464, "step": 460 }, { "epoch": 11.82, "learning_rate": 4.742268041237113e-06, "loss": 0.0459, "step": 470 }, { "epoch": 11.95, "eval_AGE_f1": 0.6956521739130435, "eval_AGE_number": 159, "eval_AGE_precision": 0.6451612903225806, "eval_AGE_recall": 0.7547169811320755, "eval_ALTI_f1": 0.13793103448275862, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.15384615384615385, "eval_ALTI_recall": 0.125, "eval_EMAIL_f1": 0.732394366197183, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.5777777777777777, "eval_EMAIL_recall": 1.0, "eval_GEOG_f1": 0.3870967741935484, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.2727272727272727, "eval_GEOG_recall": 0.6666666666666666, "eval_REGION_f1": 0.5467980295566502, "eval_REGION_number": 351, "eval_REGION_precision": 0.48156182212581344, "eval_REGION_recall": 0.6324786324786325, "eval_SITE_f1": 0.41466854724964736, "eval_SITE_number": 330, "eval_SITE_precision": 0.38786279683377306, "eval_SITE_recall": 0.44545454545454544, "eval_TAXA_f1": 0.7944700460829494, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.7696428571428572, "eval_TAXA_recall": 0.820952380952381, "eval_accuracy_entity": 0.9552161762873569, "eval_accuracy_token": 0.9552161762873569, "eval_f1_entity": 0.7573407684935088, "eval_f1_token": 0.7573407684935088, "eval_loss": 0.15560036897659302, "eval_overall_accuracy": 0.9541481995692493, "eval_overall_f1": 0.6216301934665398, "eval_overall_precision": 0.5727644652250146, "eval_overall_recall": 0.6796116504854369, "eval_precision_entity": 0.7216871471272003, "eval_precision_token": 0.7216871471272003, "eval_recall_entity": 0.7967002749770853, "eval_recall_token": 0.7967002749770853, "eval_runtime": 10.1795, "eval_samples_per_second": 18.567, "eval_steps_per_second": 2.358, "step": 475 }, { "epoch": 12.08, "learning_rate": 4.329896907216495e-06, "loss": 0.0418, "step": 480 }, { "epoch": 12.33, "learning_rate": 3.917525773195877e-06, "loss": 0.045, "step": 490 }, { "epoch": 12.58, "learning_rate": 3.5051546391752577e-06, "loss": 0.0484, "step": 500 }, { "epoch": 12.58, "eval_AGE_f1": 0.7134502923976608, "eval_AGE_number": 159, "eval_AGE_precision": 0.6666666666666666, "eval_AGE_recall": 0.7672955974842768, "eval_ALTI_f1": 0.20689655172413793, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.23076923076923078, "eval_ALTI_recall": 0.1875, "eval_EMAIL_f1": 0.7172413793103448, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.5591397849462365, "eval_EMAIL_recall": 1.0, "eval_GEOG_f1": 0.3870967741935484, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.2727272727272727, "eval_GEOG_recall": 0.6666666666666666, "eval_REGION_f1": 0.560093348891482, "eval_REGION_number": 351, "eval_REGION_precision": 0.4743083003952569, "eval_REGION_recall": 0.6837606837606838, "eval_SITE_f1": 0.44044321329639885, "eval_SITE_number": 330, "eval_SITE_precision": 0.40561224489795916, "eval_SITE_recall": 0.4818181818181818, "eval_TAXA_f1": 0.7956600361663652, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.7573149741824441, "eval_TAXA_recall": 0.8380952380952381, "eval_accuracy_entity": 0.9561061568857799, "eval_accuracy_token": 0.9561061568857799, "eval_f1_entity": 0.7653287788215201, "eval_f1_token": 0.7653287788215201, "eval_loss": 0.15589508414268494, "eval_overall_accuracy": 0.9551271782275147, "eval_overall_f1": 0.6324257425742574, "eval_overall_precision": 0.5709497206703911, "eval_overall_recall": 0.7087378640776699, "eval_precision_entity": 0.71638689048761, "eval_precision_token": 0.71638689048761, "eval_recall_entity": 0.821448212648946, "eval_recall_token": 0.821448212648946, "eval_runtime": 12.7467, "eval_samples_per_second": 14.827, "eval_steps_per_second": 1.883, "step": 500 }, { "epoch": 12.83, "learning_rate": 3.0927835051546395e-06, "loss": 0.0461, "step": 510 }, { "epoch": 13.08, "learning_rate": 2.680412371134021e-06, "loss": 0.0386, "step": 520 }, { "epoch": 13.21, "eval_AGE_f1": 0.7055393586005833, "eval_AGE_number": 159, "eval_AGE_precision": 0.657608695652174, "eval_AGE_recall": 0.7610062893081762, "eval_ALTI_f1": 0.0, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.0, "eval_ALTI_recall": 0.0, "eval_EMAIL_f1": 0.6933333333333334, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.5306122448979592, "eval_EMAIL_recall": 1.0, "eval_GEOG_f1": 0.41379310344827586, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.3, "eval_GEOG_recall": 0.6666666666666666, "eval_REGION_f1": 0.558858501783591, "eval_REGION_number": 351, "eval_REGION_precision": 0.47959183673469385, "eval_REGION_recall": 0.6695156695156695, "eval_SITE_f1": 0.42758620689655175, "eval_SITE_number": 330, "eval_SITE_precision": 0.3924050632911392, "eval_SITE_recall": 0.4696969696969697, "eval_TAXA_f1": 0.7948951686417502, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.7622377622377622, "eval_TAXA_recall": 0.8304761904761905, "eval_accuracy_entity": 0.9557679642583792, "eval_accuracy_token": 0.9557679642583792, "eval_f1_entity": 0.7621009268795055, "eval_f1_token": 0.7621009268795055, "eval_loss": 0.15739484131336212, "eval_overall_accuracy": 0.9548245848240509, "eval_overall_f1": 0.6255835667600373, "eval_overall_precision": 0.567476002258611, "eval_overall_recall": 0.6969486823855756, "eval_precision_entity": 0.716475714055188, "eval_precision_token": 0.716475714055188, "eval_recall_entity": 0.8139321723189734, "eval_recall_token": 0.8139321723189734, "eval_runtime": 10.5618, "eval_samples_per_second": 17.895, "eval_steps_per_second": 2.272, "step": 525 }, { "epoch": 13.33, "learning_rate": 2.268041237113402e-06, "loss": 0.0405, "step": 530 }, { "epoch": 13.58, "learning_rate": 1.8556701030927837e-06, "loss": 0.0438, "step": 540 }, { "epoch": 13.84, "learning_rate": 1.4432989690721649e-06, "loss": 0.0464, "step": 550 }, { "epoch": 13.84, "eval_AGE_f1": 0.7045454545454547, "eval_AGE_number": 159, "eval_AGE_precision": 0.6424870466321243, "eval_AGE_recall": 0.779874213836478, "eval_ALTI_f1": 0.20689655172413793, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.23076923076923078, "eval_ALTI_recall": 0.1875, "eval_EMAIL_f1": 0.7027027027027027, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.5416666666666666, "eval_EMAIL_recall": 1.0, "eval_GEOG_f1": 0.36363636363636365, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.25, "eval_GEOG_recall": 0.6666666666666666, "eval_REGION_f1": 0.5545023696682464, "eval_REGION_number": 351, "eval_REGION_precision": 0.4746450304259635, "eval_REGION_recall": 0.6666666666666666, "eval_SITE_f1": 0.41408450704225347, "eval_SITE_number": 330, "eval_SITE_precision": 0.3868421052631579, "eval_SITE_recall": 0.44545454545454544, "eval_TAXA_f1": 0.7978241160471441, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.7612456747404844, "eval_TAXA_recall": 0.8380952380952381, "eval_accuracy_entity": 0.955144977839483, "eval_accuracy_token": 0.955144977839483, "eval_f1_entity": 0.7586857682079438, "eval_f1_token": 0.7586857682079438, "eval_loss": 0.1583557277917862, "eval_overall_accuracy": 0.9541481995692493, "eval_overall_f1": 0.6250388319353837, "eval_overall_precision": 0.566122678671919, "eval_overall_recall": 0.6976421636615812, "eval_precision_entity": 0.7129958078039342, "eval_precision_token": 0.7129958078039342, "eval_recall_entity": 0.8106324472960587, "eval_recall_token": 0.8106324472960587, "eval_runtime": 12.1366, "eval_samples_per_second": 15.573, "eval_steps_per_second": 1.977, "step": 550 }, { "epoch": 14.09, "learning_rate": 1.0309278350515464e-06, "loss": 0.0405, "step": 560 }, { "epoch": 14.34, "learning_rate": 6.185567010309279e-07, "loss": 0.0448, "step": 570 }, { "epoch": 14.47, "eval_AGE_f1": 0.7163323782234957, "eval_AGE_number": 159, "eval_AGE_precision": 0.6578947368421053, "eval_AGE_recall": 0.7861635220125787, "eval_ALTI_f1": 0.20689655172413793, "eval_ALTI_number": 16, "eval_ALTI_precision": 0.23076923076923078, "eval_ALTI_recall": 0.1875, "eval_EMAIL_f1": 0.732394366197183, "eval_EMAIL_number": 52, "eval_EMAIL_precision": 0.5777777777777777, "eval_EMAIL_recall": 1.0, "eval_GEOG_f1": 0.36363636363636365, "eval_GEOG_number": 9, "eval_GEOG_precision": 0.25, "eval_GEOG_recall": 0.6666666666666666, "eval_REGION_f1": 0.56, "eval_REGION_number": 351, "eval_REGION_precision": 0.47695390781563124, "eval_REGION_recall": 0.6780626780626781, "eval_SITE_f1": 0.41310541310541316, "eval_SITE_number": 330, "eval_SITE_precision": 0.3897849462365591, "eval_SITE_recall": 0.4393939393939394, "eval_TAXA_f1": 0.7981735159817351, "eval_TAXA_number": 525, "eval_TAXA_precision": 0.7666666666666667, "eval_TAXA_recall": 0.8323809523809523, "eval_accuracy_entity": 0.9550203805557039, "eval_accuracy_token": 0.9550203805557039, "eval_f1_entity": 0.7577735784229513, "eval_f1_token": 0.7577735784229513, "eval_loss": 0.1591457575559616, "eval_overall_accuracy": 0.9540236022854702, "eval_overall_f1": 0.62875, "eval_overall_precision": 0.5722411831626849, "eval_overall_recall": 0.6976421636615812, "eval_precision_entity": 0.7129465007273315, "eval_precision_token": 0.7129465007273315, "eval_recall_entity": 0.8086159486709441, "eval_recall_token": 0.8086159486709441, "eval_runtime": 10.2385, "eval_samples_per_second": 18.46, "eval_steps_per_second": 2.344, "step": 575 }, { "epoch": 14.59, "learning_rate": 2.061855670103093e-07, "loss": 0.0413, "step": 580 }, { "epoch": 14.72, "step": 585, "total_flos": 4125504727794096.0, "train_loss": 0.23708797097206116, "train_runtime": 1988.5186, "train_samples_per_second": 9.572, "train_steps_per_second": 0.294 } ], "max_steps": 585, "num_train_epochs": 15, "total_flos": 4125504727794096.0, "trial_name": null, "trial_params": null }