{ "best_metric": 0.9663670629167874, "best_model_checkpoint": "/work/stual/res_ICDAR/method_3/tmp/321-camembert-ner-hierarchical-loss-io/checkpoint-2000", "epoch": 5.2493438320209975, "global_step": 2000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.26, "eval_ACT": { "f1": 0.8378378378378379, "number": 519, "precision": 0.7868020304568528, "recall": 0.8959537572254336 }, "eval_ACT_L1": { "f1": 0.850091407678245, "number": 503, "precision": 0.7868020304568528, "recall": 0.9244532803180915 }, "eval_ACT_L2": { "f1": 0.0, "number": 16, "precision": 0.0, "recall": 0.0 }, "eval_CARDINAL": { "f1": 0.9687726942628904, "number": 678, "precision": 0.9542203147353362, "recall": 0.9837758112094396 }, "eval_DESC": { "f1": 0.0, "number": 30, "precision": 0.0, "recall": 0.0 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.908150064683053, "number": 761, "precision": 0.8942675159235669, "recall": 0.9224704336399474 }, "eval_PER": { "f1": 0.9078947368421053, "number": 676, "precision": 0.8973988439306358, "recall": 0.9186390532544378 }, "eval_SPAT": { "f1": 0.9194915254237289, "number": 694, "precision": 0.9016620498614959, "recall": 0.9380403458213257 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.0, "number": 33, "precision": 0.0, "recall": 0.0 }, "eval_TITREP": { "f1": 0.0, "number": 6, "precision": 0.0, "recall": 0.0 }, "eval_accuracy": 0.926600860541635, "eval_accuracy-all": 0.950582131106049, "eval_accuracy-das": 0.9424196405973171, "eval_accuracy-l1": 0.9369779802581625, "eval_accuracy-l2": 0.9641862819539357, "eval_f1": 0.9032535473699298, "eval_f1-all": 0.9009427121102248, "eval_f1-das": 0.8991195891415995, "eval_f1-l1": 0.8884910485933504, "eval_f1-l2": 0.917252931323283, "eval_loss": 0.3965435028076172, "eval_precision": 0.8908679672038451, "eval_precision-all": 0.8902264259100029, "eval_precision-das": 0.8857968919407301, "eval_precision-l1": 0.8663341645885286, "eval_precision-l2": 0.9225067385444744, "eval_recall": 0.9159883720930233, "eval_recall-all": 0.9119201409277745, "eval_recall-das": 0.9128491620111732, "eval_recall-l1": 0.9118110236220472, "eval_recall-l2": 0.9120586275816123, "eval_runtime": 5.6993, "eval_samples_per_second": 118.611, "eval_steps_per_second": 7.545, "step": 100 }, { "epoch": 0.52, "eval_ACT": { "f1": 0.888888888888889, "number": 519, "precision": 0.8556149732620321, "recall": 0.9248554913294798 }, "eval_ACT_L1": { "f1": 0.9022556390977442, "number": 503, "precision": 0.8556149732620321, "recall": 0.9542743538767395 }, "eval_ACT_L2": { "f1": 0.0, "number": 16, "precision": 0.0, "recall": 0.0 }, "eval_CARDINAL": { "f1": 0.9744338933528124, "number": 678, "precision": 0.9652677279305355, "recall": 0.9837758112094396 }, "eval_DESC": { "f1": 0.0, "number": 30, "precision": 0.0, "recall": 0.0 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9430255402750493, "number": 761, "precision": 0.9399477806788512, "recall": 0.9461235216819974 }, "eval_PER": { "f1": 0.943952802359882, "number": 676, "precision": 0.9411764705882353, "recall": 0.9467455621301775 }, "eval_SPAT": { "f1": 0.9349535382416011, "number": 694, "precision": 0.9276595744680851, "recall": 0.9423631123919308 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.0, "number": 33, "precision": 0.0, "recall": 0.0 }, "eval_TITREP": { "f1": 0.0, "number": 6, "precision": 0.0, "recall": 0.0 }, "eval_accuracy": 0.9360921285750443, "eval_accuracy-all": 0.955960516324981, "eval_accuracy-das": 0.9502657555049354, "eval_accuracy-l1": 0.9448240951657808, "eval_accuracy-l2": 0.9670969374841812, "eval_f1": 0.931761967117707, "eval_f1-all": 0.927931894906796, "eval_f1-das": 0.9288500835965074, "eval_f1-l1": 0.9203631647211413, "eval_f1-l2": 0.9377958079783638, "eval_loss": 0.279910147190094, "eval_precision": 0.9327119137780367, "eval_precision-all": 0.9277957147050191, "eval_precision-das": 0.9266123054114158, "eval_precision-l1": 0.9097435897435897, "eval_precision-l2": 0.9519560741249142, "eval_recall": 0.9308139534883721, "eval_recall-all": 0.9280681150910158, "eval_recall-das": 0.931098696461825, "eval_recall-l1": 0.9312335958005249, "eval_recall-l2": 0.9240506329113924, "eval_runtime": 5.3228, "eval_samples_per_second": 127.0, "eval_steps_per_second": 8.078, "step": 200 }, { "epoch": 0.79, "eval_ACT": { "f1": 0.9224880382775119, "number": 519, "precision": 0.9163498098859315, "recall": 0.928709055876686 }, "eval_ACT_L1": { "f1": 0.9368318756073858, "number": 503, "precision": 0.9163498098859315, "recall": 0.9582504970178927 }, "eval_ACT_L2": { "f1": 0.0, "number": 16, "precision": 0.0, "recall": 0.0 }, "eval_CARDINAL": { "f1": 0.9773226042428675, "number": 678, "precision": 0.969521044992743, "recall": 0.9852507374631269 }, "eval_DESC": { "f1": 0.07692307692307691, "number": 30, "precision": 0.09090909090909091, "recall": 0.06666666666666667 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9381107491856677, "number": 761, "precision": 0.9302325581395349, "recall": 0.9461235216819974 }, "eval_PER": { "f1": 0.9358879882092852, "number": 676, "precision": 0.9324522760646109, "recall": 0.9393491124260355 }, "eval_SPAT": { "f1": 0.9390070921985816, "number": 694, "precision": 0.9245810055865922, "recall": 0.9538904899135446 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.3921568627450981, "number": 33, "precision": 0.5555555555555556, "recall": 0.30303030303030304 }, "eval_TITREP": { "f1": 0.0, "number": 6, "precision": 0.0, "recall": 0.0 }, "eval_accuracy": 0.9426727410782081, "eval_accuracy-all": 0.9577322196912175, "eval_accuracy-das": 0.960389774740572, "eval_accuracy-l1": 0.9483675018982536, "eval_accuracy-l2": 0.9670969374841812, "eval_f1": 0.939160737621606, "eval_f1-all": 0.9306206088992975, "eval_f1-das": 0.9402568397543273, "eval_f1-l1": 0.925194805194805, "eval_f1-l2": 0.937625754527163, "eval_loss": 0.23822064697742462, "eval_precision": 0.938207136640557, "eval_precision-all": 0.9279042615294805, "eval_precision-das": 0.9397321428571429, "eval_precision-l1": 0.9156812339331619, "eval_precision-l2": 0.9439567859554355, "eval_recall": 0.9401162790697675, "eval_recall-all": 0.9333529066353494, "eval_recall-das": 0.9407821229050279, "eval_recall-l1": 0.9349081364829396, "eval_recall-l2": 0.9313790806129247, "eval_runtime": 5.4317, "eval_samples_per_second": 124.456, "eval_steps_per_second": 7.917, "step": 300 }, { "epoch": 1.05, "eval_ACT": { "f1": 0.9135802469135802, "number": 519, "precision": 0.900749063670412, "recall": 0.9267822736030829 }, "eval_ACT_L1": { "f1": 0.9276759884281581, "number": 503, "precision": 0.900749063670412, "recall": 0.9562624254473161 }, "eval_ACT_L2": { "f1": 0.0, "number": 16, "precision": 0.0, "recall": 0.0 }, "eval_CARDINAL": { "f1": 0.9852941176470589, "number": 678, "precision": 0.9824046920821115, "recall": 0.9882005899705014 }, "eval_DESC": { "f1": 0.16129032258064516, "number": 30, "precision": 0.15625, "recall": 0.16666666666666666 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9414858645627877, "number": 761, "precision": 0.9421052631578948, "recall": 0.9408672798948752 }, "eval_PER": { "f1": 0.9646539027982327, "number": 676, "precision": 0.9604105571847508, "recall": 0.9689349112426036 }, "eval_SPAT": { "f1": 0.9440459110473458, "number": 694, "precision": 0.94, "recall": 0.9481268011527377 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.7118644067796609, "number": 33, "precision": 0.8076923076923077, "recall": 0.6363636363636364 }, "eval_TITREP": { "f1": 0.0, "number": 6, "precision": 0.0, "recall": 0.0 }, "eval_accuracy": 0.9511516071880537, "eval_accuracy-all": 0.9660212604403948, "eval_accuracy-das": 0.9677296886864085, "eval_accuracy-l1": 0.9574791192103265, "eval_accuracy-l2": 0.9745634016704632, "eval_f1": 0.9458987783595114, "eval_f1-all": 0.9399003224860745, "eval_f1-das": 0.9493293591654248, "eval_f1-l1": 0.9338178043083311, "eval_f1-l2": 0.9477938699898956, "eval_loss": 0.18405073881149292, "eval_precision": 0.9464493597206054, "eval_precision-all": 0.9385245901639344, "eval_precision-das": 0.9496831904584421, "eval_precision-l1": 0.9235112936344969, "eval_precision-l2": 0.9584468664850136, "eval_recall": 0.9453488372093023, "eval_recall-all": 0.9412800939518496, "eval_recall-das": 0.948975791433892, "eval_recall-l1": 0.9443569553805774, "eval_recall-l2": 0.9373750832778148, "eval_runtime": 5.2971, "eval_samples_per_second": 127.616, "eval_steps_per_second": 8.118, "step": 400 }, { "epoch": 1.31, "learning_rate": 9e-05, "loss": 0.3703, "step": 500 }, { "epoch": 1.31, "eval_ACT": { "f1": 0.9379178605539636, "number": 519, "precision": 0.9299242424242424, "recall": 0.9460500963391136 }, "eval_ACT_L1": { "f1": 0.9524733268671194, "number": 503, "precision": 0.9299242424242424, "recall": 0.9761431411530815 }, "eval_ACT_L2": { "f1": 0.0, "number": 16, "precision": 0.0, "recall": 0.0 }, "eval_CARDINAL": { "f1": 0.9816041206769685, "number": 678, "precision": 0.9794419970631424, "recall": 0.9837758112094396 }, "eval_DESC": { "f1": 0.22727272727272724, "number": 30, "precision": 0.35714285714285715, "recall": 0.16666666666666666 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9286640726329443, "number": 761, "precision": 0.9167733674775929, "recall": 0.9408672798948752 }, "eval_PER": { "f1": 0.960294117647059, "number": 676, "precision": 0.9546783625730995, "recall": 0.9659763313609467 }, "eval_SPAT": { "f1": 0.9291784702549575, "number": 694, "precision": 0.9136490250696379, "recall": 0.9452449567723343 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.7419354838709677, "number": 33, "precision": 0.7931034482758621, "recall": 0.696969696969697 }, "eval_TITREP": { "f1": 0.0, "number": 6, "precision": 0.0, "recall": 0.0 }, "eval_accuracy": 0.951784358390281, "eval_accuracy-all": 0.964123006833713, "eval_accuracy-das": 0.9651986838774994, "eval_accuracy-l1": 0.9583649708934447, "eval_accuracy-l2": 0.9698810427739812, "eval_f1": 0.9481932956029604, "eval_f1-all": 0.9384772760485167, "eval_f1-das": 0.9487940630797775, "eval_f1-l1": 0.9379059495972979, "eval_f1-l2": 0.9392117568470274, "eval_loss": 0.20227569341659546, "eval_precision": 0.9466821211243118, "eval_precision-all": 0.9342449810881582, "eval_precision-das": 0.945286506469501, "eval_precision-l1": 0.9284979423868313, "eval_precision-l2": 0.941728064300067, "eval_recall": 0.9497093023255814, "eval_recall-all": 0.9427480916030534, "eval_recall-das": 0.9523277467411546, "eval_recall-l1": 0.94750656167979, "eval_recall-l2": 0.9367088607594937, "eval_runtime": 5.4983, "eval_samples_per_second": 122.948, "eval_steps_per_second": 7.821, "step": 500 }, { "epoch": 1.57, "eval_ACT": { "f1": 0.9351145038167938, "number": 519, "precision": 0.9262759924385633, "recall": 0.9441233140655106 }, "eval_ACT_L1": { "f1": 0.9496124031007751, "number": 503, "precision": 0.9262759924385633, "recall": 0.974155069582505 }, "eval_ACT_L2": { "f1": 0.0, "number": 16, "precision": 0.0, "recall": 0.0 }, "eval_CARDINAL": { "f1": 0.9808823529411764, "number": 678, "precision": 0.9780058651026393, "recall": 0.9837758112094396 }, "eval_DESC": { "f1": 0.2711864406779661, "number": 30, "precision": 0.27586206896551724, "recall": 0.26666666666666666 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9541284403669723, "number": 761, "precision": 0.9516339869281045, "recall": 0.9566360052562418 }, "eval_PER": { "f1": 0.9720176730486009, "number": 676, "precision": 0.967741935483871, "recall": 0.9763313609467456 }, "eval_SPAT": { "f1": 0.9633883704235463, "number": 694, "precision": 0.9599427753934192, "recall": 0.9668587896253602 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.676470588235294, "number": 33, "precision": 0.6571428571428571, "recall": 0.696969696969697 }, "eval_TITREP": { "f1": 0.0, "number": 6, "precision": 0.0, "recall": 0.0 }, "eval_accuracy": 0.9583649708934447, "eval_accuracy-all": 0.9695646671728676, "eval_accuracy-das": 0.9716527461402177, "eval_accuracy-l1": 0.9644393824348266, "eval_accuracy-l2": 0.9746899519109087, "eval_f1": 0.9551458847437944, "eval_f1-all": 0.9510837727006444, "eval_f1-das": 0.9576050576422462, "eval_f1-l1": 0.9516129032258065, "eval_f1-l2": 0.9504021447721179, "eval_loss": 0.16219548881053925, "eval_precision": 0.953899681066976, "eval_precision-all": 0.9488603156049094, "eval_precision-das": 0.9561826958782027, "eval_precision-l1": 0.9432697266632285, "eval_precision-l2": 0.9561699258260283, "eval_recall": 0.9563953488372093, "eval_recall-all": 0.9533176746917205, "eval_recall-das": 0.9590316573556797, "eval_recall-l1": 0.9601049868766404, "eval_recall-l2": 0.9447035309793471, "eval_runtime": 5.458, "eval_samples_per_second": 123.855, "eval_steps_per_second": 7.878, "step": 600 }, { "epoch": 1.84, "eval_ACT": { "f1": 0.9361296472831266, "number": 519, "precision": 0.9264150943396227, "recall": 0.9460500963391136 }, "eval_ACT_L1": { "f1": 0.9483933787731256, "number": 503, "precision": 0.9293893129770993, "recall": 0.9681908548707754 }, "eval_ACT_L2": { "f1": 0.36363636363636365, "number": 16, "precision": 0.6666666666666666, "recall": 0.25 }, "eval_CARDINAL": { "f1": 0.9889298892988929, "number": 678, "precision": 0.9896602658788775, "recall": 0.9882005899705014 }, "eval_DESC": { "f1": 0.4528301886792453, "number": 30, "precision": 0.5217391304347826, "recall": 0.4 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9514435695538058, "number": 761, "precision": 0.9501965923984272, "recall": 0.9526938239159002 }, "eval_PER": { "f1": 0.9666913397483345, "number": 676, "precision": 0.9674074074074074, "recall": 0.9659763313609467 }, "eval_SPAT": { "f1": 0.9519713261648747, "number": 694, "precision": 0.9472182596291013, "recall": 0.9567723342939481 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.6216216216216217, "number": 33, "precision": 0.5609756097560976, "recall": 0.696969696969697 }, "eval_TITREP": { "f1": 0.2222222222222222, "number": 6, "precision": 0.3333333333333333, "recall": 0.16666666666666666 }, "eval_accuracy": 0.9605163249810175, "eval_accuracy-all": 0.9719691217413313, "eval_accuracy-das": 0.9713996456593268, "eval_accuracy-l1": 0.9669703872437357, "eval_accuracy-l2": 0.9769678562389269, "eval_f1": 0.9528096413532743, "eval_f1-all": 0.9499926675465612, "eval_f1-das": 0.9529827169671065, "eval_f1-l1": 0.9487983281086729, "eval_f1-l2": 0.9515212303577398, "eval_loss": 0.1616193950176239, "eval_precision": 0.9518421816071947, "eval_precision-all": 0.9490184588338705, "eval_precision-das": 0.9510385756676558, "eval_precision-l1": 0.9443577743109725, "eval_precision-l2": 0.9550335570469799, "eval_recall": 0.9537790697674419, "eval_recall-all": 0.9509688784497945, "eval_recall-das": 0.9549348230912477, "eval_recall-l1": 0.9532808398950131, "eval_recall-l2": 0.9480346435709527, "eval_runtime": 5.3537, "eval_samples_per_second": 126.267, "eval_steps_per_second": 8.032, "step": 700 }, { "epoch": 2.1, "eval_ACT": { "f1": 0.9180018850141377, "number": 519, "precision": 0.8985239852398524, "recall": 0.9383429672447013 }, "eval_ACT_L1": { "f1": 0.942439024390244, "number": 503, "precision": 0.9252873563218391, "recall": 0.9602385685884692 }, "eval_ACT_L2": { "f1": 0.22222222222222224, "number": 16, "precision": 0.2, "recall": 0.25 }, "eval_CARDINAL": { "f1": 0.986019131714496, "number": 678, "precision": 0.9838472834067548, "recall": 0.9882005899705014 }, "eval_DESC": { "f1": 0.4210526315789474, "number": 30, "precision": 0.34782608695652173, "recall": 0.5333333333333333 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9256844850065189, "number": 761, "precision": 0.9184993531694696, "recall": 0.9329829172141918 }, "eval_PER": { "f1": 0.9558173784977908, "number": 676, "precision": 0.9516129032258065, "recall": 0.9600591715976331 }, "eval_SPAT": { "f1": 0.9461593682699211, "number": 694, "precision": 0.9427753934191703, "recall": 0.9495677233429395 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.7605633802816901, "number": 33, "precision": 0.7105263157894737, "recall": 0.8181818181818182 }, "eval_TITREP": { "f1": 0.3333333333333333, "number": 6, "precision": 0.3333333333333333, "recall": 0.3333333333333333 }, "eval_accuracy": 0.9474816502151354, "eval_accuracy-all": 0.9607694254619084, "eval_accuracy-das": 0.967603138445963, "eval_accuracy-l1": 0.9552012148823082, "eval_accuracy-l2": 0.9663376360415085, "eval_f1": 0.9397035544682689, "eval_f1-all": 0.9369998545031283, "eval_f1-das": 0.9450305385896723, "eval_f1-l1": 0.9377270368448366, "eval_f1-l2": 0.9360715468698245, "eval_loss": 0.17993101477622986, "eval_precision": 0.9304645198062126, "eval_precision-all": 0.9287568503028555, "eval_precision-das": 0.9392935982339956, "eval_precision-l1": 0.9271421241662391, "eval_precision-l2": 0.9308300395256917, "eval_recall": 0.9491279069767442, "eval_recall-all": 0.9453904873752202, "eval_recall-das": 0.9508379888268157, "eval_recall-l1": 0.9485564304461942, "eval_recall-l2": 0.9413724183877415, "eval_runtime": 5.7248, "eval_samples_per_second": 118.084, "eval_steps_per_second": 7.511, "step": 800 }, { "epoch": 2.36, "eval_ACT": { "f1": 0.9387370405278038, "number": 519, "precision": 0.9188191881918819, "recall": 0.9595375722543352 }, "eval_ACT_L1": { "f1": 0.9555125725338492, "number": 503, "precision": 0.9303201506591338, "recall": 0.9821073558648111 }, "eval_ACT_L2": { "f1": 0.2962962962962963, "number": 16, "precision": 0.36363636363636365, "recall": 0.25 }, "eval_CARDINAL": { "f1": 0.9845474613686535, "number": 678, "precision": 0.9823788546255506, "recall": 0.9867256637168141 }, "eval_DESC": { "f1": 0.3384615384615384, "number": 30, "precision": 0.3142857142857143, "recall": 0.36666666666666664 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9481967213114754, "number": 761, "precision": 0.9463350785340314, "recall": 0.9500657030223391 }, "eval_PER": { "f1": 0.969786293294031, "number": 676, "precision": 0.9662261380323054, "recall": 0.9733727810650887 }, "eval_SPAT": { "f1": 0.9511494252873564, "number": 694, "precision": 0.9484240687679083, "recall": 0.9538904899135446 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.7936507936507938, "number": 33, "precision": 0.8333333333333334, "recall": 0.7575757575757576 }, "eval_TITREP": { "f1": 0.3333333333333333, "number": 6, "precision": 0.3333333333333333, "recall": 0.3333333333333333 }, "eval_accuracy": 0.9600101240192357, "eval_accuracy-all": 0.9705770690964313, "eval_accuracy-das": 0.9731713490255631, "eval_accuracy-l1": 0.9653252341179448, "eval_accuracy-l2": 0.9758289040749177, "eval_f1": 0.9563578367406117, "eval_f1-all": 0.9492912465293001, "eval_f1-das": 0.959539717891611, "eval_f1-l1": 0.9480519480519479, "eval_f1-l2": 0.9508853992649516, "eval_loss": 0.16017325222492218, "eval_precision": 0.9540063638993347, "eval_precision-all": 0.945010183299389, "eval_precision-das": 0.9563448020717721, "eval_precision-l1": 0.9383033419023136, "eval_precision-l2": 0.9537533512064343, "eval_recall": 0.9587209302325581, "eval_recall-all": 0.9536112742219612, "eval_recall-das": 0.962756052141527, "eval_recall-l1": 0.958005249343832, "eval_recall-l2": 0.9480346435709527, "eval_runtime": 5.5031, "eval_samples_per_second": 122.84, "eval_steps_per_second": 7.814, "step": 900 }, { "epoch": 2.62, "learning_rate": 8e-05, "loss": 0.1449, "step": 1000 }, { "epoch": 2.62, "eval_ACT": { "f1": 0.9233716475095786, "number": 519, "precision": 0.9180952380952381, "recall": 0.928709055876686 }, "eval_ACT_L1": { "f1": 0.9397828232971372, "number": 503, "precision": 0.9333333333333333, "recall": 0.9463220675944334 }, "eval_ACT_L2": { "f1": 0.38709677419354843, "number": 16, "precision": 0.4, "recall": 0.375 }, "eval_CARDINAL": { "f1": 0.9823788546255506, "number": 678, "precision": 0.9780701754385965, "recall": 0.9867256637168141 }, "eval_DESC": { "f1": 0.47058823529411764, "number": 30, "precision": 0.42105263157894735, "recall": 0.5333333333333333 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9440104166666667, "number": 761, "precision": 0.9354838709677419, "recall": 0.9526938239159002 }, "eval_PER": { "f1": 0.9690265486725664, "number": 676, "precision": 0.9661764705882353, "recall": 0.9718934911242604 }, "eval_SPAT": { "f1": 0.946236559139785, "number": 694, "precision": 0.9415121255349501, "recall": 0.9510086455331412 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.8307692307692308, "number": 33, "precision": 0.84375, "recall": 0.8181818181818182 }, "eval_TITREP": { "f1": 0.3636363636363636, "number": 6, "precision": 0.4, "recall": 0.3333333333333333 }, "eval_accuracy": 0.957605669450772, "eval_accuracy-all": 0.9693748418121995, "eval_accuracy-das": 0.9710199949379904, "eval_accuracy-l1": 0.9641862819539357, "eval_accuracy-l2": 0.9745634016704632, "eval_f1": 0.9503177354130561, "eval_f1-all": 0.9459538416593631, "eval_f1-das": 0.953583364277757, "eval_f1-l1": 0.9436619718309859, "eval_f1-l2": 0.948871181938911, "eval_loss": 0.17344143986701965, "eval_precision": 0.9443168771526981, "eval_precision-all": 0.9412790697674419, "eval_precision-das": 0.9507589781562384, "eval_precision-l1": 0.937791601866252, "eval_precision-l2": 0.9457313037723362, "eval_recall": 0.9563953488372093, "eval_recall-all": 0.9506752789195537, "eval_recall-das": 0.9564245810055866, "eval_recall-l1": 0.9496062992125984, "eval_recall-l2": 0.9520319786808794, "eval_runtime": 5.2868, "eval_samples_per_second": 127.865, "eval_steps_per_second": 8.133, "step": 1000 }, { "epoch": 2.89, "eval_ACT": { "f1": 0.9411764705882353, "number": 519, "precision": 0.9271028037383178, "recall": 0.9556840077071291 }, "eval_ACT_L1": { "f1": 0.966403162055336, "number": 503, "precision": 0.9607072691552063, "recall": 0.9721669980119284 }, "eval_ACT_L2": { "f1": 0.33333333333333337, "number": 16, "precision": 0.2692307692307692, "recall": 0.4375 }, "eval_CARDINAL": { "f1": 0.9852724594992636, "number": 678, "precision": 0.9838235294117647, "recall": 0.9867256637168141 }, "eval_DESC": { "f1": 0.4864864864864865, "number": 30, "precision": 0.4090909090909091, "recall": 0.6 }, "eval_FT": { "f1": 0.18181818181818182, "number": 7, "precision": 0.25, "recall": 0.14285714285714285 }, "eval_LOC": { "f1": 0.9514435695538058, "number": 761, "precision": 0.9501965923984272, "recall": 0.9526938239159002 }, "eval_PER": { "f1": 0.9807976366322009, "number": 676, "precision": 0.9793510324483776, "recall": 0.9822485207100592 }, "eval_SPAT": { "f1": 0.9503239740820734, "number": 694, "precision": 0.9496402877697842, "recall": 0.9510086455331412 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.819672131147541, "number": 33, "precision": 0.8928571428571429, "recall": 0.7575757575757576 }, "eval_TITREP": { "f1": 0.26666666666666666, "number": 6, "precision": 0.2222222222222222, "recall": 0.3333333333333333 }, "eval_accuracy": 0.9530498607947355, "eval_accuracy-all": 0.964819033156163, "eval_accuracy-das": 0.9724120475828905, "eval_accuracy-l1": 0.960389774740572, "eval_accuracy-l2": 0.969248291571754, "eval_f1": 0.9578566256335989, "eval_f1-all": 0.952937737503654, "eval_f1-das": 0.9619029920089203, "eval_f1-l1": 0.9558861915948839, "eval_f1-l2": 0.9491863168382597, "eval_loss": 0.16722118854522705, "eval_precision": 0.9544011544011544, "eval_precision-all": 0.9487776484284052, "eval_precision-das": 0.9599406528189911, "eval_precision-l1": 0.95067497403946, "eval_precision-l2": 0.9463576158940398, "eval_recall": 0.9613372093023256, "eval_recall-all": 0.9571344685848503, "eval_recall-das": 0.9638733705772812, "eval_recall-l1": 0.9611548556430446, "eval_recall-l2": 0.9520319786808794, "eval_runtime": 5.3735, "eval_samples_per_second": 125.803, "eval_steps_per_second": 8.002, "step": 1100 }, { "epoch": 3.15, "eval_ACT": { "f1": 0.9268755935422602, "number": 519, "precision": 0.9138576779026217, "recall": 0.9402697495183044 }, "eval_ACT_L1": { "f1": 0.95069033530572, "number": 503, "precision": 0.9432485322896281, "recall": 0.9582504970178927 }, "eval_ACT_L2": { "f1": 0.30769230769230765, "number": 16, "precision": 0.2608695652173913, "recall": 0.375 }, "eval_CARDINAL": { "f1": 0.9867647058823529, "number": 678, "precision": 0.9838709677419355, "recall": 0.9896755162241888 }, "eval_DESC": { "f1": 0.43243243243243246, "number": 30, "precision": 0.36363636363636365, "recall": 0.5333333333333333 }, "eval_FT": { "f1": 0.2, "number": 7, "precision": 0.3333333333333333, "recall": 0.14285714285714285 }, "eval_LOC": { "f1": 0.9523809523809524, "number": 761, "precision": 0.9455958549222798, "recall": 0.9592641261498029 }, "eval_PER": { "f1": 0.9742078113485629, "number": 676, "precision": 0.9706314243759178, "recall": 0.977810650887574 }, "eval_SPAT": { "f1": 0.9633883704235463, "number": 694, "precision": 0.9599427753934192, "recall": 0.9668587896253602 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.8059701492537314, "number": 33, "precision": 0.7941176470588235, "recall": 0.8181818181818182 }, "eval_TITREP": { "f1": 0.5, "number": 6, "precision": 0.5, "recall": 0.5 }, "eval_accuracy": 0.9558339660845355, "eval_accuracy-all": 0.9667172867628449, "eval_accuracy-das": 0.9746899519109087, "eval_accuracy-l1": 0.9619083776259175, "eval_accuracy-l2": 0.9715261958997722, "eval_f1": 0.9552411204158244, "eval_f1-all": 0.9526308118350095, "eval_f1-das": 0.9595697329376855, "eval_f1-l1": 0.9531249999999999, "eval_f1-l2": 0.9520026481297584, "eval_loss": 0.15443478524684906, "eval_precision": 0.948938611589214, "eval_precision-all": 0.9458755426917511, "eval_precision-das": 0.9556704839305504, "eval_precision-l1": 0.9457364341085271, "eval_precision-l2": 0.9460526315789474, "eval_recall": 0.9616279069767442, "eval_recall-all": 0.9594832648267763, "eval_recall-das": 0.9635009310986965, "eval_recall-l1": 0.9606299212598425, "eval_recall-l2": 0.9580279813457695, "eval_runtime": 5.4706, "eval_samples_per_second": 123.569, "eval_steps_per_second": 7.86, "step": 1200 }, { "epoch": 3.41, "eval_ACT": { "f1": 0.9435406698564592, "number": 519, "precision": 0.9372623574144486, "recall": 0.9499036608863198 }, "eval_ACT_L1": { "f1": 0.9560975609756097, "number": 503, "precision": 0.9386973180076629, "recall": 0.974155069582505 }, "eval_ACT_L2": { "f1": 0.3, "number": 16, "precision": 0.75, "recall": 0.1875 }, "eval_CARDINAL": { "f1": 0.9882179675994109, "number": 678, "precision": 0.986764705882353, "recall": 0.9896755162241888 }, "eval_DESC": { "f1": 0.48, "number": 30, "precision": 0.6, "recall": 0.4 }, "eval_FT": { "f1": 0.2, "number": 7, "precision": 0.3333333333333333, "recall": 0.14285714285714285 }, "eval_LOC": { "f1": 0.9551656920077972, "number": 761, "precision": 0.9447300771208226, "recall": 0.9658344283837057 }, "eval_PER": { "f1": 0.9756457564575647, "number": 676, "precision": 0.9734904270986745, "recall": 0.977810650887574 }, "eval_SPAT": { "f1": 0.9558404558404557, "number": 694, "precision": 0.9450704225352112, "recall": 0.9668587896253602 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.8307692307692308, "number": 33, "precision": 0.84375, "recall": 0.8181818181818182 }, "eval_TITREP": { "f1": 0.3333333333333333, "number": 6, "precision": 0.3333333333333333, "recall": 0.3333333333333333 }, "eval_accuracy": 0.9607694254619084, "eval_accuracy-all": 0.9705770690964313, "eval_accuracy-das": 0.9731713490255631, "eval_accuracy-l1": 0.9668438370032904, "eval_accuracy-l2": 0.9743103011895723, "eval_f1": 0.9611481588866339, "eval_f1-all": 0.9570175438596491, "eval_f1-das": 0.9630866258579114, "eval_f1-l1": 0.9562043795620437, "eval_f1-l2": 0.9580559254327563, "eval_loss": 0.17625676095485687, "eval_precision": 0.9586466165413534, "eval_precision-all": 0.9531158998252767, "eval_precision-das": 0.959349593495935, "eval_precision-l1": 0.949766960124288, "eval_precision-l2": 0.957418496340652, "eval_recall": 0.9636627906976745, "eval_recall-all": 0.96095126247798, "eval_recall-das": 0.966852886405959, "eval_recall-l1": 0.9627296587926509, "eval_recall-l2": 0.9586942038640907, "eval_runtime": 5.5364, "eval_samples_per_second": 122.101, "eval_steps_per_second": 7.767, "step": 1300 }, { "epoch": 3.67, "eval_ACT": { "f1": 0.9299242424242424, "number": 519, "precision": 0.9143389199255121, "recall": 0.9460500963391136 }, "eval_ACT_L1": { "f1": 0.9517241379310345, "number": 503, "precision": 0.943359375, "recall": 0.9602385685884692 }, "eval_ACT_L2": { "f1": 0.39024390243902435, "number": 16, "precision": 0.32, "recall": 0.5 }, "eval_CARDINAL": { "f1": 0.9830757910228108, "number": 678, "precision": 0.9809104258443465, "recall": 0.9852507374631269 }, "eval_DESC": { "f1": 0.49315068493150693, "number": 30, "precision": 0.4186046511627907, "recall": 0.6 }, "eval_FT": { "f1": 0.22222222222222224, "number": 7, "precision": 0.5, "recall": 0.14285714285714285 }, "eval_LOC": { "f1": 0.9440832249674903, "number": 761, "precision": 0.9343629343629344, "recall": 0.9540078843626807 }, "eval_PER": { "f1": 0.9756457564575647, "number": 676, "precision": 0.9734904270986745, "recall": 0.977810650887574 }, "eval_SPAT": { "f1": 0.9613180515759313, "number": 694, "precision": 0.9558404558404558, "recall": 0.9668587896253602 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.8484848484848486, "number": 33, "precision": 0.8484848484848485, "recall": 0.8484848484848485 }, "eval_TITREP": { "f1": 0.4, "number": 6, "precision": 0.3333333333333333, "recall": 0.5 }, "eval_accuracy": 0.9524171095925082, "eval_accuracy-all": 0.9641862819539357, "eval_accuracy-das": 0.9696279422930904, "eval_accuracy-l1": 0.9610225259427992, "eval_accuracy-l2": 0.9673500379650721, "eval_f1": 0.9534112216933507, "eval_f1-all": 0.9512301645072062, "eval_f1-das": 0.9583101723179546, "eval_f1-l1": 0.9544389481905754, "eval_f1-l2": 0.9471598414795244, "eval_loss": 0.17374566197395325, "eval_precision": 0.9461780704265674, "eval_precision-all": 0.9434016748483973, "eval_precision-das": 0.9535398230088495, "eval_precision-l1": 0.9467975206611571, "eval_precision-l2": 0.9390962671905697, "eval_recall": 0.9607558139534884, "eval_recall-all": 0.9591896652965355, "eval_recall-das": 0.9631284916201117, "eval_recall-l1": 0.9622047244094488, "eval_recall-l2": 0.955363091272485, "eval_runtime": 5.5496, "eval_samples_per_second": 121.811, "eval_steps_per_second": 7.748, "step": 1400 }, { "epoch": 3.94, "learning_rate": 7e-05, "loss": 0.0874, "step": 1500 }, { "epoch": 3.94, "eval_ACT": { "f1": 0.9458689458689458, "number": 519, "precision": 0.9325842696629213, "recall": 0.9595375722543352 }, "eval_ACT_L1": { "f1": 0.9647749510763209, "number": 503, "precision": 0.9499036608863198, "recall": 0.9801192842942346 }, "eval_ACT_L2": { "f1": 0.3225806451612903, "number": 16, "precision": 0.3333333333333333, "recall": 0.3125 }, "eval_CARDINAL": { "f1": 0.9823788546255506, "number": 678, "precision": 0.9780701754385965, "recall": 0.9867256637168141 }, "eval_DESC": { "f1": 0.3225806451612903, "number": 30, "precision": 0.3125, "recall": 0.3333333333333333 }, "eval_FT": { "f1": 0.25, "number": 7, "precision": 0.2222222222222222, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.954367666232073, "number": 761, "precision": 0.9469598965071151, "recall": 0.961892247043364 }, "eval_PER": { "f1": 0.9764011799410028, "number": 676, "precision": 0.9735294117647059, "recall": 0.9792899408284024 }, "eval_SPAT": { "f1": 0.9601706970128022, "number": 694, "precision": 0.9480337078651685, "recall": 0.9726224783861671 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.8358208955223881, "number": 33, "precision": 0.8235294117647058, "recall": 0.8484848484848485 }, "eval_TITREP": { "f1": 0.28571428571428575, "number": 6, "precision": 0.25, "recall": 0.3333333333333333 }, "eval_accuracy": 0.9526702100733991, "eval_accuracy-all": 0.9644393824348266, "eval_accuracy-das": 0.9700075930144267, "eval_accuracy-l1": 0.9602632245001266, "eval_accuracy-l2": 0.9686155403695267, "eval_f1": 0.9585320040456581, "eval_f1-all": 0.9540162980209547, "eval_f1-das": 0.9615384615384616, "eval_f1-l1": 0.9563409563409563, "eval_f1-l2": 0.9510582010582012, "eval_loss": 0.1944604068994522, "eval_precision": 0.9528871014076414, "eval_precision-all": 0.9457587997691864, "eval_precision-das": 0.9548292324641939, "eval_precision-l1": 0.9469891919711786, "eval_precision-l2": 0.9441891004596191, "eval_recall": 0.9642441860465116, "eval_recall-all": 0.9624192601291838, "eval_recall-das": 0.9683426443202979, "eval_recall-l1": 0.9658792650918635, "eval_recall-l2": 0.9580279813457695, "eval_runtime": 5.5418, "eval_samples_per_second": 121.983, "eval_steps_per_second": 7.759, "step": 1500 }, { "epoch": 4.2, "eval_ACT": { "f1": 0.9579349904397705, "number": 519, "precision": 0.9506641366223909, "recall": 0.9653179190751445 }, "eval_ACT_L1": { "f1": 0.973293768545994, "number": 503, "precision": 0.968503937007874, "recall": 0.9781312127236581 }, "eval_ACT_L2": { "f1": 0.5142857142857142, "number": 16, "precision": 0.47368421052631576, "recall": 0.5625 }, "eval_CARDINAL": { "f1": 0.9801031687546058, "number": 678, "precision": 0.979381443298969, "recall": 0.9808259587020649 }, "eval_DESC": { "f1": 0.5901639344262295, "number": 30, "precision": 0.5806451612903226, "recall": 0.6 }, "eval_FT": { "f1": 0.30769230769230765, "number": 7, "precision": 0.3333333333333333, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.9542483660130721, "number": 761, "precision": 0.9492847854356307, "recall": 0.9592641261498029 }, "eval_PER": { "f1": 0.9793510324483775, "number": 676, "precision": 0.9764705882352941, "recall": 0.9822485207100592 }, "eval_SPAT": { "f1": 0.9649749821300929, "number": 694, "precision": 0.9574468085106383, "recall": 0.9726224783861671 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.8064516129032258, "number": 33, "precision": 0.8620689655172413, "recall": 0.7575757575757576 }, "eval_TITREP": { "f1": 0.3333333333333333, "number": 6, "precision": 0.3333333333333333, "recall": 0.3333333333333333 }, "eval_accuracy": 0.9616552771450265, "eval_accuracy-all": 0.9713996456593268, "eval_accuracy-das": 0.9751961528726905, "eval_accuracy-l1": 0.9691217413313086, "eval_accuracy-l2": 0.973677549987345, "eval_f1": 0.9617391304347827, "eval_f1-all": 0.9599298040362678, "eval_f1-das": 0.9646971386101821, "eval_f1-l1": 0.9657874118568817, "eval_f1-l2": 0.9524759056164839, "eval_loss": 0.18698786199092865, "eval_precision": 0.9589595375722544, "eval_precision-all": 0.9562937062937062, "eval_precision-das": 0.9625509825732295, "eval_precision-l1": 0.9610187110187111, "eval_precision-l2": 0.9502652519893899, "eval_recall": 0.9645348837209302, "eval_recall-all": 0.9635936582501468, "eval_recall-das": 0.966852886405959, "eval_recall-l1": 0.9706036745406824, "eval_recall-l2": 0.9546968687541639, "eval_runtime": 5.912, "eval_samples_per_second": 114.344, "eval_steps_per_second": 7.273, "step": 1600 }, { "epoch": 4.46, "eval_ACT": { "f1": 0.9420702754036088, "number": 519, "precision": 0.9288389513108615, "recall": 0.9556840077071291 }, "eval_ACT_L1": { "f1": 0.9663366336633663, "number": 503, "precision": 0.9625246548323472, "recall": 0.9701789264413518 }, "eval_ACT_L2": { "f1": 0.37209302325581395, "number": 16, "precision": 0.2962962962962963, "recall": 0.5 }, "eval_CARDINAL": { "f1": 0.9823269513991163, "number": 678, "precision": 0.9808823529411764, "recall": 0.9837758112094396 }, "eval_DESC": { "f1": 0.4927536231884058, "number": 30, "precision": 0.4358974358974359, "recall": 0.5666666666666667 }, "eval_FT": { "f1": 0.4, "number": 7, "precision": 0.6666666666666666, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.9489528795811519, "number": 761, "precision": 0.9452411994784876, "recall": 0.9526938239159002 }, "eval_PER": { "f1": 0.9778434268833086, "number": 676, "precision": 0.976401179941003, "recall": 0.9792899408284024 }, "eval_SPAT": { "f1": 0.9577060931899642, "number": 694, "precision": 0.9529243937232525, "recall": 0.962536023054755 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.8405797101449276, "number": 33, "precision": 0.8055555555555556, "recall": 0.8787878787878788 }, "eval_TITREP": { "f1": 0.3333333333333333, "number": 6, "precision": 0.3333333333333333, "recall": 0.3333333333333333 }, "eval_accuracy": 0.9578587699316629, "eval_accuracy-all": 0.9679827891672994, "eval_accuracy-das": 0.9738041002277904, "eval_accuracy-l1": 0.9646924829157175, "eval_accuracy-l2": 0.9712730954188813, "eval_f1": 0.9567731675581899, "eval_f1-all": 0.9541605839416059, "eval_f1-das": 0.962109955423477, "eval_f1-l1": 0.9582245430809399, "eval_f1-l2": 0.9490066225165563, "eval_loss": 0.1859915405511856, "eval_precision": 0.9516824849007766, "eval_precision-all": 0.9488966318234611, "eval_precision-das": 0.9596146721007781, "eval_precision-l1": 0.9532467532467532, "eval_precision-l2": 0.9433838051349572, "eval_recall": 0.9619186046511627, "eval_recall-all": 0.9594832648267763, "eval_recall-das": 0.9646182495344506, "eval_recall-l1": 0.963254593175853, "eval_recall-l2": 0.9546968687541639, "eval_runtime": 5.5062, "eval_samples_per_second": 122.771, "eval_steps_per_second": 7.809, "step": 1700 }, { "epoch": 4.72, "eval_ACT": { "f1": 0.9666348903717827, "number": 519, "precision": 0.9566037735849057, "recall": 0.976878612716763 }, "eval_ACT_L1": { "f1": 0.9764705882352941, "number": 503, "precision": 0.9632495164410058, "recall": 0.9900596421471173 }, "eval_ACT_L2": { "f1": 0.6206896551724138, "number": 16, "precision": 0.6923076923076923, "recall": 0.5625 }, "eval_CARDINAL": { "f1": 0.9852941176470589, "number": 678, "precision": 0.9824046920821115, "recall": 0.9882005899705014 }, "eval_DESC": { "f1": 0.5666666666666667, "number": 30, "precision": 0.5666666666666667, "recall": 0.5666666666666667 }, "eval_FT": { "f1": 0.2, "number": 7, "precision": 0.3333333333333333, "recall": 0.14285714285714285 }, "eval_LOC": { "f1": 0.9542483660130721, "number": 761, "precision": 0.9492847854356307, "recall": 0.9592641261498029 }, "eval_PER": { "f1": 0.9793205317577548, "number": 676, "precision": 0.9778761061946902, "recall": 0.9807692307692307 }, "eval_SPAT": { "f1": 0.9547738693467337, "number": 694, "precision": 0.9513590844062947, "recall": 0.9582132564841499 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.8823529411764706, "number": 33, "precision": 0.8571428571428571, "recall": 0.9090909090909091 }, "eval_TITREP": { "f1": 0.4615384615384615, "number": 6, "precision": 0.42857142857142855, "recall": 0.5 }, "eval_accuracy": 0.9643128321943811, "eval_accuracy-all": 0.974120475828904, "eval_accuracy-das": 0.9757023538344722, "eval_accuracy-l1": 0.9711465451784358, "eval_accuracy-l2": 0.9770944064793723, "eval_f1": 0.9649580075296842, "eval_f1-all": 0.9609592045620704, "eval_f1-das": 0.968651456130588, "eval_f1-l1": 0.9626534343170541, "eval_f1-l2": 0.9588039867109635, "eval_loss": 0.16283993422985077, "eval_precision": 0.96133871898442, "eval_precision-all": 0.9571803087678415, "eval_precision-das": 0.9648928307464892, "eval_precision-l1": 0.9579002079002079, "eval_precision-l2": 0.9562624254473161, "eval_recall": 0.9686046511627907, "eval_recall-all": 0.9647680563711099, "eval_recall-das": 0.97243947858473, "eval_recall-l1": 0.9674540682414698, "eval_recall-l2": 0.9613590939373751, "eval_runtime": 5.4991, "eval_samples_per_second": 122.928, "eval_steps_per_second": 7.819, "step": 1800 }, { "epoch": 4.99, "eval_ACT": { "f1": 0.941398865784499, "number": 519, "precision": 0.9239332096474954, "recall": 0.9595375722543352 }, "eval_ACT_L1": { "f1": 0.9655172413793103, "number": 503, "precision": 0.95703125, "recall": 0.974155069582505 }, "eval_ACT_L2": { "f1": 0.37209302325581395, "number": 16, "precision": 0.2962962962962963, "recall": 0.5 }, "eval_CARDINAL": { "f1": 0.9852507374631269, "number": 678, "precision": 0.9852507374631269, "recall": 0.9852507374631269 }, "eval_DESC": { "f1": 0.49315068493150693, "number": 30, "precision": 0.4186046511627907, "recall": 0.6 }, "eval_FT": { "f1": 0.3333333333333333, "number": 7, "precision": 0.4, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.9614126880313931, "number": 761, "precision": 0.95703125, "recall": 0.9658344283837057 }, "eval_PER": { "f1": 0.9815225424981524, "number": 676, "precision": 0.9807976366322009, "recall": 0.9822485207100592 }, "eval_SPAT": { "f1": 0.9555236728837877, "number": 694, "precision": 0.9514285714285714, "recall": 0.9596541786743515 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.923076923076923, "number": 33, "precision": 0.9375, "recall": 0.9090909090909091 }, "eval_TITREP": { "f1": 0.28571428571428575, "number": 6, "precision": 0.25, "recall": 0.3333333333333333 }, "eval_accuracy": 0.960389774740572, "eval_accuracy-all": 0.9701341432548722, "eval_accuracy-das": 0.9759554543153632, "eval_accuracy-l1": 0.9659579853201721, "eval_accuracy-l2": 0.9743103011895723, "eval_f1": 0.9632523148148149, "eval_f1-all": 0.9577012835472578, "eval_f1-das": 0.9673226884515411, "eval_f1-l1": 0.9580401355225436, "eval_f1-l2": 0.9572706194104007, "eval_loss": 0.16160346567630768, "eval_precision": 0.9588133640552995, "eval_precision-all": 0.9515942028985507, "eval_precision-das": 0.9644576082932247, "eval_precision-l1": 0.9513457556935818, "eval_precision-l2": 0.9519104084321476, "eval_recall": 0.9677325581395348, "eval_recall-all": 0.9638872577803875, "eval_recall-das": 0.9702048417132216, "eval_recall-l1": 0.9648293963254593, "eval_recall-l2": 0.9626915389740173, "eval_runtime": 5.4066, "eval_samples_per_second": 125.032, "eval_steps_per_second": 7.953, "step": 1900 }, { "epoch": 5.25, "learning_rate": 6e-05, "loss": 0.0496, "step": 2000 }, { "epoch": 5.25, "eval_ACT": { "f1": 0.9627507163323782, "number": 519, "precision": 0.9545454545454546, "recall": 0.9710982658959537 }, "eval_ACT_L1": { "f1": 0.9735034347399412, "number": 503, "precision": 0.9612403100775194, "recall": 0.9860834990059643 }, "eval_ACT_L2": { "f1": 0.5714285714285715, "number": 16, "precision": 0.6666666666666666, "recall": 0.5 }, "eval_CARDINAL": { "f1": 0.9852507374631269, "number": 678, "precision": 0.9852507374631269, "recall": 0.9852507374631269 }, "eval_DESC": { "f1": 0.5901639344262295, "number": 30, "precision": 0.5806451612903226, "recall": 0.6 }, "eval_FT": { "f1": 0.4615384615384615, "number": 7, "precision": 0.5, "recall": 0.42857142857142855 }, "eval_LOC": { "f1": 0.9574328749181402, "number": 761, "precision": 0.9543080939947781, "recall": 0.9605781865965834 }, "eval_PER": { "f1": 0.9785344189489268, "number": 676, "precision": 0.9792592592592593, "recall": 0.977810650887574 }, "eval_SPAT": { "f1": 0.9619526202440775, "number": 694, "precision": 0.9585121602288984, "recall": 0.9654178674351584 }, "eval_TITRE": { "f1": 0.0, "number": 2, "precision": 0.0, "recall": 0.0 }, "eval_TITREH": { "f1": 0.9206349206349207, "number": 33, "precision": 0.9666666666666667, "recall": 0.8787878787878788 }, "eval_TITREP": { "f1": 0.4615384615384615, "number": 6, "precision": 0.42857142857142855, "recall": 0.5 }, "eval_accuracy": 0.9693748418121995, "eval_accuracy-all": 0.9779169830422678, "eval_accuracy-das": 0.9788661098456087, "eval_accuracy-l1": 0.9744368514300177, "eval_accuracy-l2": 0.9813971146545178, "eval_f1": 0.9663670629167874, "eval_f1-all": 0.9630823322590096, "eval_f1-das": 0.9693137437232657, "eval_f1-l1": 0.964453737584945, "eval_f1-l2": 0.9613333333333334, "eval_loss": 0.1529596447944641, "eval_precision": 0.9638519375361481, "eval_precision-all": 0.9611111111111111, "eval_precision-das": 0.9680534918276374, "eval_precision-l1": 0.9604372722540343, "eval_precision-l2": 0.961974649766511, "eval_recall": 0.9688953488372093, "eval_recall-all": 0.9650616559013505, "eval_recall-das": 0.9705772811918063, "eval_recall-l1": 0.968503937007874, "eval_recall-l2": 0.960692871419054, "eval_runtime": 5.5475, "eval_samples_per_second": 121.856, "eval_steps_per_second": 7.751, "step": 2000 } ], "max_steps": 5000, "num_train_epochs": 14, "total_flos": 813927239246016.0, "trial_name": null, "trial_params": null }