{ "best_metric": 0.9306620270961232, "best_model_checkpoint": "models/google-canine-c-typosquat-v3.1-mnrl/checkpoint-868", "epoch": 1.2385861561119293, "eval_steps": 62, "global_step": 868, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.09131075110456553, "grad_norm": 5.324620723724365, "learning_rate": 3e-05, "loss": 1.219, "step": 62 }, { "epoch": 0.09131075110456553, "eval_info_retr_eval_dot_accuracy@1": 0.9574487639003768, "eval_info_retr_eval_dot_accuracy@10": 0.994026284348865, "eval_info_retr_eval_dot_accuracy@3": 0.9816193364580461, "eval_info_retr_eval_dot_accuracy@5": 0.9881444720154398, "eval_info_retr_eval_dot_map@100": 0.9710061189570759, "eval_info_retr_eval_dot_mrr@10": 0.970718399481841, "eval_info_retr_eval_dot_ndcg@10": 0.9764345312554475, "eval_info_retr_eval_dot_precision@1": 0.9574487639003768, "eval_info_retr_eval_dot_precision@10": 0.09940262843488651, "eval_info_retr_eval_dot_precision@3": 0.32720644548601535, "eval_info_retr_eval_dot_precision@5": 0.197628894403088, "eval_info_retr_eval_dot_recall@1": 0.9574487639003768, "eval_info_retr_eval_dot_recall@10": 0.994026284348865, "eval_info_retr_eval_dot_recall@3": 0.9816193364580461, "eval_info_retr_eval_dot_recall@5": 0.9881444720154398, "eval_loss": 0.11100412905216217, "eval_para_mine_eval_average_precision": 0.7672056895535211, "eval_para_mine_eval_f1": 0.7847944762520686, "eval_para_mine_eval_precision": 0.8285314095516364, "eval_para_mine_eval_recall": 0.7454436228787721, "eval_para_mine_eval_threshold": 0.7348841428756714, "eval_runtime": 44.8792, "eval_samples_per_second": 242.451, "eval_sequential_score": 0.9710061189570759, "eval_steps_per_second": 1.916, "step": 62 }, { "epoch": 0.18262150220913106, "grad_norm": 3.005993604660034, "learning_rate": 4.943211151264843e-05, "loss": 0.1012, "step": 124 }, { "epoch": 0.18262150220913106, "eval_info_retr_eval_dot_accuracy@1": 0.9798731734215606, "eval_info_retr_eval_dot_accuracy@10": 0.9973348037864167, "eval_info_retr_eval_dot_accuracy@3": 0.9930153478540575, "eval_info_retr_eval_dot_accuracy@5": 0.9957724473853506, "eval_info_retr_eval_dot_map@100": 0.9868644025653387, "eval_info_retr_eval_dot_mrr@10": 0.9867332819841785, "eval_info_retr_eval_dot_ndcg@10": 0.989378667273856, "eval_info_retr_eval_dot_precision@1": 0.9798731734215606, "eval_info_retr_eval_dot_precision@10": 0.09973348037864167, "eval_info_retr_eval_dot_precision@3": 0.33100511595135246, "eval_info_retr_eval_dot_precision@5": 0.19915448947707012, "eval_info_retr_eval_dot_recall@1": 0.9798731734215606, "eval_info_retr_eval_dot_recall@10": 0.9973348037864167, "eval_info_retr_eval_dot_recall@3": 0.9930153478540575, "eval_info_retr_eval_dot_recall@5": 0.9957724473853506, "eval_loss": 0.04060104861855507, "eval_para_mine_eval_average_precision": 0.8585605463078829, "eval_para_mine_eval_f1": 0.8537043823665016, "eval_para_mine_eval_precision": 0.8957241803604032, "eval_para_mine_eval_recall": 0.8154503529921904, "eval_para_mine_eval_threshold": 0.6834436357021332, "eval_runtime": 44.147, "eval_samples_per_second": 246.472, "eval_sequential_score": 0.9868644025653387, "eval_steps_per_second": 1.948, "step": 124 }, { "epoch": 0.27393225331369664, "grad_norm": 0.6856785416603088, "learning_rate": 4.783169850283944e-05, "loss": 0.0693, "step": 186 }, { "epoch": 0.27393225331369664, "eval_info_retr_eval_dot_accuracy@1": 0.9855711791195663, "eval_info_retr_eval_dot_accuracy@10": 0.9988971601874828, "eval_info_retr_eval_dot_accuracy@3": 0.9959562540207701, "eval_info_retr_eval_dot_accuracy@5": 0.9977943203749655, "eval_info_retr_eval_dot_map@100": 0.9910708474937577, "eval_info_retr_eval_dot_mrr@10": 0.991004780431304, "eval_info_retr_eval_dot_ndcg@10": 0.9929831934334958, "eval_info_retr_eval_dot_precision@1": 0.9855711791195663, "eval_info_retr_eval_dot_precision@10": 0.09988971601874828, "eval_info_retr_eval_dot_precision@3": 0.3319854180069234, "eval_info_retr_eval_dot_precision@5": 0.19955886407499313, "eval_info_retr_eval_dot_recall@1": 0.9855711791195663, "eval_info_retr_eval_dot_recall@10": 0.9988971601874828, "eval_info_retr_eval_dot_recall@3": 0.9959562540207701, "eval_info_retr_eval_dot_recall@5": 0.9977943203749655, "eval_loss": 0.024971680715680122, "eval_para_mine_eval_average_precision": 0.8878504879371486, "eval_para_mine_eval_f1": 0.8765703942488466, "eval_para_mine_eval_precision": 0.9063191861895322, "eval_para_mine_eval_recall": 0.8487124705839841, "eval_para_mine_eval_threshold": 0.6699230670928955, "eval_runtime": 44.4383, "eval_samples_per_second": 244.856, "eval_sequential_score": 0.9910708474937577, "eval_steps_per_second": 1.935, "step": 186 }, { "epoch": 0.36524300441826213, "grad_norm": 0.5819792747497559, "learning_rate": 4.623128549303046e-05, "loss": 0.0424, "step": 248 }, { "epoch": 0.36524300441826213, "eval_info_retr_eval_dot_accuracy@1": 0.9887877952394082, "eval_info_retr_eval_dot_accuracy@10": 0.9994485800937414, "eval_info_retr_eval_dot_accuracy@3": 0.9978862236926753, "eval_info_retr_eval_dot_accuracy@5": 0.9986214502343534, "eval_info_retr_eval_dot_map@100": 0.9933887693878125, "eval_info_retr_eval_dot_mrr@10": 0.993345798632537, "eval_info_retr_eval_dot_ndcg@10": 0.994887605721736, "eval_info_retr_eval_dot_precision@1": 0.9887877952394082, "eval_info_retr_eval_dot_precision@10": 0.09994485800937414, "eval_info_retr_eval_dot_precision@3": 0.33262874123089176, "eval_info_retr_eval_dot_precision@5": 0.19972429004687073, "eval_info_retr_eval_dot_recall@1": 0.9887877952394082, "eval_info_retr_eval_dot_recall@10": 0.9994485800937414, "eval_info_retr_eval_dot_recall@3": 0.9978862236926753, "eval_info_retr_eval_dot_recall@5": 0.9986214502343534, "eval_loss": 0.01834421418607235, "eval_para_mine_eval_average_precision": 0.8919509440660052, "eval_para_mine_eval_f1": 0.8783150608010457, "eval_para_mine_eval_precision": 0.8953218322315484, "eval_para_mine_eval_recall": 0.8619423378336262, "eval_para_mine_eval_threshold": 0.6646433770656586, "eval_runtime": 44.2865, "eval_samples_per_second": 245.696, "eval_sequential_score": 0.9933887693878125, "eval_steps_per_second": 1.942, "step": 248 }, { "epoch": 0.4565537555228277, "grad_norm": 0.2500639259815216, "learning_rate": 4.463087248322148e-05, "loss": 0.0382, "step": 310 }, { "epoch": 0.4565537555228277, "eval_info_retr_eval_dot_accuracy@1": 0.9904420549581839, "eval_info_retr_eval_dot_accuracy@10": 0.9998161933645805, "eval_info_retr_eval_dot_accuracy@3": 0.9982538369635143, "eval_info_retr_eval_dot_accuracy@5": 0.998805256869773, "eval_info_retr_eval_dot_map@100": 0.9944206662844655, "eval_info_retr_eval_dot_mrr@10": 0.9944099442307328, "eval_info_retr_eval_dot_ndcg@10": 0.9957667469329782, "eval_info_retr_eval_dot_precision@1": 0.9904420549581839, "eval_info_retr_eval_dot_precision@10": 0.09998161933645805, "eval_info_retr_eval_dot_precision@3": 0.3327512789878381, "eval_info_retr_eval_dot_precision@5": 0.19976105137395464, "eval_info_retr_eval_dot_recall@1": 0.9904420549581839, "eval_info_retr_eval_dot_recall@10": 0.9998161933645805, "eval_info_retr_eval_dot_recall@3": 0.9982538369635143, "eval_info_retr_eval_dot_recall@5": 0.998805256869773, "eval_loss": 0.01802203245460987, "eval_para_mine_eval_average_precision": 0.8868720697863423, "eval_para_mine_eval_f1": 0.8749901834425858, "eval_para_mine_eval_precision": 0.8953481226571621, "eval_para_mine_eval_recall": 0.8555374379497094, "eval_para_mine_eval_threshold": 0.6635497808456421, "eval_runtime": 44.1381, "eval_samples_per_second": 246.521, "eval_sequential_score": 0.9944206662844655, "eval_steps_per_second": 1.948, "step": 310 }, { "epoch": 0.5478645066273933, "grad_norm": 0.8567762970924377, "learning_rate": 4.3030459473412496e-05, "loss": 0.0475, "step": 372 }, { "epoch": 0.5478645066273933, "eval_info_retr_eval_dot_accuracy@1": 0.9909934748644426, "eval_info_retr_eval_dot_accuracy@10": 0.9995404834114512, "eval_info_retr_eval_dot_accuracy@3": 0.9974267071041265, "eval_info_retr_eval_dot_accuracy@5": 0.9978862236926753, "eval_info_retr_eval_dot_map@100": 0.9943151219822102, "eval_info_retr_eval_dot_mrr@10": 0.9942822642643431, "eval_info_retr_eval_dot_ndcg@10": 0.9955792346109411, "eval_info_retr_eval_dot_precision@1": 0.9909934748644426, "eval_info_retr_eval_dot_precision@10": 0.09995404834114513, "eval_info_retr_eval_dot_precision@3": 0.33247556903470876, "eval_info_retr_eval_dot_precision@5": 0.19957724473853508, "eval_info_retr_eval_dot_recall@1": 0.9909934748644426, "eval_info_retr_eval_dot_recall@10": 0.9995404834114512, "eval_info_retr_eval_dot_recall@3": 0.9974267071041265, "eval_info_retr_eval_dot_recall@5": 0.9978862236926753, "eval_loss": 0.020289968699216843, "eval_para_mine_eval_average_precision": 0.9057199011076745, "eval_para_mine_eval_f1": 0.8932047816062182, "eval_para_mine_eval_precision": 0.9151715052081852, "eval_para_mine_eval_recall": 0.8722678675477544, "eval_para_mine_eval_threshold": 0.6722444593906403, "eval_runtime": 44.2598, "eval_samples_per_second": 245.844, "eval_sequential_score": 0.9943151219822102, "eval_steps_per_second": 1.943, "step": 372 }, { "epoch": 0.6391752577319587, "grad_norm": 1.4318528175354004, "learning_rate": 4.1430046463603515e-05, "loss": 0.0377, "step": 434 }, { "epoch": 0.6391752577319587, "eval_info_retr_eval_dot_accuracy@1": 0.9912691848175719, "eval_info_retr_eval_dot_accuracy@10": 0.9997242900468707, "eval_info_retr_eval_dot_accuracy@3": 0.998805256869773, "eval_info_retr_eval_dot_accuracy@5": 0.9995404834114512, "eval_info_retr_eval_dot_map@100": 0.9950291896321672, "eval_info_retr_eval_dot_mrr@10": 0.9950066958131474, "eval_info_retr_eval_dot_ndcg@10": 0.996211640167477, "eval_info_retr_eval_dot_precision@1": 0.9912691848175719, "eval_info_retr_eval_dot_precision@10": 0.09997242900468709, "eval_info_retr_eval_dot_precision@3": 0.33293508562325763, "eval_info_retr_eval_dot_precision@5": 0.1999080966822902, "eval_info_retr_eval_dot_recall@1": 0.9912691848175719, "eval_info_retr_eval_dot_recall@10": 0.9997242900468707, "eval_info_retr_eval_dot_recall@3": 0.998805256869773, "eval_info_retr_eval_dot_recall@5": 0.9995404834114512, "eval_loss": 0.015328879468142986, "eval_para_mine_eval_average_precision": 0.8941081769196199, "eval_para_mine_eval_f1": 0.8799847506361558, "eval_para_mine_eval_precision": 0.8951106127502512, "eval_para_mine_eval_recall": 0.8653615967984535, "eval_para_mine_eval_threshold": 0.6661731898784637, "eval_runtime": 44.1048, "eval_samples_per_second": 246.708, "eval_sequential_score": 0.9950291896321672, "eval_steps_per_second": 1.95, "step": 434 }, { "epoch": 0.7304860088365243, "grad_norm": 0.5837889909744263, "learning_rate": 3.9829633453794526e-05, "loss": 0.0241, "step": 496 }, { "epoch": 0.7304860088365243, "eval_info_retr_eval_dot_accuracy@1": 0.9905339582758937, "eval_info_retr_eval_dot_accuracy@10": 0.9998161933645805, "eval_info_retr_eval_dot_accuracy@3": 0.9981619336458046, "eval_info_retr_eval_dot_accuracy@5": 0.9993566767760316, "eval_info_retr_eval_dot_map@100": 0.9944845062676603, "eval_info_retr_eval_dot_mrr@10": 0.994473656570431, "eval_info_retr_eval_dot_ndcg@10": 0.9958242906817244, "eval_info_retr_eval_dot_precision@1": 0.9905339582758937, "eval_info_retr_eval_dot_precision@10": 0.09998161933645805, "eval_info_retr_eval_dot_precision@3": 0.3327206445486015, "eval_info_retr_eval_dot_precision@5": 0.19987133535520635, "eval_info_retr_eval_dot_recall@1": 0.9905339582758937, "eval_info_retr_eval_dot_recall@10": 0.9998161933645805, "eval_info_retr_eval_dot_recall@3": 0.9981619336458046, "eval_info_retr_eval_dot_recall@5": 0.9993566767760316, "eval_loss": 0.016888538375496864, "eval_para_mine_eval_average_precision": 0.8920135475248205, "eval_para_mine_eval_f1": 0.8817566331198535, "eval_para_mine_eval_precision": 0.8931684329053274, "eval_para_mine_eval_recall": 0.870632766166952, "eval_para_mine_eval_threshold": 0.6506930291652679, "eval_runtime": 43.9952, "eval_samples_per_second": 247.322, "eval_sequential_score": 0.9944845062676603, "eval_steps_per_second": 1.955, "step": 496 }, { "epoch": 0.8217967599410898, "grad_norm": 0.7147839069366455, "learning_rate": 3.8229220443985544e-05, "loss": 0.045, "step": 558 }, { "epoch": 0.8217967599410898, "eval_info_retr_eval_dot_accuracy@1": 0.9938424777134455, "eval_info_retr_eval_dot_accuracy@10": 0.9998161933645805, "eval_info_retr_eval_dot_accuracy@3": 0.9986214502343534, "eval_info_retr_eval_dot_accuracy@5": 0.9993566767760316, "eval_info_retr_eval_dot_map@100": 0.9963993172223115, "eval_info_retr_eval_dot_mrr@10": 0.9963845891265246, "eval_info_retr_eval_dot_ndcg@10": 0.9972497507624225, "eval_info_retr_eval_dot_precision@1": 0.9938424777134455, "eval_info_retr_eval_dot_precision@10": 0.09998161933645805, "eval_info_retr_eval_dot_precision@3": 0.33287381674478445, "eval_info_retr_eval_dot_precision@5": 0.19987133535520635, "eval_info_retr_eval_dot_recall@1": 0.9938424777134455, "eval_info_retr_eval_dot_recall@10": 0.9998161933645805, "eval_info_retr_eval_dot_recall@3": 0.9986214502343534, "eval_info_retr_eval_dot_recall@5": 0.9993566767760316, "eval_loss": 0.013228075578808784, "eval_para_mine_eval_average_precision": 0.9111664137442287, "eval_para_mine_eval_f1": 0.8942790038822603, "eval_para_mine_eval_precision": 0.9093417624592629, "eval_para_mine_eval_recall": 0.8797071271449414, "eval_para_mine_eval_threshold": 0.6545680165290833, "eval_runtime": 44.1589, "eval_samples_per_second": 246.405, "eval_sequential_score": 0.9963993172223115, "eval_steps_per_second": 1.948, "step": 558 }, { "epoch": 0.9131075110456554, "grad_norm": 1.6569366455078125, "learning_rate": 3.662880743417656e-05, "loss": 0.0302, "step": 620 }, { "epoch": 0.9131075110456554, "eval_info_retr_eval_dot_accuracy@1": 0.9913610881352817, "eval_info_retr_eval_dot_accuracy@10": 0.9992647734583219, "eval_info_retr_eval_dot_accuracy@3": 0.9980700303280948, "eval_info_retr_eval_dot_accuracy@5": 0.9987133535520633, "eval_info_retr_eval_dot_map@100": 0.9947594505678611, "eval_info_retr_eval_dot_mrr@10": 0.9947092135264177, "eval_info_retr_eval_dot_ndcg@10": 0.9958603290565278, "eval_info_retr_eval_dot_precision@1": 0.9913610881352817, "eval_info_retr_eval_dot_precision@10": 0.0999264773458322, "eval_info_retr_eval_dot_precision@3": 0.33269001010936494, "eval_info_retr_eval_dot_precision@5": 0.19974267071041266, "eval_info_retr_eval_dot_recall@1": 0.9913610881352817, "eval_info_retr_eval_dot_recall@10": 0.9992647734583219, "eval_info_retr_eval_dot_recall@3": 0.9980700303280948, "eval_info_retr_eval_dot_recall@5": 0.9987133535520633, "eval_loss": 0.01584717258810997, "eval_para_mine_eval_average_precision": 0.9161096169142061, "eval_para_mine_eval_f1": 0.9015840220385676, "eval_para_mine_eval_precision": 0.9167067369413698, "eval_para_mine_eval_recall": 0.886952161992475, "eval_para_mine_eval_threshold": 0.6570625901222229, "eval_runtime": 44.3069, "eval_samples_per_second": 245.583, "eval_sequential_score": 0.9947594505678611, "eval_steps_per_second": 1.941, "step": 620 }, { "epoch": 1.004418262150221, "grad_norm": 0.12535937130451202, "learning_rate": 3.502839442436758e-05, "loss": 0.0314, "step": 682 }, { "epoch": 1.004418262150221, "eval_info_retr_eval_dot_accuracy@1": 0.9902582483227644, "eval_info_retr_eval_dot_accuracy@10": 0.9998161933645805, "eval_info_retr_eval_dot_accuracy@3": 0.9983457402812241, "eval_info_retr_eval_dot_accuracy@5": 0.9994485800937414, "eval_info_retr_eval_dot_map@100": 0.9944195539625648, "eval_info_retr_eval_dot_mrr@10": 0.9944061513953989, "eval_info_retr_eval_dot_ndcg@10": 0.9957806542116834, "eval_info_retr_eval_dot_precision@1": 0.9902582483227644, "eval_info_retr_eval_dot_precision@10": 0.09998161933645805, "eval_info_retr_eval_dot_precision@3": 0.3327819134270747, "eval_info_retr_eval_dot_precision@5": 0.19988971601874833, "eval_info_retr_eval_dot_recall@1": 0.9902582483227644, "eval_info_retr_eval_dot_recall@10": 0.9998161933645805, "eval_info_retr_eval_dot_recall@3": 0.9983457402812241, "eval_info_retr_eval_dot_recall@5": 0.9994485800937414, "eval_loss": 0.01480414904654026, "eval_para_mine_eval_average_precision": 0.9018706893922749, "eval_para_mine_eval_f1": 0.8877219600165349, "eval_para_mine_eval_precision": 0.8927995468022605, "eval_para_mine_eval_recall": 0.8827018017733171, "eval_para_mine_eval_threshold": 0.6474231779575348, "eval_runtime": 43.8665, "eval_samples_per_second": 248.048, "eval_sequential_score": 0.9944195539625648, "eval_steps_per_second": 1.96, "step": 682 }, { "epoch": 1.0559646539027983, "grad_norm": 0.2109777331352234, "learning_rate": 3.342798141455859e-05, "loss": 0.0204, "step": 744 }, { "epoch": 1.0559646539027983, "eval_info_retr_eval_dot_accuracy@1": 0.9939343810311553, "eval_info_retr_eval_dot_accuracy@10": 1.0, "eval_info_retr_eval_dot_accuracy@3": 0.9992647734583219, "eval_info_retr_eval_dot_accuracy@5": 0.9999080966822902, "eval_info_retr_eval_dot_map@100": 0.996594216217872, "eval_info_retr_eval_dot_mrr@10": 0.9965942162178723, "eval_info_retr_eval_dot_ndcg@10": 0.9974631239499567, "eval_info_retr_eval_dot_precision@1": 0.9939343810311553, "eval_info_retr_eval_dot_precision@10": 0.10000000000000002, "eval_info_retr_eval_dot_precision@3": 0.33308825781944057, "eval_info_retr_eval_dot_precision@5": 0.19998161933645806, "eval_info_retr_eval_dot_recall@1": 0.9939343810311553, "eval_info_retr_eval_dot_recall@10": 1.0, "eval_info_retr_eval_dot_recall@3": 0.9992647734583219, "eval_info_retr_eval_dot_recall@5": 0.9999080966822902, "eval_loss": 0.011477422900497913, "eval_para_mine_eval_average_precision": 0.9183526341973961, "eval_para_mine_eval_f1": 0.9008710021688987, "eval_para_mine_eval_precision": 0.9157536675501139, "eval_para_mine_eval_recall": 0.8864643416910201, "eval_para_mine_eval_threshold": 0.6480826139450073, "eval_runtime": 45.0423, "eval_samples_per_second": 241.573, "eval_sequential_score": 0.996594216217872, "eval_steps_per_second": 1.909, "step": 744 }, { "epoch": 1.1472754050073637, "grad_norm": 0.43087926506996155, "learning_rate": 3.182756840474961e-05, "loss": 0.0193, "step": 806 }, { "epoch": 1.1472754050073637, "eval_info_retr_eval_dot_accuracy@1": 0.9939343810311553, "eval_info_retr_eval_dot_accuracy@10": 1.0, "eval_info_retr_eval_dot_accuracy@3": 0.9991728701406121, "eval_info_retr_eval_dot_accuracy@5": 0.9998161933645805, "eval_info_retr_eval_dot_map@100": 0.996541371810189, "eval_info_retr_eval_dot_mrr@10": 0.996541371810189, "eval_info_retr_eval_dot_ndcg@10": 0.9974193893555866, "eval_info_retr_eval_dot_precision@1": 0.9939343810311553, "eval_info_retr_eval_dot_precision@10": 0.10000000000000002, "eval_info_retr_eval_dot_precision@3": 0.333057623380204, "eval_info_retr_eval_dot_precision@5": 0.1999632386729161, "eval_info_retr_eval_dot_recall@1": 0.9939343810311553, "eval_info_retr_eval_dot_recall@10": 1.0, "eval_info_retr_eval_dot_recall@3": 0.9991728701406121, "eval_info_retr_eval_dot_recall@5": 0.9998161933645805, "eval_loss": 0.01137059461325407, "eval_para_mine_eval_average_precision": 0.9152930281344098, "eval_para_mine_eval_f1": 0.8996903771768937, "eval_para_mine_eval_precision": 0.9043090584686712, "eval_para_mine_eval_recall": 0.895118635187201, "eval_para_mine_eval_threshold": 0.6495572626590729, "eval_runtime": 43.8875, "eval_samples_per_second": 247.93, "eval_sequential_score": 0.996541371810189, "eval_steps_per_second": 1.96, "step": 806 }, { "epoch": 1.2385861561119293, "grad_norm": 1.3790454864501953, "learning_rate": 3.0227155394940632e-05, "loss": 0.0164, "step": 868 }, { "epoch": 1.2385861561119293, "eval_info_retr_eval_dot_accuracy@1": 0.9937505743957357, "eval_info_retr_eval_dot_accuracy@10": 1.0, "eval_info_retr_eval_dot_accuracy@3": 0.9990809668229023, "eval_info_retr_eval_dot_accuracy@5": 0.9999080966822902, "eval_info_retr_eval_dot_map@100": 0.9964954201513342, "eval_info_retr_eval_dot_mrr@10": 0.9964954201513342, "eval_info_retr_eval_dot_ndcg@10": 0.9973903161826975, "eval_info_retr_eval_dot_precision@1": 0.9937505743957357, "eval_info_retr_eval_dot_precision@10": 0.10000000000000002, "eval_info_retr_eval_dot_precision@3": 0.3330269889409674, "eval_info_retr_eval_dot_precision@5": 0.19998161933645806, "eval_info_retr_eval_dot_recall@1": 0.9937505743957357, "eval_info_retr_eval_dot_recall@10": 1.0, "eval_info_retr_eval_dot_recall@3": 0.9990809668229023, "eval_info_retr_eval_dot_recall@5": 0.9999080966822902, "eval_loss": 0.009216207079589367, "eval_para_mine_eval_average_precision": 0.9306620270961232, "eval_para_mine_eval_f1": 0.9113359207458677, "eval_para_mine_eval_precision": 0.9197094729482332, "eval_para_mine_eval_recall": 0.9031134679054893, "eval_para_mine_eval_threshold": 0.6408547163009644, "eval_runtime": 44.7336, "eval_samples_per_second": 243.24, "eval_sequential_score": 0.9964954201513342, "eval_steps_per_second": 1.922, "step": 868 } ], "logging_steps": 62, "max_steps": 2037, "num_input_tokens_seen": 0, "num_train_epochs": 3, "save_steps": 62, "stateful_callbacks": { "EarlyStoppingCallback": { "args": { "early_stopping_patience": 3, "early_stopping_threshold": 0.0 }, "attributes": { "early_stopping_patience_counter": 0 } }, "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 0.0, "train_batch_size": 64, "trial_name": null, "trial_params": null }