{ "best_metric": 0.5714132731149775, "best_model_checkpoint": "models/all-minilm-l6-v2-typosquat-v3.1-gist/checkpoint-1674", "epoch": 2.385861561119293, "eval_steps": 62, "global_step": 1674, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.09131075110456553, "grad_norm": 17.575565338134766, "learning_rate": 3e-05, "loss": 1.9075, "step": 62 }, { "epoch": 0.09131075110456553, "eval_info_retr_eval_dot_accuracy@1": 0.8306221854608952, "eval_info_retr_eval_dot_accuracy@10": 0.9250068927488282, "eval_info_retr_eval_dot_accuracy@3": 0.8876941457586619, "eval_info_retr_eval_dot_accuracy@5": 0.9032258064516129, "eval_info_retr_eval_dot_map@100": 0.8651529300165571, "eval_info_retr_eval_dot_mrr@10": 0.8627116876220815, "eval_info_retr_eval_dot_ndcg@10": 0.8777861364040704, "eval_info_retr_eval_dot_precision@1": 0.8306221854608952, "eval_info_retr_eval_dot_precision@10": 0.09250068927488282, "eval_info_retr_eval_dot_precision@3": 0.2958980485862206, "eval_info_retr_eval_dot_precision@5": 0.18064516129032257, "eval_info_retr_eval_dot_recall@1": 0.8306221854608952, "eval_info_retr_eval_dot_recall@10": 0.9250068927488282, "eval_info_retr_eval_dot_recall@3": 0.8876941457586619, "eval_info_retr_eval_dot_recall@5": 0.9032258064516129, "eval_loss": 0.8926403522491455, "eval_para_mine_eval_average_precision": 0.4175368476477107, "eval_para_mine_eval_f1": 0.5608786555511446, "eval_para_mine_eval_precision": 0.6772723495912615, "eval_para_mine_eval_recall": 0.4786239854015258, "eval_para_mine_eval_threshold": 0.7514148652553558, "eval_runtime": 46.7645, "eval_samples_per_second": 232.676, "eval_sequential_score": 0.8651529300165571, "eval_steps_per_second": 1.839, "step": 62 }, { "epoch": 0.18262150220913106, "grad_norm": 6.875263214111328, "learning_rate": 4.943211151264843e-05, "loss": 0.9074, "step": 124 }, { "epoch": 0.18262150220913106, "eval_info_retr_eval_dot_accuracy@1": 0.8424777134454554, "eval_info_retr_eval_dot_accuracy@10": 0.9359433875562908, "eval_info_retr_eval_dot_accuracy@3": 0.8946787979046044, "eval_info_retr_eval_dot_accuracy@5": 0.9126918481757191, "eval_info_retr_eval_dot_map@100": 0.8756277031952363, "eval_info_retr_eval_dot_mrr@10": 0.873614557485526, "eval_info_retr_eval_dot_ndcg@10": 0.8886439257445581, "eval_info_retr_eval_dot_precision@1": 0.8424777134454554, "eval_info_retr_eval_dot_precision@10": 0.09359433875562909, "eval_info_retr_eval_dot_precision@3": 0.2982262659682014, "eval_info_retr_eval_dot_precision@5": 0.18253836963514383, "eval_info_retr_eval_dot_recall@1": 0.8424777134454554, "eval_info_retr_eval_dot_recall@10": 0.9359433875562908, "eval_info_retr_eval_dot_recall@3": 0.8946787979046044, "eval_info_retr_eval_dot_recall@5": 0.9126918481757191, "eval_loss": 0.6083176732063293, "eval_para_mine_eval_average_precision": 0.458339002373722, "eval_para_mine_eval_f1": 0.5954711973336655, "eval_para_mine_eval_precision": 0.6810695759380306, "eval_para_mine_eval_recall": 0.5289869146720989, "eval_para_mine_eval_threshold": 0.8661167621612549, "eval_runtime": 47.222, "eval_samples_per_second": 230.422, "eval_sequential_score": 0.8756277031952363, "eval_steps_per_second": 1.821, "step": 124 }, { "epoch": 0.27393225331369664, "grad_norm": 5.694400787353516, "learning_rate": 4.783169850283944e-05, "loss": 0.6272, "step": 186 }, { "epoch": 0.27393225331369664, "eval_info_retr_eval_dot_accuracy@1": 0.8515761418987225, "eval_info_retr_eval_dot_accuracy@10": 0.9441227828324602, "eval_info_retr_eval_dot_accuracy@3": 0.903961032993291, "eval_info_retr_eval_dot_accuracy@5": 0.9217902766289863, "eval_info_retr_eval_dot_map@100": 0.8842285240457468, "eval_info_retr_eval_dot_mrr@10": 0.8822831920502171, "eval_info_retr_eval_dot_ndcg@10": 0.8972070930309096, "eval_info_retr_eval_dot_precision@1": 0.8515761418987225, "eval_info_retr_eval_dot_precision@10": 0.09441227828324604, "eval_info_retr_eval_dot_precision@3": 0.301320344331097, "eval_info_retr_eval_dot_precision@5": 0.18435805532579727, "eval_info_retr_eval_dot_recall@1": 0.8515761418987225, "eval_info_retr_eval_dot_recall@10": 0.9441227828324602, "eval_info_retr_eval_dot_recall@3": 0.903961032993291, "eval_info_retr_eval_dot_recall@5": 0.9217902766289863, "eval_loss": 0.5591671466827393, "eval_para_mine_eval_average_precision": 0.4831713388578378, "eval_para_mine_eval_f1": 0.6178009413060559, "eval_para_mine_eval_precision": 0.7009458839715662, "eval_para_mine_eval_recall": 0.5522893677758556, "eval_para_mine_eval_threshold": 0.860432505607605, "eval_runtime": 46.8519, "eval_samples_per_second": 232.242, "eval_sequential_score": 0.8842285240457468, "eval_steps_per_second": 1.836, "step": 186 }, { "epoch": 0.36524300441826213, "grad_norm": 5.078444004058838, "learning_rate": 4.623128549303046e-05, "loss": 0.5353, "step": 248 }, { "epoch": 0.36524300441826213, "eval_info_retr_eval_dot_accuracy@1": 0.8613178935759581, "eval_info_retr_eval_dot_accuracy@10": 0.9482584321293999, "eval_info_retr_eval_dot_accuracy@3": 0.9126918481757191, "eval_info_retr_eval_dot_accuracy@5": 0.9284073155040897, "eval_info_retr_eval_dot_map@100": 0.8925029461858842, "eval_info_retr_eval_dot_mrr@10": 0.8906325355250079, "eval_info_retr_eval_dot_ndcg@10": 0.9045724071765342, "eval_info_retr_eval_dot_precision@1": 0.8613178935759581, "eval_info_retr_eval_dot_precision@10": 0.09482584321294, "eval_info_retr_eval_dot_precision@3": 0.30423061605857304, "eval_info_retr_eval_dot_precision@5": 0.18568146310081796, "eval_info_retr_eval_dot_recall@1": 0.8613178935759581, "eval_info_retr_eval_dot_recall@10": 0.9482584321293999, "eval_info_retr_eval_dot_recall@3": 0.9126918481757191, "eval_info_retr_eval_dot_recall@5": 0.9284073155040897, "eval_loss": 0.49234136939048767, "eval_para_mine_eval_average_precision": 0.5057185080416585, "eval_para_mine_eval_f1": 0.634543585033742, "eval_para_mine_eval_precision": 0.7090381773055578, "eval_para_mine_eval_recall": 0.5742141802134666, "eval_para_mine_eval_threshold": 0.8692877888679504, "eval_runtime": 46.7669, "eval_samples_per_second": 232.665, "eval_sequential_score": 0.8925029461858842, "eval_steps_per_second": 1.839, "step": 248 }, { "epoch": 0.4565537555228277, "grad_norm": 3.5897247791290283, "learning_rate": 4.463087248322148e-05, "loss": 0.4993, "step": 310 }, { "epoch": 0.4565537555228277, "eval_info_retr_eval_dot_accuracy@1": 0.8651778329197684, "eval_info_retr_eval_dot_accuracy@10": 0.9506479183898539, "eval_info_retr_eval_dot_accuracy@3": 0.9142542045767852, "eval_info_retr_eval_dot_accuracy@5": 0.9308887050822535, "eval_info_retr_eval_dot_map@100": 0.8952610946722075, "eval_info_retr_eval_dot_mrr@10": 0.8935005390202521, "eval_info_retr_eval_dot_ndcg@10": 0.9073002136944609, "eval_info_retr_eval_dot_precision@1": 0.8651778329197684, "eval_info_retr_eval_dot_precision@10": 0.09506479183898539, "eval_info_retr_eval_dot_precision@3": 0.3047514015255951, "eval_info_retr_eval_dot_precision@5": 0.18617774101645068, "eval_info_retr_eval_dot_recall@1": 0.8651778329197684, "eval_info_retr_eval_dot_recall@10": 0.9506479183898539, "eval_info_retr_eval_dot_recall@3": 0.9142542045767852, "eval_info_retr_eval_dot_recall@5": 0.9308887050822535, "eval_loss": 0.49423983693122864, "eval_para_mine_eval_average_precision": 0.5094425990878857, "eval_para_mine_eval_f1": 0.6359308330329982, "eval_para_mine_eval_precision": 0.7193390578495433, "eval_para_mine_eval_recall": 0.5698554154828743, "eval_para_mine_eval_threshold": 0.8585812747478485, "eval_runtime": 47.1777, "eval_samples_per_second": 230.639, "eval_sequential_score": 0.8952610946722075, "eval_steps_per_second": 1.823, "step": 310 }, { "epoch": 0.5478645066273933, "grad_norm": 5.185989856719971, "learning_rate": 4.3030459473412496e-05, "loss": 0.5339, "step": 372 }, { "epoch": 0.5478645066273933, "eval_info_retr_eval_dot_accuracy@1": 0.8665563826854149, "eval_info_retr_eval_dot_accuracy@10": 0.9531293079680176, "eval_info_retr_eval_dot_accuracy@3": 0.9180222406028857, "eval_info_retr_eval_dot_accuracy@5": 0.9335539012958368, "eval_info_retr_eval_dot_map@100": 0.8979226074859789, "eval_info_retr_eval_dot_mrr@10": 0.8961890028198282, "eval_info_retr_eval_dot_ndcg@10": 0.9099837143266869, "eval_info_retr_eval_dot_precision@1": 0.8665563826854149, "eval_info_retr_eval_dot_precision@10": 0.09531293079680178, "eval_info_retr_eval_dot_precision@3": 0.3060074135342952, "eval_info_retr_eval_dot_precision@5": 0.18671078025916735, "eval_info_retr_eval_dot_recall@1": 0.8665563826854149, "eval_info_retr_eval_dot_recall@10": 0.9531293079680176, "eval_info_retr_eval_dot_recall@3": 0.9180222406028857, "eval_info_retr_eval_dot_recall@5": 0.9335539012958368, "eval_loss": 0.46397796273231506, "eval_para_mine_eval_average_precision": 0.5171675614798505, "eval_para_mine_eval_f1": 0.6460162421829887, "eval_para_mine_eval_precision": 0.7083665639212813, "eval_para_mine_eval_recall": 0.5937540933995203, "eval_para_mine_eval_threshold": 0.8755151331424713, "eval_runtime": 47.3437, "eval_samples_per_second": 229.83, "eval_sequential_score": 0.8979226074859789, "eval_steps_per_second": 1.817, "step": 372 }, { "epoch": 0.6391752577319587, "grad_norm": 5.517925262451172, "learning_rate": 4.1430046463603515e-05, "loss": 0.4712, "step": 434 }, { "epoch": 0.6391752577319587, "eval_info_retr_eval_dot_accuracy@1": 0.876114327727231, "eval_info_retr_eval_dot_accuracy@10": 0.9580001838066354, "eval_info_retr_eval_dot_accuracy@3": 0.9218821799466961, "eval_info_retr_eval_dot_accuracy@5": 0.9385166804521643, "eval_info_retr_eval_dot_map@100": 0.9048794424295332, "eval_info_retr_eval_dot_mrr@10": 0.9033319693713965, "eval_info_retr_eval_dot_ndcg@10": 0.9165326554505013, "eval_info_retr_eval_dot_precision@1": 0.876114327727231, "eval_info_retr_eval_dot_precision@10": 0.09580001838066356, "eval_info_retr_eval_dot_precision@3": 0.30729405998223197, "eval_info_retr_eval_dot_precision@5": 0.18770333609043288, "eval_info_retr_eval_dot_recall@1": 0.876114327727231, "eval_info_retr_eval_dot_recall@10": 0.9580001838066354, "eval_info_retr_eval_dot_recall@3": 0.9218821799466961, "eval_info_retr_eval_dot_recall@5": 0.9385166804521643, "eval_loss": 0.43524134159088135, "eval_para_mine_eval_average_precision": 0.5120496793668291, "eval_para_mine_eval_f1": 0.6373077701335491, "eval_para_mine_eval_precision": 0.7241775739076951, "eval_para_mine_eval_recall": 0.5690468985017593, "eval_para_mine_eval_threshold": 0.8673346936702728, "eval_runtime": 47.1044, "eval_samples_per_second": 230.997, "eval_sequential_score": 0.9048794424295332, "eval_steps_per_second": 1.826, "step": 434 }, { "epoch": 0.7304860088365243, "grad_norm": 5.404409408569336, "learning_rate": 3.9829633453794526e-05, "loss": 0.4551, "step": 496 }, { "epoch": 0.7304860088365243, "eval_info_retr_eval_dot_accuracy@1": 0.8799742670710413, "eval_info_retr_eval_dot_accuracy@10": 0.9583677970774745, "eval_info_retr_eval_dot_accuracy@3": 0.9246392794779892, "eval_info_retr_eval_dot_accuracy@5": 0.9411818766657476, "eval_info_retr_eval_dot_map@100": 0.9077432063489332, "eval_info_retr_eval_dot_mrr@10": 0.9062031821888451, "eval_info_retr_eval_dot_ndcg@10": 0.9188197267902801, "eval_info_retr_eval_dot_precision@1": 0.8799742670710413, "eval_info_retr_eval_dot_precision@10": 0.09583677970774747, "eval_info_retr_eval_dot_precision@3": 0.30821309315932965, "eval_info_retr_eval_dot_precision@5": 0.18823637533314955, "eval_info_retr_eval_dot_recall@1": 0.8799742670710413, "eval_info_retr_eval_dot_recall@10": 0.9583677970774745, "eval_info_retr_eval_dot_recall@3": 0.9246392794779892, "eval_info_retr_eval_dot_recall@5": 0.9411818766657476, "eval_loss": 0.43508002161979675, "eval_para_mine_eval_average_precision": 0.5098966109274621, "eval_para_mine_eval_f1": 0.6349388484094101, "eval_para_mine_eval_precision": 0.7090408699915318, "eval_para_mine_eval_recall": 0.5748600904274299, "eval_para_mine_eval_threshold": 0.8756376802921295, "eval_runtime": 46.9049, "eval_samples_per_second": 231.98, "eval_sequential_score": 0.9077432063489332, "eval_steps_per_second": 1.833, "step": 496 }, { "epoch": 0.8217967599410898, "grad_norm": 5.574550151824951, "learning_rate": 3.8229220443985544e-05, "loss": 0.5675, "step": 558 }, { "epoch": 0.8217967599410898, "eval_info_retr_eval_dot_accuracy@1": 0.8838342064148516, "eval_info_retr_eval_dot_accuracy@10": 0.9589192169837331, "eval_info_retr_eval_dot_accuracy@3": 0.9250068927488282, "eval_info_retr_eval_dot_accuracy@5": 0.9407223600771988, "eval_info_retr_eval_dot_map@100": 0.9101926203565123, "eval_info_retr_eval_dot_mrr@10": 0.9085925955101584, "eval_info_retr_eval_dot_ndcg@10": 0.9207315014698775, "eval_info_retr_eval_dot_precision@1": 0.8838342064148516, "eval_info_retr_eval_dot_precision@10": 0.09589192169837332, "eval_info_retr_eval_dot_precision@3": 0.3083356309162761, "eval_info_retr_eval_dot_precision@5": 0.18814447201543977, "eval_info_retr_eval_dot_recall@1": 0.8838342064148516, "eval_info_retr_eval_dot_recall@10": 0.9589192169837331, "eval_info_retr_eval_dot_recall@3": 0.9250068927488282, "eval_info_retr_eval_dot_recall@5": 0.9407223600771988, "eval_loss": 0.4080217182636261, "eval_para_mine_eval_average_precision": 0.5334326202140158, "eval_para_mine_eval_f1": 0.6571024883172905, "eval_para_mine_eval_precision": 0.7344628039218969, "eval_para_mine_eval_recall": 0.5944858238517027, "eval_para_mine_eval_threshold": 0.8824244141578674, "eval_runtime": 46.9444, "eval_samples_per_second": 231.785, "eval_sequential_score": 0.9101926203565123, "eval_steps_per_second": 1.832, "step": 558 }, { "epoch": 0.9131075110456554, "grad_norm": 7.1312103271484375, "learning_rate": 3.662880743417656e-05, "loss": 0.5189, "step": 620 }, { "epoch": 0.9131075110456554, "eval_info_retr_eval_dot_accuracy@1": 0.8812609135189781, "eval_info_retr_eval_dot_accuracy@10": 0.9581839904420549, "eval_info_retr_eval_dot_accuracy@3": 0.9273963790092823, "eval_info_retr_eval_dot_accuracy@5": 0.9409061667126183, "eval_info_retr_eval_dot_map@100": 0.9088995825285359, "eval_info_retr_eval_dot_mrr@10": 0.907332134213855, "eval_info_retr_eval_dot_ndcg@10": 0.9196508765398915, "eval_info_retr_eval_dot_precision@1": 0.8812609135189781, "eval_info_retr_eval_dot_precision@10": 0.09581839904420549, "eval_info_retr_eval_dot_precision@3": 0.3091321263364274, "eval_info_retr_eval_dot_precision@5": 0.1881812333425237, "eval_info_retr_eval_dot_recall@1": 0.8812609135189781, "eval_info_retr_eval_dot_recall@10": 0.9581839904420549, "eval_info_retr_eval_dot_recall@3": 0.9273963790092823, "eval_info_retr_eval_dot_recall@5": 0.9409061667126183, "eval_loss": 0.3979346752166748, "eval_para_mine_eval_average_precision": 0.5429228832902425, "eval_para_mine_eval_f1": 0.6632612084554468, "eval_para_mine_eval_precision": 0.7405866363656618, "eval_para_mine_eval_recall": 0.60055647649203, "eval_para_mine_eval_threshold": 0.8737862706184387, "eval_runtime": 47.0589, "eval_samples_per_second": 231.221, "eval_sequential_score": 0.9088995825285359, "eval_steps_per_second": 1.827, "step": 620 }, { "epoch": 1.004418262150221, "grad_norm": 2.313579559326172, "learning_rate": 3.502839442436758e-05, "loss": 0.4278, "step": 682 }, { "epoch": 1.004418262150221, "eval_info_retr_eval_dot_accuracy@1": 0.886039886039886, "eval_info_retr_eval_dot_accuracy@10": 0.9605734767025089, "eval_info_retr_eval_dot_accuracy@3": 0.9296939619520265, "eval_info_retr_eval_dot_accuracy@5": 0.9435713629262016, "eval_info_retr_eval_dot_map@100": 0.912725086164855, "eval_info_retr_eval_dot_mrr@10": 0.9111236201738, "eval_info_retr_eval_dot_ndcg@10": 0.9230849032296308, "eval_info_retr_eval_dot_precision@1": 0.886039886039886, "eval_info_retr_eval_dot_precision@10": 0.0960573476702509, "eval_info_retr_eval_dot_precision@3": 0.30989798731734214, "eval_info_retr_eval_dot_precision@5": 0.18871427258524037, "eval_info_retr_eval_dot_recall@1": 0.886039886039886, "eval_info_retr_eval_dot_recall@10": 0.9605734767025089, "eval_info_retr_eval_dot_recall@3": 0.9296939619520265, "eval_info_retr_eval_dot_recall@5": 0.9435713629262016, "eval_loss": 0.4062098264694214, "eval_para_mine_eval_average_precision": 0.5569159802538414, "eval_para_mine_eval_f1": 0.6778007972895148, "eval_para_mine_eval_precision": 0.7563934207304859, "eval_para_mine_eval_recall": 0.6140031527645409, "eval_para_mine_eval_threshold": 0.8800513744354248, "eval_runtime": 47.9405, "eval_samples_per_second": 226.969, "eval_sequential_score": 0.912725086164855, "eval_steps_per_second": 1.794, "step": 682 }, { "epoch": 1.0559646539027983, "grad_norm": 3.6702966690063477, "learning_rate": 3.342798141455859e-05, "loss": 0.337, "step": 744 }, { "epoch": 1.0559646539027983, "eval_info_retr_eval_dot_accuracy@1": 0.8869589192169838, "eval_info_retr_eval_dot_accuracy@10": 0.9636981895046411, "eval_info_retr_eval_dot_accuracy@3": 0.9324510614833196, "eval_info_retr_eval_dot_accuracy@5": 0.9460527525043654, "eval_info_retr_eval_dot_map@100": 0.9139823556373721, "eval_info_retr_eval_dot_mrr@10": 0.9125556343298289, "eval_info_retr_eval_dot_ndcg@10": 0.924918869014723, "eval_info_retr_eval_dot_precision@1": 0.8869589192169838, "eval_info_retr_eval_dot_precision@10": 0.09636981895046412, "eval_info_retr_eval_dot_precision@3": 0.31081702049443977, "eval_info_retr_eval_dot_precision@5": 0.1892105505008731, "eval_info_retr_eval_dot_recall@1": 0.8869589192169838, "eval_info_retr_eval_dot_recall@10": 0.9636981895046411, "eval_info_retr_eval_dot_recall@3": 0.9324510614833196, "eval_info_retr_eval_dot_recall@5": 0.9460527525043654, "eval_loss": 0.4025246500968933, "eval_para_mine_eval_average_precision": 0.5442347943347751, "eval_para_mine_eval_f1": 0.6641819581357237, "eval_para_mine_eval_precision": 0.7375383953633291, "eval_para_mine_eval_recall": 0.604097690532221, "eval_para_mine_eval_threshold": 0.8758298754692078, "eval_runtime": 47.2224, "eval_samples_per_second": 230.42, "eval_sequential_score": 0.9139823556373721, "eval_steps_per_second": 1.821, "step": 744 }, { "epoch": 1.1472754050073637, "grad_norm": 3.720041036605835, "learning_rate": 3.182756840474961e-05, "loss": 0.3788, "step": 806 }, { "epoch": 1.1472754050073637, "eval_info_retr_eval_dot_accuracy@1": 0.882455656649205, "eval_info_retr_eval_dot_accuracy@10": 0.9624115430567044, "eval_info_retr_eval_dot_accuracy@3": 0.9284073155040897, "eval_info_retr_eval_dot_accuracy@5": 0.9443984927855895, "eval_info_retr_eval_dot_map@100": 0.9105324753022828, "eval_info_retr_eval_dot_mrr@10": 0.9090466051935585, "eval_info_retr_eval_dot_ndcg@10": 0.9219529245233927, "eval_info_retr_eval_dot_precision@1": 0.882455656649205, "eval_info_retr_eval_dot_precision@10": 0.09624115430567044, "eval_info_retr_eval_dot_precision@3": 0.3094691051680299, "eval_info_retr_eval_dot_precision@5": 0.18887969855711795, "eval_info_retr_eval_dot_recall@1": 0.882455656649205, "eval_info_retr_eval_dot_recall@10": 0.9624115430567044, "eval_info_retr_eval_dot_recall@3": 0.9284073155040897, "eval_info_retr_eval_dot_recall@5": 0.9443984927855895, "eval_loss": 0.38206225633621216, "eval_para_mine_eval_average_precision": 0.5650597252874483, "eval_para_mine_eval_f1": 0.684371051800379, "eval_para_mine_eval_precision": 0.7542356748524652, "eval_para_mine_eval_recall": 0.6263522333587783, "eval_para_mine_eval_threshold": 0.8642670810222626, "eval_runtime": 47.1588, "eval_samples_per_second": 230.731, "eval_sequential_score": 0.9105324753022828, "eval_steps_per_second": 1.824, "step": 806 }, { "epoch": 1.2385861561119293, "grad_norm": 2.3984501361846924, "learning_rate": 3.0227155394940632e-05, "loss": 0.2921, "step": 868 }, { "epoch": 1.2385861561119293, "eval_info_retr_eval_dot_accuracy@1": 0.8853046594982079, "eval_info_retr_eval_dot_accuracy@10": 0.9623196397389946, "eval_info_retr_eval_dot_accuracy@3": 0.9301534785405753, "eval_info_retr_eval_dot_accuracy@5": 0.9438470728793309, "eval_info_retr_eval_dot_map@100": 0.9123716441222456, "eval_info_retr_eval_dot_mrr@10": 0.9109295291194935, "eval_info_retr_eval_dot_ndcg@10": 0.9233517208473251, "eval_info_retr_eval_dot_precision@1": 0.8853046594982079, "eval_info_retr_eval_dot_precision@10": 0.09623196397389946, "eval_info_retr_eval_dot_precision@3": 0.3100511595135251, "eval_info_retr_eval_dot_precision@5": 0.18876941457586618, "eval_info_retr_eval_dot_recall@1": 0.8853046594982079, "eval_info_retr_eval_dot_recall@10": 0.9623196397389946, "eval_info_retr_eval_dot_recall@3": 0.9301534785405753, "eval_info_retr_eval_dot_recall@5": 0.9438470728793309, "eval_loss": 0.38938164710998535, "eval_para_mine_eval_average_precision": 0.562639634596526, "eval_para_mine_eval_f1": 0.6812942943315669, "eval_para_mine_eval_precision": 0.756277142164319, "eval_para_mine_eval_recall": 0.6198389289634271, "eval_para_mine_eval_threshold": 0.8650586903095245, "eval_runtime": 47.164, "eval_samples_per_second": 230.706, "eval_sequential_score": 0.9123716441222456, "eval_steps_per_second": 1.823, "step": 868 }, { "epoch": 1.3298969072164948, "grad_norm": 2.1422321796417236, "learning_rate": 2.862674238513165e-05, "loss": 0.2719, "step": 930 }, { "epoch": 1.3298969072164948, "eval_info_retr_eval_dot_accuracy@1": 0.8885212756180498, "eval_info_retr_eval_dot_accuracy@10": 0.9656281591765463, "eval_info_retr_eval_dot_accuracy@3": 0.9345648377906443, "eval_info_retr_eval_dot_accuracy@5": 0.9500045951658855, "eval_info_retr_eval_dot_map@100": 0.9159948831907755, "eval_info_retr_eval_dot_mrr@10": 0.9146445748596291, "eval_info_retr_eval_dot_ndcg@10": 0.9270088047632189, "eval_info_retr_eval_dot_precision@1": 0.8885212756180498, "eval_info_retr_eval_dot_precision@10": 0.09656281591765466, "eval_info_retr_eval_dot_precision@3": 0.3115216125968814, "eval_info_retr_eval_dot_precision@5": 0.19000091903317715, "eval_info_retr_eval_dot_recall@1": 0.8885212756180498, "eval_info_retr_eval_dot_recall@10": 0.9656281591765463, "eval_info_retr_eval_dot_recall@3": 0.9345648377906443, "eval_info_retr_eval_dot_recall@5": 0.9500045951658855, "eval_loss": 0.3813144862651825, "eval_para_mine_eval_average_precision": 0.5562771586743412, "eval_para_mine_eval_f1": 0.6790739258140527, "eval_para_mine_eval_precision": 0.7701738104240424, "eval_para_mine_eval_recall": 0.6072459382184622, "eval_para_mine_eval_threshold": 0.8749864101409912, "eval_runtime": 46.8836, "eval_samples_per_second": 232.085, "eval_sequential_score": 0.9159948831907755, "eval_steps_per_second": 1.834, "step": 930 }, { "epoch": 1.4212076583210604, "grad_norm": 2.2384369373321533, "learning_rate": 2.702632937532267e-05, "loss": 0.2713, "step": 992 }, { "epoch": 1.4212076583210604, "eval_info_retr_eval_dot_accuracy@1": 0.889256502159728, "eval_info_retr_eval_dot_accuracy@10": 0.9640658027754802, "eval_info_retr_eval_dot_accuracy@3": 0.9335539012958368, "eval_info_retr_eval_dot_accuracy@5": 0.9473393989523021, "eval_info_retr_eval_dot_map@100": 0.9160609261046996, "eval_info_retr_eval_dot_mrr@10": 0.9146857125351749, "eval_info_retr_eval_dot_ndcg@10": 0.9266566721638121, "eval_info_retr_eval_dot_precision@1": 0.889256502159728, "eval_info_retr_eval_dot_precision@10": 0.09640658027754802, "eval_info_retr_eval_dot_precision@3": 0.3111846337652789, "eval_info_retr_eval_dot_precision@5": 0.18946787979046048, "eval_info_retr_eval_dot_recall@1": 0.889256502159728, "eval_info_retr_eval_dot_recall@10": 0.9640658027754802, "eval_info_retr_eval_dot_recall@3": 0.9335539012958368, "eval_info_retr_eval_dot_recall@5": 0.9473393989523021, "eval_loss": 0.379529744386673, "eval_para_mine_eval_average_precision": 0.5652640358968563, "eval_para_mine_eval_f1": 0.6830371726971242, "eval_para_mine_eval_precision": 0.7554402272988553, "eval_para_mine_eval_recall": 0.6232988396200422, "eval_para_mine_eval_threshold": 0.8636217713356018, "eval_runtime": 47.0681, "eval_samples_per_second": 231.176, "eval_sequential_score": 0.9160609261046996, "eval_steps_per_second": 1.827, "step": 992 }, { "epoch": 1.5125184094256259, "grad_norm": 1.37623131275177, "learning_rate": 2.542591636551368e-05, "loss": 0.2498, "step": 1054 }, { "epoch": 1.5125184094256259, "eval_info_retr_eval_dot_accuracy@1": 0.8875103391232424, "eval_info_retr_eval_dot_accuracy@10": 0.9651686425879974, "eval_info_retr_eval_dot_accuracy@3": 0.9322672548479, "eval_info_retr_eval_dot_accuracy@5": 0.9468798823637533, "eval_info_retr_eval_dot_map@100": 0.9147389573171367, "eval_info_retr_eval_dot_mrr@10": 0.9134388179191052, "eval_info_retr_eval_dot_ndcg@10": 0.9259428646968195, "eval_info_retr_eval_dot_precision@1": 0.8875103391232424, "eval_info_retr_eval_dot_precision@10": 0.09651686425879975, "eval_info_retr_eval_dot_precision@3": 0.31075575161596664, "eval_info_retr_eval_dot_precision@5": 0.1893759764727507, "eval_info_retr_eval_dot_recall@1": 0.8875103391232424, "eval_info_retr_eval_dot_recall@10": 0.9651686425879974, "eval_info_retr_eval_dot_recall@3": 0.9322672548479, "eval_info_retr_eval_dot_recall@5": 0.9468798823637533, "eval_loss": 0.3791400194168091, "eval_para_mine_eval_average_precision": 0.5531609578399229, "eval_para_mine_eval_f1": 0.6710056459938674, "eval_para_mine_eval_precision": 0.7802172142925567, "eval_para_mine_eval_recall": 0.5886139128156717, "eval_para_mine_eval_threshold": 0.8832797706127167, "eval_runtime": 46.8924, "eval_samples_per_second": 232.042, "eval_sequential_score": 0.9147389573171367, "eval_steps_per_second": 1.834, "step": 1054 }, { "epoch": 1.6038291605301915, "grad_norm": 3.7942512035369873, "learning_rate": 2.38255033557047e-05, "loss": 0.2785, "step": 1116 }, { "epoch": 1.6038291605301915, "eval_info_retr_eval_dot_accuracy@1": 0.8900836320191159, "eval_info_retr_eval_dot_accuracy@10": 0.9648929326348681, "eval_info_retr_eval_dot_accuracy@3": 0.9332781913427075, "eval_info_retr_eval_dot_accuracy@5": 0.9466960757283338, "eval_info_retr_eval_dot_map@100": 0.9161105864746074, "eval_info_retr_eval_dot_mrr@10": 0.9147435168044494, "eval_info_retr_eval_dot_ndcg@10": 0.9268526071520827, "eval_info_retr_eval_dot_precision@1": 0.8900836320191159, "eval_info_retr_eval_dot_precision@10": 0.09648929326348682, "eval_info_retr_eval_dot_precision@3": 0.31109273044756913, "eval_info_retr_eval_dot_precision@5": 0.1893392151456668, "eval_info_retr_eval_dot_recall@1": 0.8900836320191159, "eval_info_retr_eval_dot_recall@10": 0.9648929326348681, "eval_info_retr_eval_dot_recall@3": 0.9332781913427075, "eval_info_retr_eval_dot_recall@5": 0.9466960757283338, "eval_loss": 0.3756929337978363, "eval_para_mine_eval_average_precision": 0.5534577957590571, "eval_para_mine_eval_f1": 0.6721510117453017, "eval_para_mine_eval_precision": 0.763900548546983, "eval_para_mine_eval_recall": 0.6000776898998613, "eval_para_mine_eval_threshold": 0.8725496828556061, "eval_runtime": 47.1739, "eval_samples_per_second": 230.657, "eval_sequential_score": 0.9161105864746074, "eval_steps_per_second": 1.823, "step": 1116 }, { "epoch": 1.695139911634757, "grad_norm": 2.6778645515441895, "learning_rate": 2.2225090345895717e-05, "loss": 0.2428, "step": 1178 }, { "epoch": 1.695139911634757, "eval_info_retr_eval_dot_accuracy@1": 0.8910945685139233, "eval_info_retr_eval_dot_accuracy@10": 0.9671905155776124, "eval_info_retr_eval_dot_accuracy@3": 0.9344729344729344, "eval_info_retr_eval_dot_accuracy@5": 0.9494531752596269, "eval_info_retr_eval_dot_map@100": 0.9174675014460509, "eval_info_retr_eval_dot_mrr@10": 0.916212365226703, "eval_info_retr_eval_dot_ndcg@10": 0.9285204933191614, "eval_info_retr_eval_dot_precision@1": 0.8910945685139233, "eval_info_retr_eval_dot_precision@10": 0.09671905155776124, "eval_info_retr_eval_dot_precision@3": 0.3114909781576448, "eval_info_retr_eval_dot_precision@5": 0.1898906350519254, "eval_info_retr_eval_dot_recall@1": 0.8910945685139233, "eval_info_retr_eval_dot_recall@10": 0.9671905155776124, "eval_info_retr_eval_dot_recall@3": 0.9344729344729344, "eval_info_retr_eval_dot_recall@5": 0.9494531752596269, "eval_loss": 0.36561650037765503, "eval_para_mine_eval_average_precision": 0.5544895514233957, "eval_para_mine_eval_f1": 0.6734225611719457, "eval_para_mine_eval_precision": 0.7675405136740874, "eval_para_mine_eval_recall": 0.5998653977316356, "eval_para_mine_eval_threshold": 0.8776430785655975, "eval_runtime": 47.0859, "eval_samples_per_second": 231.088, "eval_sequential_score": 0.9174675014460509, "eval_steps_per_second": 1.826, "step": 1178 }, { "epoch": 1.7864506627393224, "grad_norm": 3.110546112060547, "learning_rate": 2.0624677336086735e-05, "loss": 0.2935, "step": 1240 }, { "epoch": 1.7864506627393224, "eval_info_retr_eval_dot_accuracy@1": 0.8924731182795699, "eval_info_retr_eval_dot_accuracy@10": 0.9664552890359343, "eval_info_retr_eval_dot_accuracy@3": 0.9348405477437736, "eval_info_retr_eval_dot_accuracy@5": 0.9497288852127562, "eval_info_retr_eval_dot_map@100": 0.9183095474671825, "eval_info_retr_eval_dot_mrr@10": 0.9169947469230629, "eval_info_retr_eval_dot_ndcg@10": 0.9289448948774749, "eval_info_retr_eval_dot_precision@1": 0.8924731182795699, "eval_info_retr_eval_dot_precision@10": 0.09664552890359342, "eval_info_retr_eval_dot_precision@3": 0.31161351591459113, "eval_info_retr_eval_dot_precision@5": 0.18994577704255125, "eval_info_retr_eval_dot_recall@1": 0.8924731182795699, "eval_info_retr_eval_dot_recall@10": 0.9664552890359343, "eval_info_retr_eval_dot_recall@3": 0.9348405477437736, "eval_info_retr_eval_dot_recall@5": 0.9497288852127562, "eval_loss": 0.36679840087890625, "eval_para_mine_eval_average_precision": 0.5492627712847419, "eval_para_mine_eval_f1": 0.6682617615424452, "eval_para_mine_eval_precision": 0.7445174891126459, "eval_para_mine_eval_recall": 0.6061754436680473, "eval_para_mine_eval_threshold": 0.8671578168869019, "eval_runtime": 47.2606, "eval_samples_per_second": 230.234, "eval_sequential_score": 0.9183095474671825, "eval_steps_per_second": 1.82, "step": 1240 }, { "epoch": 1.877761413843888, "grad_norm": 4.477660655975342, "learning_rate": 1.902426432627775e-05, "loss": 0.2823, "step": 1302 }, { "epoch": 1.877761413843888, "eval_info_retr_eval_dot_accuracy@1": 0.8939435713629262, "eval_info_retr_eval_dot_accuracy@10": 0.9648010293171584, "eval_info_retr_eval_dot_accuracy@3": 0.9359433875562908, "eval_info_retr_eval_dot_accuracy@5": 0.9485341420825292, "eval_info_retr_eval_dot_map@100": 0.9191298943799292, "eval_info_retr_eval_dot_mrr@10": 0.9177682665137863, "eval_info_retr_eval_dot_ndcg@10": 0.9291509217029374, "eval_info_retr_eval_dot_precision@1": 0.8939435713629262, "eval_info_retr_eval_dot_precision@10": 0.09648010293171583, "eval_info_retr_eval_dot_precision@3": 0.3119811291854302, "eval_info_retr_eval_dot_precision@5": 0.18970682841650582, "eval_info_retr_eval_dot_recall@1": 0.8939435713629262, "eval_info_retr_eval_dot_recall@10": 0.9648010293171584, "eval_info_retr_eval_dot_recall@3": 0.9359433875562908, "eval_info_retr_eval_dot_recall@5": 0.9485341420825292, "eval_loss": 0.3716655969619751, "eval_para_mine_eval_average_precision": 0.557578455456071, "eval_para_mine_eval_f1": 0.6753797157651423, "eval_para_mine_eval_precision": 0.7440590076966561, "eval_para_mine_eval_recall": 0.6183077152394159, "eval_para_mine_eval_threshold": 0.863526463508606, "eval_runtime": 46.6942, "eval_samples_per_second": 233.027, "eval_sequential_score": 0.9191298943799292, "eval_steps_per_second": 1.842, "step": 1302 }, { "epoch": 1.9690721649484537, "grad_norm": 4.546482563018799, "learning_rate": 1.742385131646877e-05, "loss": 0.2938, "step": 1364 }, { "epoch": 1.9690721649484537, "eval_info_retr_eval_dot_accuracy@1": 0.8946787979046044, "eval_info_retr_eval_dot_accuracy@10": 0.9646172226817388, "eval_info_retr_eval_dot_accuracy@3": 0.9373219373219374, "eval_info_retr_eval_dot_accuracy@5": 0.9487179487179487, "eval_info_retr_eval_dot_map@100": 0.9200289882479742, "eval_info_retr_eval_dot_mrr@10": 0.9186748635673371, "eval_info_retr_eval_dot_ndcg@10": 0.9298216358313898, "eval_info_retr_eval_dot_precision@1": 0.8946787979046044, "eval_info_retr_eval_dot_precision@10": 0.09646172226817387, "eval_info_retr_eval_dot_precision@3": 0.31244064577397906, "eval_info_retr_eval_dot_precision@5": 0.18974358974358976, "eval_info_retr_eval_dot_recall@1": 0.8946787979046044, "eval_info_retr_eval_dot_recall@10": 0.9646172226817388, "eval_info_retr_eval_dot_recall@3": 0.9373219373219374, "eval_info_retr_eval_dot_recall@5": 0.9487179487179487, "eval_loss": 0.3621634840965271, "eval_para_mine_eval_average_precision": 0.5594570173517496, "eval_para_mine_eval_f1": 0.6766163284568192, "eval_para_mine_eval_precision": 0.7421746515327168, "eval_para_mine_eval_recall": 0.6216998730763845, "eval_para_mine_eval_threshold": 0.8676250278949738, "eval_runtime": 47.3006, "eval_samples_per_second": 230.039, "eval_sequential_score": 0.9200289882479742, "eval_steps_per_second": 1.818, "step": 1364 }, { "epoch": 2.020618556701031, "grad_norm": 3.241508722305298, "learning_rate": 1.5823438306659787e-05, "loss": 0.216, "step": 1426 }, { "epoch": 2.020618556701031, "eval_info_retr_eval_dot_accuracy@1": 0.893208344821248, "eval_info_retr_eval_dot_accuracy@10": 0.9661795790828049, "eval_info_retr_eval_dot_accuracy@3": 0.9362190975094201, "eval_info_retr_eval_dot_accuracy@5": 0.9500964984835952, "eval_info_retr_eval_dot_map@100": 0.9191773519681701, "eval_info_retr_eval_dot_mrr@10": 0.9178556476047521, "eval_info_retr_eval_dot_ndcg@10": 0.9295559143323862, "eval_info_retr_eval_dot_precision@1": 0.893208344821248, "eval_info_retr_eval_dot_precision@10": 0.09661795790828051, "eval_info_retr_eval_dot_precision@3": 0.31207303250314, "eval_info_retr_eval_dot_precision@5": 0.19001929969671905, "eval_info_retr_eval_dot_recall@1": 0.893208344821248, "eval_info_retr_eval_dot_recall@10": 0.9661795790828049, "eval_info_retr_eval_dot_recall@3": 0.9362190975094201, "eval_info_retr_eval_dot_recall@5": 0.9500964984835952, "eval_loss": 0.3684485852718353, "eval_para_mine_eval_average_precision": 0.5665176151429165, "eval_para_mine_eval_f1": 0.6839674754190774, "eval_para_mine_eval_precision": 0.7722483633387889, "eval_para_mine_eval_recall": 0.6137998943056013, "eval_para_mine_eval_threshold": 0.886872798204422, "eval_runtime": 47.5509, "eval_samples_per_second": 228.829, "eval_sequential_score": 0.9191773519681701, "eval_steps_per_second": 1.809, "step": 1426 }, { "epoch": 2.1119293078055965, "grad_norm": 2.4362664222717285, "learning_rate": 1.42230252968508e-05, "loss": 0.2363, "step": 1488 }, { "epoch": 2.1119293078055965, "eval_info_retr_eval_dot_accuracy@1": 0.8943111846337652, "eval_info_retr_eval_dot_accuracy@10": 0.9664552890359343, "eval_info_retr_eval_dot_accuracy@3": 0.9374138406396471, "eval_info_retr_eval_dot_accuracy@5": 0.9490855619887878, "eval_info_retr_eval_dot_map@100": 0.9197752678474642, "eval_info_retr_eval_dot_mrr@10": 0.9185011954725225, "eval_info_retr_eval_dot_ndcg@10": 0.9300922809925127, "eval_info_retr_eval_dot_precision@1": 0.8943111846337652, "eval_info_retr_eval_dot_precision@10": 0.09664552890359342, "eval_info_retr_eval_dot_precision@3": 0.31247128021321563, "eval_info_retr_eval_dot_precision@5": 0.18981711239775756, "eval_info_retr_eval_dot_recall@1": 0.8943111846337652, "eval_info_retr_eval_dot_recall@10": 0.9664552890359343, "eval_info_retr_eval_dot_recall@3": 0.9374138406396471, "eval_info_retr_eval_dot_recall@5": 0.9490855619887878, "eval_loss": 0.36409991979599, "eval_para_mine_eval_average_precision": 0.5680857985845322, "eval_para_mine_eval_f1": 0.6845767174265878, "eval_para_mine_eval_precision": 0.7527188630602916, "eval_para_mine_eval_recall": 0.6277479414434964, "eval_para_mine_eval_threshold": 0.874737024307251, "eval_runtime": 46.8373, "eval_samples_per_second": 232.315, "eval_sequential_score": 0.9197752678474642, "eval_steps_per_second": 1.836, "step": 1488 }, { "epoch": 2.203240058910162, "grad_norm": 1.0034995079040527, "learning_rate": 1.2622612287041818e-05, "loss": 0.2336, "step": 1550 }, { "epoch": 2.203240058910162, "eval_info_retr_eval_dot_accuracy@1": 0.8936678614097969, "eval_info_retr_eval_dot_accuracy@10": 0.9655362558588365, "eval_info_retr_eval_dot_accuracy@3": 0.9360352908740005, "eval_info_retr_eval_dot_accuracy@5": 0.9495450785773366, "eval_info_retr_eval_dot_map@100": 0.9191474148366734, "eval_info_retr_eval_dot_mrr@10": 0.9178338388015818, "eval_info_retr_eval_dot_ndcg@10": 0.9293775519635007, "eval_info_retr_eval_dot_precision@1": 0.8936678614097969, "eval_info_retr_eval_dot_precision@10": 0.09655362558588364, "eval_info_retr_eval_dot_precision@3": 0.31201176362466687, "eval_info_retr_eval_dot_precision@5": 0.18990901571546734, "eval_info_retr_eval_dot_recall@1": 0.8936678614097969, "eval_info_retr_eval_dot_recall@10": 0.9655362558588365, "eval_info_retr_eval_dot_recall@3": 0.9360352908740005, "eval_info_retr_eval_dot_recall@5": 0.9495450785773366, "eval_loss": 0.3632822632789612, "eval_para_mine_eval_average_precision": 0.5695600017649123, "eval_para_mine_eval_f1": 0.6885810689948371, "eval_para_mine_eval_precision": 0.7525360184242944, "eval_para_mine_eval_recall": 0.6346451784835112, "eval_para_mine_eval_threshold": 0.8695259690284729, "eval_runtime": 46.9973, "eval_samples_per_second": 231.524, "eval_sequential_score": 0.9191474148366734, "eval_steps_per_second": 1.83, "step": 1550 }, { "epoch": 2.2945508100147274, "grad_norm": 1.5235002040863037, "learning_rate": 1.1022199277232835e-05, "loss": 0.2065, "step": 1612 }, { "epoch": 2.2945508100147274, "eval_info_retr_eval_dot_accuracy@1": 0.8948626045400239, "eval_info_retr_eval_dot_accuracy@10": 0.9658119658119658, "eval_info_retr_eval_dot_accuracy@3": 0.9364029041448396, "eval_info_retr_eval_dot_accuracy@5": 0.9495450785773366, "eval_info_retr_eval_dot_map@100": 0.9201749271580272, "eval_info_retr_eval_dot_mrr@10": 0.9188280722330898, "eval_info_retr_eval_dot_ndcg@10": 0.9302018390100595, "eval_info_retr_eval_dot_precision@1": 0.8948626045400239, "eval_info_retr_eval_dot_precision@10": 0.09658119658119659, "eval_info_retr_eval_dot_precision@3": 0.3121343013816132, "eval_info_retr_eval_dot_precision@5": 0.18990901571546734, "eval_info_retr_eval_dot_recall@1": 0.8948626045400239, "eval_info_retr_eval_dot_recall@10": 0.9658119658119658, "eval_info_retr_eval_dot_recall@3": 0.9364029041448396, "eval_info_retr_eval_dot_recall@5": 0.9495450785773366, "eval_loss": 0.36156603693962097, "eval_para_mine_eval_average_precision": 0.5665696229109317, "eval_para_mine_eval_f1": 0.6860915092192124, "eval_para_mine_eval_precision": 0.7585999354355094, "eval_para_mine_eval_recall": 0.6262347951380577, "eval_para_mine_eval_threshold": 0.8720309436321259, "eval_runtime": 47.7964, "eval_samples_per_second": 227.653, "eval_sequential_score": 0.9201749271580272, "eval_steps_per_second": 1.799, "step": 1612 }, { "epoch": 2.385861561119293, "grad_norm": 1.445999264717102, "learning_rate": 9.421786267423851e-06, "loss": 0.2083, "step": 1674 }, { "epoch": 2.385861561119293, "eval_info_retr_eval_dot_accuracy@1": 0.8960573476702509, "eval_info_retr_eval_dot_accuracy@10": 0.9659957724473853, "eval_info_retr_eval_dot_accuracy@3": 0.9373219373219374, "eval_info_retr_eval_dot_accuracy@5": 0.9503722084367245, "eval_info_retr_eval_dot_map@100": 0.92104627411852, "eval_info_retr_eval_dot_mrr@10": 0.9196911975585806, "eval_info_retr_eval_dot_ndcg@10": 0.9309142349609268, "eval_info_retr_eval_dot_precision@1": 0.8960573476702509, "eval_info_retr_eval_dot_precision@10": 0.09659957724473853, "eval_info_retr_eval_dot_precision@3": 0.3124406457739791, "eval_info_retr_eval_dot_precision@5": 0.19007444168734494, "eval_info_retr_eval_dot_recall@1": 0.8960573476702509, "eval_info_retr_eval_dot_recall@10": 0.9659957724473853, "eval_info_retr_eval_dot_recall@3": 0.9373219373219374, "eval_info_retr_eval_dot_recall@5": 0.9503722084367245, "eval_loss": 0.358325332403183, "eval_para_mine_eval_average_precision": 0.5714132731149775, "eval_para_mine_eval_f1": 0.6871263293961211, "eval_para_mine_eval_precision": 0.7587332430898214, "eval_para_mine_eval_recall": 0.6278698965188602, "eval_para_mine_eval_threshold": 0.8729398548603058, "eval_runtime": 47.2608, "eval_samples_per_second": 230.233, "eval_sequential_score": 0.92104627411852, "eval_steps_per_second": 1.82, "step": 1674 } ], "logging_steps": 62, "max_steps": 2037, "num_input_tokens_seen": 0, "num_train_epochs": 3, "save_steps": 62, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 0.0, "train_batch_size": 64, "trial_name": null, "trial_params": null }