|
{ |
|
"best_metric": 0.5714132731149775, |
|
"best_model_checkpoint": "models/all-minilm-l6-v2-typosquat-v3.1-gist/checkpoint-1674", |
|
"epoch": 2.385861561119293, |
|
"eval_steps": 62, |
|
"global_step": 1674, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.09131075110456553, |
|
"grad_norm": 17.575565338134766, |
|
"learning_rate": 3e-05, |
|
"loss": 1.9075, |
|
"step": 62 |
|
}, |
|
{ |
|
"epoch": 0.09131075110456553, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8306221854608952, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9250068927488282, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.8876941457586619, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9032258064516129, |
|
"eval_info_retr_eval_dot_map@100": 0.8651529300165571, |
|
"eval_info_retr_eval_dot_mrr@10": 0.8627116876220815, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.8777861364040704, |
|
"eval_info_retr_eval_dot_precision@1": 0.8306221854608952, |
|
"eval_info_retr_eval_dot_precision@10": 0.09250068927488282, |
|
"eval_info_retr_eval_dot_precision@3": 0.2958980485862206, |
|
"eval_info_retr_eval_dot_precision@5": 0.18064516129032257, |
|
"eval_info_retr_eval_dot_recall@1": 0.8306221854608952, |
|
"eval_info_retr_eval_dot_recall@10": 0.9250068927488282, |
|
"eval_info_retr_eval_dot_recall@3": 0.8876941457586619, |
|
"eval_info_retr_eval_dot_recall@5": 0.9032258064516129, |
|
"eval_loss": 0.8926403522491455, |
|
"eval_para_mine_eval_average_precision": 0.4175368476477107, |
|
"eval_para_mine_eval_f1": 0.5608786555511446, |
|
"eval_para_mine_eval_precision": 0.6772723495912615, |
|
"eval_para_mine_eval_recall": 0.4786239854015258, |
|
"eval_para_mine_eval_threshold": 0.7514148652553558, |
|
"eval_runtime": 46.7645, |
|
"eval_samples_per_second": 232.676, |
|
"eval_sequential_score": 0.8651529300165571, |
|
"eval_steps_per_second": 1.839, |
|
"step": 62 |
|
}, |
|
{ |
|
"epoch": 0.18262150220913106, |
|
"grad_norm": 6.875263214111328, |
|
"learning_rate": 4.943211151264843e-05, |
|
"loss": 0.9074, |
|
"step": 124 |
|
}, |
|
{ |
|
"epoch": 0.18262150220913106, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8424777134454554, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9359433875562908, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.8946787979046044, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9126918481757191, |
|
"eval_info_retr_eval_dot_map@100": 0.8756277031952363, |
|
"eval_info_retr_eval_dot_mrr@10": 0.873614557485526, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.8886439257445581, |
|
"eval_info_retr_eval_dot_precision@1": 0.8424777134454554, |
|
"eval_info_retr_eval_dot_precision@10": 0.09359433875562909, |
|
"eval_info_retr_eval_dot_precision@3": 0.2982262659682014, |
|
"eval_info_retr_eval_dot_precision@5": 0.18253836963514383, |
|
"eval_info_retr_eval_dot_recall@1": 0.8424777134454554, |
|
"eval_info_retr_eval_dot_recall@10": 0.9359433875562908, |
|
"eval_info_retr_eval_dot_recall@3": 0.8946787979046044, |
|
"eval_info_retr_eval_dot_recall@5": 0.9126918481757191, |
|
"eval_loss": 0.6083176732063293, |
|
"eval_para_mine_eval_average_precision": 0.458339002373722, |
|
"eval_para_mine_eval_f1": 0.5954711973336655, |
|
"eval_para_mine_eval_precision": 0.6810695759380306, |
|
"eval_para_mine_eval_recall": 0.5289869146720989, |
|
"eval_para_mine_eval_threshold": 0.8661167621612549, |
|
"eval_runtime": 47.222, |
|
"eval_samples_per_second": 230.422, |
|
"eval_sequential_score": 0.8756277031952363, |
|
"eval_steps_per_second": 1.821, |
|
"step": 124 |
|
}, |
|
{ |
|
"epoch": 0.27393225331369664, |
|
"grad_norm": 5.694400787353516, |
|
"learning_rate": 4.783169850283944e-05, |
|
"loss": 0.6272, |
|
"step": 186 |
|
}, |
|
{ |
|
"epoch": 0.27393225331369664, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8515761418987225, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9441227828324602, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.903961032993291, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9217902766289863, |
|
"eval_info_retr_eval_dot_map@100": 0.8842285240457468, |
|
"eval_info_retr_eval_dot_mrr@10": 0.8822831920502171, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.8972070930309096, |
|
"eval_info_retr_eval_dot_precision@1": 0.8515761418987225, |
|
"eval_info_retr_eval_dot_precision@10": 0.09441227828324604, |
|
"eval_info_retr_eval_dot_precision@3": 0.301320344331097, |
|
"eval_info_retr_eval_dot_precision@5": 0.18435805532579727, |
|
"eval_info_retr_eval_dot_recall@1": 0.8515761418987225, |
|
"eval_info_retr_eval_dot_recall@10": 0.9441227828324602, |
|
"eval_info_retr_eval_dot_recall@3": 0.903961032993291, |
|
"eval_info_retr_eval_dot_recall@5": 0.9217902766289863, |
|
"eval_loss": 0.5591671466827393, |
|
"eval_para_mine_eval_average_precision": 0.4831713388578378, |
|
"eval_para_mine_eval_f1": 0.6178009413060559, |
|
"eval_para_mine_eval_precision": 0.7009458839715662, |
|
"eval_para_mine_eval_recall": 0.5522893677758556, |
|
"eval_para_mine_eval_threshold": 0.860432505607605, |
|
"eval_runtime": 46.8519, |
|
"eval_samples_per_second": 232.242, |
|
"eval_sequential_score": 0.8842285240457468, |
|
"eval_steps_per_second": 1.836, |
|
"step": 186 |
|
}, |
|
{ |
|
"epoch": 0.36524300441826213, |
|
"grad_norm": 5.078444004058838, |
|
"learning_rate": 4.623128549303046e-05, |
|
"loss": 0.5353, |
|
"step": 248 |
|
}, |
|
{ |
|
"epoch": 0.36524300441826213, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8613178935759581, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9482584321293999, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9126918481757191, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9284073155040897, |
|
"eval_info_retr_eval_dot_map@100": 0.8925029461858842, |
|
"eval_info_retr_eval_dot_mrr@10": 0.8906325355250079, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9045724071765342, |
|
"eval_info_retr_eval_dot_precision@1": 0.8613178935759581, |
|
"eval_info_retr_eval_dot_precision@10": 0.09482584321294, |
|
"eval_info_retr_eval_dot_precision@3": 0.30423061605857304, |
|
"eval_info_retr_eval_dot_precision@5": 0.18568146310081796, |
|
"eval_info_retr_eval_dot_recall@1": 0.8613178935759581, |
|
"eval_info_retr_eval_dot_recall@10": 0.9482584321293999, |
|
"eval_info_retr_eval_dot_recall@3": 0.9126918481757191, |
|
"eval_info_retr_eval_dot_recall@5": 0.9284073155040897, |
|
"eval_loss": 0.49234136939048767, |
|
"eval_para_mine_eval_average_precision": 0.5057185080416585, |
|
"eval_para_mine_eval_f1": 0.634543585033742, |
|
"eval_para_mine_eval_precision": 0.7090381773055578, |
|
"eval_para_mine_eval_recall": 0.5742141802134666, |
|
"eval_para_mine_eval_threshold": 0.8692877888679504, |
|
"eval_runtime": 46.7669, |
|
"eval_samples_per_second": 232.665, |
|
"eval_sequential_score": 0.8925029461858842, |
|
"eval_steps_per_second": 1.839, |
|
"step": 248 |
|
}, |
|
{ |
|
"epoch": 0.4565537555228277, |
|
"grad_norm": 3.5897247791290283, |
|
"learning_rate": 4.463087248322148e-05, |
|
"loss": 0.4993, |
|
"step": 310 |
|
}, |
|
{ |
|
"epoch": 0.4565537555228277, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8651778329197684, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9506479183898539, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9142542045767852, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9308887050822535, |
|
"eval_info_retr_eval_dot_map@100": 0.8952610946722075, |
|
"eval_info_retr_eval_dot_mrr@10": 0.8935005390202521, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9073002136944609, |
|
"eval_info_retr_eval_dot_precision@1": 0.8651778329197684, |
|
"eval_info_retr_eval_dot_precision@10": 0.09506479183898539, |
|
"eval_info_retr_eval_dot_precision@3": 0.3047514015255951, |
|
"eval_info_retr_eval_dot_precision@5": 0.18617774101645068, |
|
"eval_info_retr_eval_dot_recall@1": 0.8651778329197684, |
|
"eval_info_retr_eval_dot_recall@10": 0.9506479183898539, |
|
"eval_info_retr_eval_dot_recall@3": 0.9142542045767852, |
|
"eval_info_retr_eval_dot_recall@5": 0.9308887050822535, |
|
"eval_loss": 0.49423983693122864, |
|
"eval_para_mine_eval_average_precision": 0.5094425990878857, |
|
"eval_para_mine_eval_f1": 0.6359308330329982, |
|
"eval_para_mine_eval_precision": 0.7193390578495433, |
|
"eval_para_mine_eval_recall": 0.5698554154828743, |
|
"eval_para_mine_eval_threshold": 0.8585812747478485, |
|
"eval_runtime": 47.1777, |
|
"eval_samples_per_second": 230.639, |
|
"eval_sequential_score": 0.8952610946722075, |
|
"eval_steps_per_second": 1.823, |
|
"step": 310 |
|
}, |
|
{ |
|
"epoch": 0.5478645066273933, |
|
"grad_norm": 5.185989856719971, |
|
"learning_rate": 4.3030459473412496e-05, |
|
"loss": 0.5339, |
|
"step": 372 |
|
}, |
|
{ |
|
"epoch": 0.5478645066273933, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8665563826854149, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9531293079680176, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9180222406028857, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9335539012958368, |
|
"eval_info_retr_eval_dot_map@100": 0.8979226074859789, |
|
"eval_info_retr_eval_dot_mrr@10": 0.8961890028198282, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9099837143266869, |
|
"eval_info_retr_eval_dot_precision@1": 0.8665563826854149, |
|
"eval_info_retr_eval_dot_precision@10": 0.09531293079680178, |
|
"eval_info_retr_eval_dot_precision@3": 0.3060074135342952, |
|
"eval_info_retr_eval_dot_precision@5": 0.18671078025916735, |
|
"eval_info_retr_eval_dot_recall@1": 0.8665563826854149, |
|
"eval_info_retr_eval_dot_recall@10": 0.9531293079680176, |
|
"eval_info_retr_eval_dot_recall@3": 0.9180222406028857, |
|
"eval_info_retr_eval_dot_recall@5": 0.9335539012958368, |
|
"eval_loss": 0.46397796273231506, |
|
"eval_para_mine_eval_average_precision": 0.5171675614798505, |
|
"eval_para_mine_eval_f1": 0.6460162421829887, |
|
"eval_para_mine_eval_precision": 0.7083665639212813, |
|
"eval_para_mine_eval_recall": 0.5937540933995203, |
|
"eval_para_mine_eval_threshold": 0.8755151331424713, |
|
"eval_runtime": 47.3437, |
|
"eval_samples_per_second": 229.83, |
|
"eval_sequential_score": 0.8979226074859789, |
|
"eval_steps_per_second": 1.817, |
|
"step": 372 |
|
}, |
|
{ |
|
"epoch": 0.6391752577319587, |
|
"grad_norm": 5.517925262451172, |
|
"learning_rate": 4.1430046463603515e-05, |
|
"loss": 0.4712, |
|
"step": 434 |
|
}, |
|
{ |
|
"epoch": 0.6391752577319587, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.876114327727231, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9580001838066354, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9218821799466961, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9385166804521643, |
|
"eval_info_retr_eval_dot_map@100": 0.9048794424295332, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9033319693713965, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9165326554505013, |
|
"eval_info_retr_eval_dot_precision@1": 0.876114327727231, |
|
"eval_info_retr_eval_dot_precision@10": 0.09580001838066356, |
|
"eval_info_retr_eval_dot_precision@3": 0.30729405998223197, |
|
"eval_info_retr_eval_dot_precision@5": 0.18770333609043288, |
|
"eval_info_retr_eval_dot_recall@1": 0.876114327727231, |
|
"eval_info_retr_eval_dot_recall@10": 0.9580001838066354, |
|
"eval_info_retr_eval_dot_recall@3": 0.9218821799466961, |
|
"eval_info_retr_eval_dot_recall@5": 0.9385166804521643, |
|
"eval_loss": 0.43524134159088135, |
|
"eval_para_mine_eval_average_precision": 0.5120496793668291, |
|
"eval_para_mine_eval_f1": 0.6373077701335491, |
|
"eval_para_mine_eval_precision": 0.7241775739076951, |
|
"eval_para_mine_eval_recall": 0.5690468985017593, |
|
"eval_para_mine_eval_threshold": 0.8673346936702728, |
|
"eval_runtime": 47.1044, |
|
"eval_samples_per_second": 230.997, |
|
"eval_sequential_score": 0.9048794424295332, |
|
"eval_steps_per_second": 1.826, |
|
"step": 434 |
|
}, |
|
{ |
|
"epoch": 0.7304860088365243, |
|
"grad_norm": 5.404409408569336, |
|
"learning_rate": 3.9829633453794526e-05, |
|
"loss": 0.4551, |
|
"step": 496 |
|
}, |
|
{ |
|
"epoch": 0.7304860088365243, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8799742670710413, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9583677970774745, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9246392794779892, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9411818766657476, |
|
"eval_info_retr_eval_dot_map@100": 0.9077432063489332, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9062031821888451, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9188197267902801, |
|
"eval_info_retr_eval_dot_precision@1": 0.8799742670710413, |
|
"eval_info_retr_eval_dot_precision@10": 0.09583677970774747, |
|
"eval_info_retr_eval_dot_precision@3": 0.30821309315932965, |
|
"eval_info_retr_eval_dot_precision@5": 0.18823637533314955, |
|
"eval_info_retr_eval_dot_recall@1": 0.8799742670710413, |
|
"eval_info_retr_eval_dot_recall@10": 0.9583677970774745, |
|
"eval_info_retr_eval_dot_recall@3": 0.9246392794779892, |
|
"eval_info_retr_eval_dot_recall@5": 0.9411818766657476, |
|
"eval_loss": 0.43508002161979675, |
|
"eval_para_mine_eval_average_precision": 0.5098966109274621, |
|
"eval_para_mine_eval_f1": 0.6349388484094101, |
|
"eval_para_mine_eval_precision": 0.7090408699915318, |
|
"eval_para_mine_eval_recall": 0.5748600904274299, |
|
"eval_para_mine_eval_threshold": 0.8756376802921295, |
|
"eval_runtime": 46.9049, |
|
"eval_samples_per_second": 231.98, |
|
"eval_sequential_score": 0.9077432063489332, |
|
"eval_steps_per_second": 1.833, |
|
"step": 496 |
|
}, |
|
{ |
|
"epoch": 0.8217967599410898, |
|
"grad_norm": 5.574550151824951, |
|
"learning_rate": 3.8229220443985544e-05, |
|
"loss": 0.5675, |
|
"step": 558 |
|
}, |
|
{ |
|
"epoch": 0.8217967599410898, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8838342064148516, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9589192169837331, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9250068927488282, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9407223600771988, |
|
"eval_info_retr_eval_dot_map@100": 0.9101926203565123, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9085925955101584, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9207315014698775, |
|
"eval_info_retr_eval_dot_precision@1": 0.8838342064148516, |
|
"eval_info_retr_eval_dot_precision@10": 0.09589192169837332, |
|
"eval_info_retr_eval_dot_precision@3": 0.3083356309162761, |
|
"eval_info_retr_eval_dot_precision@5": 0.18814447201543977, |
|
"eval_info_retr_eval_dot_recall@1": 0.8838342064148516, |
|
"eval_info_retr_eval_dot_recall@10": 0.9589192169837331, |
|
"eval_info_retr_eval_dot_recall@3": 0.9250068927488282, |
|
"eval_info_retr_eval_dot_recall@5": 0.9407223600771988, |
|
"eval_loss": 0.4080217182636261, |
|
"eval_para_mine_eval_average_precision": 0.5334326202140158, |
|
"eval_para_mine_eval_f1": 0.6571024883172905, |
|
"eval_para_mine_eval_precision": 0.7344628039218969, |
|
"eval_para_mine_eval_recall": 0.5944858238517027, |
|
"eval_para_mine_eval_threshold": 0.8824244141578674, |
|
"eval_runtime": 46.9444, |
|
"eval_samples_per_second": 231.785, |
|
"eval_sequential_score": 0.9101926203565123, |
|
"eval_steps_per_second": 1.832, |
|
"step": 558 |
|
}, |
|
{ |
|
"epoch": 0.9131075110456554, |
|
"grad_norm": 7.1312103271484375, |
|
"learning_rate": 3.662880743417656e-05, |
|
"loss": 0.5189, |
|
"step": 620 |
|
}, |
|
{ |
|
"epoch": 0.9131075110456554, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8812609135189781, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9581839904420549, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9273963790092823, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9409061667126183, |
|
"eval_info_retr_eval_dot_map@100": 0.9088995825285359, |
|
"eval_info_retr_eval_dot_mrr@10": 0.907332134213855, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9196508765398915, |
|
"eval_info_retr_eval_dot_precision@1": 0.8812609135189781, |
|
"eval_info_retr_eval_dot_precision@10": 0.09581839904420549, |
|
"eval_info_retr_eval_dot_precision@3": 0.3091321263364274, |
|
"eval_info_retr_eval_dot_precision@5": 0.1881812333425237, |
|
"eval_info_retr_eval_dot_recall@1": 0.8812609135189781, |
|
"eval_info_retr_eval_dot_recall@10": 0.9581839904420549, |
|
"eval_info_retr_eval_dot_recall@3": 0.9273963790092823, |
|
"eval_info_retr_eval_dot_recall@5": 0.9409061667126183, |
|
"eval_loss": 0.3979346752166748, |
|
"eval_para_mine_eval_average_precision": 0.5429228832902425, |
|
"eval_para_mine_eval_f1": 0.6632612084554468, |
|
"eval_para_mine_eval_precision": 0.7405866363656618, |
|
"eval_para_mine_eval_recall": 0.60055647649203, |
|
"eval_para_mine_eval_threshold": 0.8737862706184387, |
|
"eval_runtime": 47.0589, |
|
"eval_samples_per_second": 231.221, |
|
"eval_sequential_score": 0.9088995825285359, |
|
"eval_steps_per_second": 1.827, |
|
"step": 620 |
|
}, |
|
{ |
|
"epoch": 1.004418262150221, |
|
"grad_norm": 2.313579559326172, |
|
"learning_rate": 3.502839442436758e-05, |
|
"loss": 0.4278, |
|
"step": 682 |
|
}, |
|
{ |
|
"epoch": 1.004418262150221, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.886039886039886, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9605734767025089, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9296939619520265, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9435713629262016, |
|
"eval_info_retr_eval_dot_map@100": 0.912725086164855, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9111236201738, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9230849032296308, |
|
"eval_info_retr_eval_dot_precision@1": 0.886039886039886, |
|
"eval_info_retr_eval_dot_precision@10": 0.0960573476702509, |
|
"eval_info_retr_eval_dot_precision@3": 0.30989798731734214, |
|
"eval_info_retr_eval_dot_precision@5": 0.18871427258524037, |
|
"eval_info_retr_eval_dot_recall@1": 0.886039886039886, |
|
"eval_info_retr_eval_dot_recall@10": 0.9605734767025089, |
|
"eval_info_retr_eval_dot_recall@3": 0.9296939619520265, |
|
"eval_info_retr_eval_dot_recall@5": 0.9435713629262016, |
|
"eval_loss": 0.4062098264694214, |
|
"eval_para_mine_eval_average_precision": 0.5569159802538414, |
|
"eval_para_mine_eval_f1": 0.6778007972895148, |
|
"eval_para_mine_eval_precision": 0.7563934207304859, |
|
"eval_para_mine_eval_recall": 0.6140031527645409, |
|
"eval_para_mine_eval_threshold": 0.8800513744354248, |
|
"eval_runtime": 47.9405, |
|
"eval_samples_per_second": 226.969, |
|
"eval_sequential_score": 0.912725086164855, |
|
"eval_steps_per_second": 1.794, |
|
"step": 682 |
|
}, |
|
{ |
|
"epoch": 1.0559646539027983, |
|
"grad_norm": 3.6702966690063477, |
|
"learning_rate": 3.342798141455859e-05, |
|
"loss": 0.337, |
|
"step": 744 |
|
}, |
|
{ |
|
"epoch": 1.0559646539027983, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8869589192169838, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9636981895046411, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9324510614833196, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9460527525043654, |
|
"eval_info_retr_eval_dot_map@100": 0.9139823556373721, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9125556343298289, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.924918869014723, |
|
"eval_info_retr_eval_dot_precision@1": 0.8869589192169838, |
|
"eval_info_retr_eval_dot_precision@10": 0.09636981895046412, |
|
"eval_info_retr_eval_dot_precision@3": 0.31081702049443977, |
|
"eval_info_retr_eval_dot_precision@5": 0.1892105505008731, |
|
"eval_info_retr_eval_dot_recall@1": 0.8869589192169838, |
|
"eval_info_retr_eval_dot_recall@10": 0.9636981895046411, |
|
"eval_info_retr_eval_dot_recall@3": 0.9324510614833196, |
|
"eval_info_retr_eval_dot_recall@5": 0.9460527525043654, |
|
"eval_loss": 0.4025246500968933, |
|
"eval_para_mine_eval_average_precision": 0.5442347943347751, |
|
"eval_para_mine_eval_f1": 0.6641819581357237, |
|
"eval_para_mine_eval_precision": 0.7375383953633291, |
|
"eval_para_mine_eval_recall": 0.604097690532221, |
|
"eval_para_mine_eval_threshold": 0.8758298754692078, |
|
"eval_runtime": 47.2224, |
|
"eval_samples_per_second": 230.42, |
|
"eval_sequential_score": 0.9139823556373721, |
|
"eval_steps_per_second": 1.821, |
|
"step": 744 |
|
}, |
|
{ |
|
"epoch": 1.1472754050073637, |
|
"grad_norm": 3.720041036605835, |
|
"learning_rate": 3.182756840474961e-05, |
|
"loss": 0.3788, |
|
"step": 806 |
|
}, |
|
{ |
|
"epoch": 1.1472754050073637, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.882455656649205, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9624115430567044, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9284073155040897, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9443984927855895, |
|
"eval_info_retr_eval_dot_map@100": 0.9105324753022828, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9090466051935585, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9219529245233927, |
|
"eval_info_retr_eval_dot_precision@1": 0.882455656649205, |
|
"eval_info_retr_eval_dot_precision@10": 0.09624115430567044, |
|
"eval_info_retr_eval_dot_precision@3": 0.3094691051680299, |
|
"eval_info_retr_eval_dot_precision@5": 0.18887969855711795, |
|
"eval_info_retr_eval_dot_recall@1": 0.882455656649205, |
|
"eval_info_retr_eval_dot_recall@10": 0.9624115430567044, |
|
"eval_info_retr_eval_dot_recall@3": 0.9284073155040897, |
|
"eval_info_retr_eval_dot_recall@5": 0.9443984927855895, |
|
"eval_loss": 0.38206225633621216, |
|
"eval_para_mine_eval_average_precision": 0.5650597252874483, |
|
"eval_para_mine_eval_f1": 0.684371051800379, |
|
"eval_para_mine_eval_precision": 0.7542356748524652, |
|
"eval_para_mine_eval_recall": 0.6263522333587783, |
|
"eval_para_mine_eval_threshold": 0.8642670810222626, |
|
"eval_runtime": 47.1588, |
|
"eval_samples_per_second": 230.731, |
|
"eval_sequential_score": 0.9105324753022828, |
|
"eval_steps_per_second": 1.824, |
|
"step": 806 |
|
}, |
|
{ |
|
"epoch": 1.2385861561119293, |
|
"grad_norm": 2.3984501361846924, |
|
"learning_rate": 3.0227155394940632e-05, |
|
"loss": 0.2921, |
|
"step": 868 |
|
}, |
|
{ |
|
"epoch": 1.2385861561119293, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8853046594982079, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9623196397389946, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9301534785405753, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9438470728793309, |
|
"eval_info_retr_eval_dot_map@100": 0.9123716441222456, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9109295291194935, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9233517208473251, |
|
"eval_info_retr_eval_dot_precision@1": 0.8853046594982079, |
|
"eval_info_retr_eval_dot_precision@10": 0.09623196397389946, |
|
"eval_info_retr_eval_dot_precision@3": 0.3100511595135251, |
|
"eval_info_retr_eval_dot_precision@5": 0.18876941457586618, |
|
"eval_info_retr_eval_dot_recall@1": 0.8853046594982079, |
|
"eval_info_retr_eval_dot_recall@10": 0.9623196397389946, |
|
"eval_info_retr_eval_dot_recall@3": 0.9301534785405753, |
|
"eval_info_retr_eval_dot_recall@5": 0.9438470728793309, |
|
"eval_loss": 0.38938164710998535, |
|
"eval_para_mine_eval_average_precision": 0.562639634596526, |
|
"eval_para_mine_eval_f1": 0.6812942943315669, |
|
"eval_para_mine_eval_precision": 0.756277142164319, |
|
"eval_para_mine_eval_recall": 0.6198389289634271, |
|
"eval_para_mine_eval_threshold": 0.8650586903095245, |
|
"eval_runtime": 47.164, |
|
"eval_samples_per_second": 230.706, |
|
"eval_sequential_score": 0.9123716441222456, |
|
"eval_steps_per_second": 1.823, |
|
"step": 868 |
|
}, |
|
{ |
|
"epoch": 1.3298969072164948, |
|
"grad_norm": 2.1422321796417236, |
|
"learning_rate": 2.862674238513165e-05, |
|
"loss": 0.2719, |
|
"step": 930 |
|
}, |
|
{ |
|
"epoch": 1.3298969072164948, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8885212756180498, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9656281591765463, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9345648377906443, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9500045951658855, |
|
"eval_info_retr_eval_dot_map@100": 0.9159948831907755, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9146445748596291, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9270088047632189, |
|
"eval_info_retr_eval_dot_precision@1": 0.8885212756180498, |
|
"eval_info_retr_eval_dot_precision@10": 0.09656281591765466, |
|
"eval_info_retr_eval_dot_precision@3": 0.3115216125968814, |
|
"eval_info_retr_eval_dot_precision@5": 0.19000091903317715, |
|
"eval_info_retr_eval_dot_recall@1": 0.8885212756180498, |
|
"eval_info_retr_eval_dot_recall@10": 0.9656281591765463, |
|
"eval_info_retr_eval_dot_recall@3": 0.9345648377906443, |
|
"eval_info_retr_eval_dot_recall@5": 0.9500045951658855, |
|
"eval_loss": 0.3813144862651825, |
|
"eval_para_mine_eval_average_precision": 0.5562771586743412, |
|
"eval_para_mine_eval_f1": 0.6790739258140527, |
|
"eval_para_mine_eval_precision": 0.7701738104240424, |
|
"eval_para_mine_eval_recall": 0.6072459382184622, |
|
"eval_para_mine_eval_threshold": 0.8749864101409912, |
|
"eval_runtime": 46.8836, |
|
"eval_samples_per_second": 232.085, |
|
"eval_sequential_score": 0.9159948831907755, |
|
"eval_steps_per_second": 1.834, |
|
"step": 930 |
|
}, |
|
{ |
|
"epoch": 1.4212076583210604, |
|
"grad_norm": 2.2384369373321533, |
|
"learning_rate": 2.702632937532267e-05, |
|
"loss": 0.2713, |
|
"step": 992 |
|
}, |
|
{ |
|
"epoch": 1.4212076583210604, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.889256502159728, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9640658027754802, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9335539012958368, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9473393989523021, |
|
"eval_info_retr_eval_dot_map@100": 0.9160609261046996, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9146857125351749, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9266566721638121, |
|
"eval_info_retr_eval_dot_precision@1": 0.889256502159728, |
|
"eval_info_retr_eval_dot_precision@10": 0.09640658027754802, |
|
"eval_info_retr_eval_dot_precision@3": 0.3111846337652789, |
|
"eval_info_retr_eval_dot_precision@5": 0.18946787979046048, |
|
"eval_info_retr_eval_dot_recall@1": 0.889256502159728, |
|
"eval_info_retr_eval_dot_recall@10": 0.9640658027754802, |
|
"eval_info_retr_eval_dot_recall@3": 0.9335539012958368, |
|
"eval_info_retr_eval_dot_recall@5": 0.9473393989523021, |
|
"eval_loss": 0.379529744386673, |
|
"eval_para_mine_eval_average_precision": 0.5652640358968563, |
|
"eval_para_mine_eval_f1": 0.6830371726971242, |
|
"eval_para_mine_eval_precision": 0.7554402272988553, |
|
"eval_para_mine_eval_recall": 0.6232988396200422, |
|
"eval_para_mine_eval_threshold": 0.8636217713356018, |
|
"eval_runtime": 47.0681, |
|
"eval_samples_per_second": 231.176, |
|
"eval_sequential_score": 0.9160609261046996, |
|
"eval_steps_per_second": 1.827, |
|
"step": 992 |
|
}, |
|
{ |
|
"epoch": 1.5125184094256259, |
|
"grad_norm": 1.37623131275177, |
|
"learning_rate": 2.542591636551368e-05, |
|
"loss": 0.2498, |
|
"step": 1054 |
|
}, |
|
{ |
|
"epoch": 1.5125184094256259, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8875103391232424, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9651686425879974, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9322672548479, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9468798823637533, |
|
"eval_info_retr_eval_dot_map@100": 0.9147389573171367, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9134388179191052, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9259428646968195, |
|
"eval_info_retr_eval_dot_precision@1": 0.8875103391232424, |
|
"eval_info_retr_eval_dot_precision@10": 0.09651686425879975, |
|
"eval_info_retr_eval_dot_precision@3": 0.31075575161596664, |
|
"eval_info_retr_eval_dot_precision@5": 0.1893759764727507, |
|
"eval_info_retr_eval_dot_recall@1": 0.8875103391232424, |
|
"eval_info_retr_eval_dot_recall@10": 0.9651686425879974, |
|
"eval_info_retr_eval_dot_recall@3": 0.9322672548479, |
|
"eval_info_retr_eval_dot_recall@5": 0.9468798823637533, |
|
"eval_loss": 0.3791400194168091, |
|
"eval_para_mine_eval_average_precision": 0.5531609578399229, |
|
"eval_para_mine_eval_f1": 0.6710056459938674, |
|
"eval_para_mine_eval_precision": 0.7802172142925567, |
|
"eval_para_mine_eval_recall": 0.5886139128156717, |
|
"eval_para_mine_eval_threshold": 0.8832797706127167, |
|
"eval_runtime": 46.8924, |
|
"eval_samples_per_second": 232.042, |
|
"eval_sequential_score": 0.9147389573171367, |
|
"eval_steps_per_second": 1.834, |
|
"step": 1054 |
|
}, |
|
{ |
|
"epoch": 1.6038291605301915, |
|
"grad_norm": 3.7942512035369873, |
|
"learning_rate": 2.38255033557047e-05, |
|
"loss": 0.2785, |
|
"step": 1116 |
|
}, |
|
{ |
|
"epoch": 1.6038291605301915, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8900836320191159, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9648929326348681, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9332781913427075, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9466960757283338, |
|
"eval_info_retr_eval_dot_map@100": 0.9161105864746074, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9147435168044494, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9268526071520827, |
|
"eval_info_retr_eval_dot_precision@1": 0.8900836320191159, |
|
"eval_info_retr_eval_dot_precision@10": 0.09648929326348682, |
|
"eval_info_retr_eval_dot_precision@3": 0.31109273044756913, |
|
"eval_info_retr_eval_dot_precision@5": 0.1893392151456668, |
|
"eval_info_retr_eval_dot_recall@1": 0.8900836320191159, |
|
"eval_info_retr_eval_dot_recall@10": 0.9648929326348681, |
|
"eval_info_retr_eval_dot_recall@3": 0.9332781913427075, |
|
"eval_info_retr_eval_dot_recall@5": 0.9466960757283338, |
|
"eval_loss": 0.3756929337978363, |
|
"eval_para_mine_eval_average_precision": 0.5534577957590571, |
|
"eval_para_mine_eval_f1": 0.6721510117453017, |
|
"eval_para_mine_eval_precision": 0.763900548546983, |
|
"eval_para_mine_eval_recall": 0.6000776898998613, |
|
"eval_para_mine_eval_threshold": 0.8725496828556061, |
|
"eval_runtime": 47.1739, |
|
"eval_samples_per_second": 230.657, |
|
"eval_sequential_score": 0.9161105864746074, |
|
"eval_steps_per_second": 1.823, |
|
"step": 1116 |
|
}, |
|
{ |
|
"epoch": 1.695139911634757, |
|
"grad_norm": 2.6778645515441895, |
|
"learning_rate": 2.2225090345895717e-05, |
|
"loss": 0.2428, |
|
"step": 1178 |
|
}, |
|
{ |
|
"epoch": 1.695139911634757, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8910945685139233, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9671905155776124, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9344729344729344, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9494531752596269, |
|
"eval_info_retr_eval_dot_map@100": 0.9174675014460509, |
|
"eval_info_retr_eval_dot_mrr@10": 0.916212365226703, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9285204933191614, |
|
"eval_info_retr_eval_dot_precision@1": 0.8910945685139233, |
|
"eval_info_retr_eval_dot_precision@10": 0.09671905155776124, |
|
"eval_info_retr_eval_dot_precision@3": 0.3114909781576448, |
|
"eval_info_retr_eval_dot_precision@5": 0.1898906350519254, |
|
"eval_info_retr_eval_dot_recall@1": 0.8910945685139233, |
|
"eval_info_retr_eval_dot_recall@10": 0.9671905155776124, |
|
"eval_info_retr_eval_dot_recall@3": 0.9344729344729344, |
|
"eval_info_retr_eval_dot_recall@5": 0.9494531752596269, |
|
"eval_loss": 0.36561650037765503, |
|
"eval_para_mine_eval_average_precision": 0.5544895514233957, |
|
"eval_para_mine_eval_f1": 0.6734225611719457, |
|
"eval_para_mine_eval_precision": 0.7675405136740874, |
|
"eval_para_mine_eval_recall": 0.5998653977316356, |
|
"eval_para_mine_eval_threshold": 0.8776430785655975, |
|
"eval_runtime": 47.0859, |
|
"eval_samples_per_second": 231.088, |
|
"eval_sequential_score": 0.9174675014460509, |
|
"eval_steps_per_second": 1.826, |
|
"step": 1178 |
|
}, |
|
{ |
|
"epoch": 1.7864506627393224, |
|
"grad_norm": 3.110546112060547, |
|
"learning_rate": 2.0624677336086735e-05, |
|
"loss": 0.2935, |
|
"step": 1240 |
|
}, |
|
{ |
|
"epoch": 1.7864506627393224, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8924731182795699, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9664552890359343, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9348405477437736, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9497288852127562, |
|
"eval_info_retr_eval_dot_map@100": 0.9183095474671825, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9169947469230629, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9289448948774749, |
|
"eval_info_retr_eval_dot_precision@1": 0.8924731182795699, |
|
"eval_info_retr_eval_dot_precision@10": 0.09664552890359342, |
|
"eval_info_retr_eval_dot_precision@3": 0.31161351591459113, |
|
"eval_info_retr_eval_dot_precision@5": 0.18994577704255125, |
|
"eval_info_retr_eval_dot_recall@1": 0.8924731182795699, |
|
"eval_info_retr_eval_dot_recall@10": 0.9664552890359343, |
|
"eval_info_retr_eval_dot_recall@3": 0.9348405477437736, |
|
"eval_info_retr_eval_dot_recall@5": 0.9497288852127562, |
|
"eval_loss": 0.36679840087890625, |
|
"eval_para_mine_eval_average_precision": 0.5492627712847419, |
|
"eval_para_mine_eval_f1": 0.6682617615424452, |
|
"eval_para_mine_eval_precision": 0.7445174891126459, |
|
"eval_para_mine_eval_recall": 0.6061754436680473, |
|
"eval_para_mine_eval_threshold": 0.8671578168869019, |
|
"eval_runtime": 47.2606, |
|
"eval_samples_per_second": 230.234, |
|
"eval_sequential_score": 0.9183095474671825, |
|
"eval_steps_per_second": 1.82, |
|
"step": 1240 |
|
}, |
|
{ |
|
"epoch": 1.877761413843888, |
|
"grad_norm": 4.477660655975342, |
|
"learning_rate": 1.902426432627775e-05, |
|
"loss": 0.2823, |
|
"step": 1302 |
|
}, |
|
{ |
|
"epoch": 1.877761413843888, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8939435713629262, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9648010293171584, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9359433875562908, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9485341420825292, |
|
"eval_info_retr_eval_dot_map@100": 0.9191298943799292, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9177682665137863, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9291509217029374, |
|
"eval_info_retr_eval_dot_precision@1": 0.8939435713629262, |
|
"eval_info_retr_eval_dot_precision@10": 0.09648010293171583, |
|
"eval_info_retr_eval_dot_precision@3": 0.3119811291854302, |
|
"eval_info_retr_eval_dot_precision@5": 0.18970682841650582, |
|
"eval_info_retr_eval_dot_recall@1": 0.8939435713629262, |
|
"eval_info_retr_eval_dot_recall@10": 0.9648010293171584, |
|
"eval_info_retr_eval_dot_recall@3": 0.9359433875562908, |
|
"eval_info_retr_eval_dot_recall@5": 0.9485341420825292, |
|
"eval_loss": 0.3716655969619751, |
|
"eval_para_mine_eval_average_precision": 0.557578455456071, |
|
"eval_para_mine_eval_f1": 0.6753797157651423, |
|
"eval_para_mine_eval_precision": 0.7440590076966561, |
|
"eval_para_mine_eval_recall": 0.6183077152394159, |
|
"eval_para_mine_eval_threshold": 0.863526463508606, |
|
"eval_runtime": 46.6942, |
|
"eval_samples_per_second": 233.027, |
|
"eval_sequential_score": 0.9191298943799292, |
|
"eval_steps_per_second": 1.842, |
|
"step": 1302 |
|
}, |
|
{ |
|
"epoch": 1.9690721649484537, |
|
"grad_norm": 4.546482563018799, |
|
"learning_rate": 1.742385131646877e-05, |
|
"loss": 0.2938, |
|
"step": 1364 |
|
}, |
|
{ |
|
"epoch": 1.9690721649484537, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8946787979046044, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9646172226817388, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9373219373219374, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9487179487179487, |
|
"eval_info_retr_eval_dot_map@100": 0.9200289882479742, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9186748635673371, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9298216358313898, |
|
"eval_info_retr_eval_dot_precision@1": 0.8946787979046044, |
|
"eval_info_retr_eval_dot_precision@10": 0.09646172226817387, |
|
"eval_info_retr_eval_dot_precision@3": 0.31244064577397906, |
|
"eval_info_retr_eval_dot_precision@5": 0.18974358974358976, |
|
"eval_info_retr_eval_dot_recall@1": 0.8946787979046044, |
|
"eval_info_retr_eval_dot_recall@10": 0.9646172226817388, |
|
"eval_info_retr_eval_dot_recall@3": 0.9373219373219374, |
|
"eval_info_retr_eval_dot_recall@5": 0.9487179487179487, |
|
"eval_loss": 0.3621634840965271, |
|
"eval_para_mine_eval_average_precision": 0.5594570173517496, |
|
"eval_para_mine_eval_f1": 0.6766163284568192, |
|
"eval_para_mine_eval_precision": 0.7421746515327168, |
|
"eval_para_mine_eval_recall": 0.6216998730763845, |
|
"eval_para_mine_eval_threshold": 0.8676250278949738, |
|
"eval_runtime": 47.3006, |
|
"eval_samples_per_second": 230.039, |
|
"eval_sequential_score": 0.9200289882479742, |
|
"eval_steps_per_second": 1.818, |
|
"step": 1364 |
|
}, |
|
{ |
|
"epoch": 2.020618556701031, |
|
"grad_norm": 3.241508722305298, |
|
"learning_rate": 1.5823438306659787e-05, |
|
"loss": 0.216, |
|
"step": 1426 |
|
}, |
|
{ |
|
"epoch": 2.020618556701031, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.893208344821248, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9661795790828049, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9362190975094201, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9500964984835952, |
|
"eval_info_retr_eval_dot_map@100": 0.9191773519681701, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9178556476047521, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9295559143323862, |
|
"eval_info_retr_eval_dot_precision@1": 0.893208344821248, |
|
"eval_info_retr_eval_dot_precision@10": 0.09661795790828051, |
|
"eval_info_retr_eval_dot_precision@3": 0.31207303250314, |
|
"eval_info_retr_eval_dot_precision@5": 0.19001929969671905, |
|
"eval_info_retr_eval_dot_recall@1": 0.893208344821248, |
|
"eval_info_retr_eval_dot_recall@10": 0.9661795790828049, |
|
"eval_info_retr_eval_dot_recall@3": 0.9362190975094201, |
|
"eval_info_retr_eval_dot_recall@5": 0.9500964984835952, |
|
"eval_loss": 0.3684485852718353, |
|
"eval_para_mine_eval_average_precision": 0.5665176151429165, |
|
"eval_para_mine_eval_f1": 0.6839674754190774, |
|
"eval_para_mine_eval_precision": 0.7722483633387889, |
|
"eval_para_mine_eval_recall": 0.6137998943056013, |
|
"eval_para_mine_eval_threshold": 0.886872798204422, |
|
"eval_runtime": 47.5509, |
|
"eval_samples_per_second": 228.829, |
|
"eval_sequential_score": 0.9191773519681701, |
|
"eval_steps_per_second": 1.809, |
|
"step": 1426 |
|
}, |
|
{ |
|
"epoch": 2.1119293078055965, |
|
"grad_norm": 2.4362664222717285, |
|
"learning_rate": 1.42230252968508e-05, |
|
"loss": 0.2363, |
|
"step": 1488 |
|
}, |
|
{ |
|
"epoch": 2.1119293078055965, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8943111846337652, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9664552890359343, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9374138406396471, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9490855619887878, |
|
"eval_info_retr_eval_dot_map@100": 0.9197752678474642, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9185011954725225, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9300922809925127, |
|
"eval_info_retr_eval_dot_precision@1": 0.8943111846337652, |
|
"eval_info_retr_eval_dot_precision@10": 0.09664552890359342, |
|
"eval_info_retr_eval_dot_precision@3": 0.31247128021321563, |
|
"eval_info_retr_eval_dot_precision@5": 0.18981711239775756, |
|
"eval_info_retr_eval_dot_recall@1": 0.8943111846337652, |
|
"eval_info_retr_eval_dot_recall@10": 0.9664552890359343, |
|
"eval_info_retr_eval_dot_recall@3": 0.9374138406396471, |
|
"eval_info_retr_eval_dot_recall@5": 0.9490855619887878, |
|
"eval_loss": 0.36409991979599, |
|
"eval_para_mine_eval_average_precision": 0.5680857985845322, |
|
"eval_para_mine_eval_f1": 0.6845767174265878, |
|
"eval_para_mine_eval_precision": 0.7527188630602916, |
|
"eval_para_mine_eval_recall": 0.6277479414434964, |
|
"eval_para_mine_eval_threshold": 0.874737024307251, |
|
"eval_runtime": 46.8373, |
|
"eval_samples_per_second": 232.315, |
|
"eval_sequential_score": 0.9197752678474642, |
|
"eval_steps_per_second": 1.836, |
|
"step": 1488 |
|
}, |
|
{ |
|
"epoch": 2.203240058910162, |
|
"grad_norm": 1.0034995079040527, |
|
"learning_rate": 1.2622612287041818e-05, |
|
"loss": 0.2336, |
|
"step": 1550 |
|
}, |
|
{ |
|
"epoch": 2.203240058910162, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8936678614097969, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9655362558588365, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9360352908740005, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9495450785773366, |
|
"eval_info_retr_eval_dot_map@100": 0.9191474148366734, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9178338388015818, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9293775519635007, |
|
"eval_info_retr_eval_dot_precision@1": 0.8936678614097969, |
|
"eval_info_retr_eval_dot_precision@10": 0.09655362558588364, |
|
"eval_info_retr_eval_dot_precision@3": 0.31201176362466687, |
|
"eval_info_retr_eval_dot_precision@5": 0.18990901571546734, |
|
"eval_info_retr_eval_dot_recall@1": 0.8936678614097969, |
|
"eval_info_retr_eval_dot_recall@10": 0.9655362558588365, |
|
"eval_info_retr_eval_dot_recall@3": 0.9360352908740005, |
|
"eval_info_retr_eval_dot_recall@5": 0.9495450785773366, |
|
"eval_loss": 0.3632822632789612, |
|
"eval_para_mine_eval_average_precision": 0.5695600017649123, |
|
"eval_para_mine_eval_f1": 0.6885810689948371, |
|
"eval_para_mine_eval_precision": 0.7525360184242944, |
|
"eval_para_mine_eval_recall": 0.6346451784835112, |
|
"eval_para_mine_eval_threshold": 0.8695259690284729, |
|
"eval_runtime": 46.9973, |
|
"eval_samples_per_second": 231.524, |
|
"eval_sequential_score": 0.9191474148366734, |
|
"eval_steps_per_second": 1.83, |
|
"step": 1550 |
|
}, |
|
{ |
|
"epoch": 2.2945508100147274, |
|
"grad_norm": 1.5235002040863037, |
|
"learning_rate": 1.1022199277232835e-05, |
|
"loss": 0.2065, |
|
"step": 1612 |
|
}, |
|
{ |
|
"epoch": 2.2945508100147274, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8948626045400239, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9658119658119658, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9364029041448396, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9495450785773366, |
|
"eval_info_retr_eval_dot_map@100": 0.9201749271580272, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9188280722330898, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9302018390100595, |
|
"eval_info_retr_eval_dot_precision@1": 0.8948626045400239, |
|
"eval_info_retr_eval_dot_precision@10": 0.09658119658119659, |
|
"eval_info_retr_eval_dot_precision@3": 0.3121343013816132, |
|
"eval_info_retr_eval_dot_precision@5": 0.18990901571546734, |
|
"eval_info_retr_eval_dot_recall@1": 0.8948626045400239, |
|
"eval_info_retr_eval_dot_recall@10": 0.9658119658119658, |
|
"eval_info_retr_eval_dot_recall@3": 0.9364029041448396, |
|
"eval_info_retr_eval_dot_recall@5": 0.9495450785773366, |
|
"eval_loss": 0.36156603693962097, |
|
"eval_para_mine_eval_average_precision": 0.5665696229109317, |
|
"eval_para_mine_eval_f1": 0.6860915092192124, |
|
"eval_para_mine_eval_precision": 0.7585999354355094, |
|
"eval_para_mine_eval_recall": 0.6262347951380577, |
|
"eval_para_mine_eval_threshold": 0.8720309436321259, |
|
"eval_runtime": 47.7964, |
|
"eval_samples_per_second": 227.653, |
|
"eval_sequential_score": 0.9201749271580272, |
|
"eval_steps_per_second": 1.799, |
|
"step": 1612 |
|
}, |
|
{ |
|
"epoch": 2.385861561119293, |
|
"grad_norm": 1.445999264717102, |
|
"learning_rate": 9.421786267423851e-06, |
|
"loss": 0.2083, |
|
"step": 1674 |
|
}, |
|
{ |
|
"epoch": 2.385861561119293, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.8960573476702509, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9659957724473853, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9373219373219374, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9503722084367245, |
|
"eval_info_retr_eval_dot_map@100": 0.92104627411852, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9196911975585806, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9309142349609268, |
|
"eval_info_retr_eval_dot_precision@1": 0.8960573476702509, |
|
"eval_info_retr_eval_dot_precision@10": 0.09659957724473853, |
|
"eval_info_retr_eval_dot_precision@3": 0.3124406457739791, |
|
"eval_info_retr_eval_dot_precision@5": 0.19007444168734494, |
|
"eval_info_retr_eval_dot_recall@1": 0.8960573476702509, |
|
"eval_info_retr_eval_dot_recall@10": 0.9659957724473853, |
|
"eval_info_retr_eval_dot_recall@3": 0.9373219373219374, |
|
"eval_info_retr_eval_dot_recall@5": 0.9503722084367245, |
|
"eval_loss": 0.358325332403183, |
|
"eval_para_mine_eval_average_precision": 0.5714132731149775, |
|
"eval_para_mine_eval_f1": 0.6871263293961211, |
|
"eval_para_mine_eval_precision": 0.7587332430898214, |
|
"eval_para_mine_eval_recall": 0.6278698965188602, |
|
"eval_para_mine_eval_threshold": 0.8729398548603058, |
|
"eval_runtime": 47.2608, |
|
"eval_samples_per_second": 230.233, |
|
"eval_sequential_score": 0.92104627411852, |
|
"eval_steps_per_second": 1.82, |
|
"step": 1674 |
|
} |
|
], |
|
"logging_steps": 62, |
|
"max_steps": 2037, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 3, |
|
"save_steps": 62, |
|
"stateful_callbacks": { |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": false |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 0.0, |
|
"train_batch_size": 64, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|