chgrdj's picture
Upload 14 files
02137df verified
{
"best_metric": 0.5714132731149775,
"best_model_checkpoint": "models/all-minilm-l6-v2-typosquat-v3.1-gist/checkpoint-1674",
"epoch": 2.385861561119293,
"eval_steps": 62,
"global_step": 1674,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.09131075110456553,
"grad_norm": 17.575565338134766,
"learning_rate": 3e-05,
"loss": 1.9075,
"step": 62
},
{
"epoch": 0.09131075110456553,
"eval_info_retr_eval_dot_accuracy@1": 0.8306221854608952,
"eval_info_retr_eval_dot_accuracy@10": 0.9250068927488282,
"eval_info_retr_eval_dot_accuracy@3": 0.8876941457586619,
"eval_info_retr_eval_dot_accuracy@5": 0.9032258064516129,
"eval_info_retr_eval_dot_map@100": 0.8651529300165571,
"eval_info_retr_eval_dot_mrr@10": 0.8627116876220815,
"eval_info_retr_eval_dot_ndcg@10": 0.8777861364040704,
"eval_info_retr_eval_dot_precision@1": 0.8306221854608952,
"eval_info_retr_eval_dot_precision@10": 0.09250068927488282,
"eval_info_retr_eval_dot_precision@3": 0.2958980485862206,
"eval_info_retr_eval_dot_precision@5": 0.18064516129032257,
"eval_info_retr_eval_dot_recall@1": 0.8306221854608952,
"eval_info_retr_eval_dot_recall@10": 0.9250068927488282,
"eval_info_retr_eval_dot_recall@3": 0.8876941457586619,
"eval_info_retr_eval_dot_recall@5": 0.9032258064516129,
"eval_loss": 0.8926403522491455,
"eval_para_mine_eval_average_precision": 0.4175368476477107,
"eval_para_mine_eval_f1": 0.5608786555511446,
"eval_para_mine_eval_precision": 0.6772723495912615,
"eval_para_mine_eval_recall": 0.4786239854015258,
"eval_para_mine_eval_threshold": 0.7514148652553558,
"eval_runtime": 46.7645,
"eval_samples_per_second": 232.676,
"eval_sequential_score": 0.8651529300165571,
"eval_steps_per_second": 1.839,
"step": 62
},
{
"epoch": 0.18262150220913106,
"grad_norm": 6.875263214111328,
"learning_rate": 4.943211151264843e-05,
"loss": 0.9074,
"step": 124
},
{
"epoch": 0.18262150220913106,
"eval_info_retr_eval_dot_accuracy@1": 0.8424777134454554,
"eval_info_retr_eval_dot_accuracy@10": 0.9359433875562908,
"eval_info_retr_eval_dot_accuracy@3": 0.8946787979046044,
"eval_info_retr_eval_dot_accuracy@5": 0.9126918481757191,
"eval_info_retr_eval_dot_map@100": 0.8756277031952363,
"eval_info_retr_eval_dot_mrr@10": 0.873614557485526,
"eval_info_retr_eval_dot_ndcg@10": 0.8886439257445581,
"eval_info_retr_eval_dot_precision@1": 0.8424777134454554,
"eval_info_retr_eval_dot_precision@10": 0.09359433875562909,
"eval_info_retr_eval_dot_precision@3": 0.2982262659682014,
"eval_info_retr_eval_dot_precision@5": 0.18253836963514383,
"eval_info_retr_eval_dot_recall@1": 0.8424777134454554,
"eval_info_retr_eval_dot_recall@10": 0.9359433875562908,
"eval_info_retr_eval_dot_recall@3": 0.8946787979046044,
"eval_info_retr_eval_dot_recall@5": 0.9126918481757191,
"eval_loss": 0.6083176732063293,
"eval_para_mine_eval_average_precision": 0.458339002373722,
"eval_para_mine_eval_f1": 0.5954711973336655,
"eval_para_mine_eval_precision": 0.6810695759380306,
"eval_para_mine_eval_recall": 0.5289869146720989,
"eval_para_mine_eval_threshold": 0.8661167621612549,
"eval_runtime": 47.222,
"eval_samples_per_second": 230.422,
"eval_sequential_score": 0.8756277031952363,
"eval_steps_per_second": 1.821,
"step": 124
},
{
"epoch": 0.27393225331369664,
"grad_norm": 5.694400787353516,
"learning_rate": 4.783169850283944e-05,
"loss": 0.6272,
"step": 186
},
{
"epoch": 0.27393225331369664,
"eval_info_retr_eval_dot_accuracy@1": 0.8515761418987225,
"eval_info_retr_eval_dot_accuracy@10": 0.9441227828324602,
"eval_info_retr_eval_dot_accuracy@3": 0.903961032993291,
"eval_info_retr_eval_dot_accuracy@5": 0.9217902766289863,
"eval_info_retr_eval_dot_map@100": 0.8842285240457468,
"eval_info_retr_eval_dot_mrr@10": 0.8822831920502171,
"eval_info_retr_eval_dot_ndcg@10": 0.8972070930309096,
"eval_info_retr_eval_dot_precision@1": 0.8515761418987225,
"eval_info_retr_eval_dot_precision@10": 0.09441227828324604,
"eval_info_retr_eval_dot_precision@3": 0.301320344331097,
"eval_info_retr_eval_dot_precision@5": 0.18435805532579727,
"eval_info_retr_eval_dot_recall@1": 0.8515761418987225,
"eval_info_retr_eval_dot_recall@10": 0.9441227828324602,
"eval_info_retr_eval_dot_recall@3": 0.903961032993291,
"eval_info_retr_eval_dot_recall@5": 0.9217902766289863,
"eval_loss": 0.5591671466827393,
"eval_para_mine_eval_average_precision": 0.4831713388578378,
"eval_para_mine_eval_f1": 0.6178009413060559,
"eval_para_mine_eval_precision": 0.7009458839715662,
"eval_para_mine_eval_recall": 0.5522893677758556,
"eval_para_mine_eval_threshold": 0.860432505607605,
"eval_runtime": 46.8519,
"eval_samples_per_second": 232.242,
"eval_sequential_score": 0.8842285240457468,
"eval_steps_per_second": 1.836,
"step": 186
},
{
"epoch": 0.36524300441826213,
"grad_norm": 5.078444004058838,
"learning_rate": 4.623128549303046e-05,
"loss": 0.5353,
"step": 248
},
{
"epoch": 0.36524300441826213,
"eval_info_retr_eval_dot_accuracy@1": 0.8613178935759581,
"eval_info_retr_eval_dot_accuracy@10": 0.9482584321293999,
"eval_info_retr_eval_dot_accuracy@3": 0.9126918481757191,
"eval_info_retr_eval_dot_accuracy@5": 0.9284073155040897,
"eval_info_retr_eval_dot_map@100": 0.8925029461858842,
"eval_info_retr_eval_dot_mrr@10": 0.8906325355250079,
"eval_info_retr_eval_dot_ndcg@10": 0.9045724071765342,
"eval_info_retr_eval_dot_precision@1": 0.8613178935759581,
"eval_info_retr_eval_dot_precision@10": 0.09482584321294,
"eval_info_retr_eval_dot_precision@3": 0.30423061605857304,
"eval_info_retr_eval_dot_precision@5": 0.18568146310081796,
"eval_info_retr_eval_dot_recall@1": 0.8613178935759581,
"eval_info_retr_eval_dot_recall@10": 0.9482584321293999,
"eval_info_retr_eval_dot_recall@3": 0.9126918481757191,
"eval_info_retr_eval_dot_recall@5": 0.9284073155040897,
"eval_loss": 0.49234136939048767,
"eval_para_mine_eval_average_precision": 0.5057185080416585,
"eval_para_mine_eval_f1": 0.634543585033742,
"eval_para_mine_eval_precision": 0.7090381773055578,
"eval_para_mine_eval_recall": 0.5742141802134666,
"eval_para_mine_eval_threshold": 0.8692877888679504,
"eval_runtime": 46.7669,
"eval_samples_per_second": 232.665,
"eval_sequential_score": 0.8925029461858842,
"eval_steps_per_second": 1.839,
"step": 248
},
{
"epoch": 0.4565537555228277,
"grad_norm": 3.5897247791290283,
"learning_rate": 4.463087248322148e-05,
"loss": 0.4993,
"step": 310
},
{
"epoch": 0.4565537555228277,
"eval_info_retr_eval_dot_accuracy@1": 0.8651778329197684,
"eval_info_retr_eval_dot_accuracy@10": 0.9506479183898539,
"eval_info_retr_eval_dot_accuracy@3": 0.9142542045767852,
"eval_info_retr_eval_dot_accuracy@5": 0.9308887050822535,
"eval_info_retr_eval_dot_map@100": 0.8952610946722075,
"eval_info_retr_eval_dot_mrr@10": 0.8935005390202521,
"eval_info_retr_eval_dot_ndcg@10": 0.9073002136944609,
"eval_info_retr_eval_dot_precision@1": 0.8651778329197684,
"eval_info_retr_eval_dot_precision@10": 0.09506479183898539,
"eval_info_retr_eval_dot_precision@3": 0.3047514015255951,
"eval_info_retr_eval_dot_precision@5": 0.18617774101645068,
"eval_info_retr_eval_dot_recall@1": 0.8651778329197684,
"eval_info_retr_eval_dot_recall@10": 0.9506479183898539,
"eval_info_retr_eval_dot_recall@3": 0.9142542045767852,
"eval_info_retr_eval_dot_recall@5": 0.9308887050822535,
"eval_loss": 0.49423983693122864,
"eval_para_mine_eval_average_precision": 0.5094425990878857,
"eval_para_mine_eval_f1": 0.6359308330329982,
"eval_para_mine_eval_precision": 0.7193390578495433,
"eval_para_mine_eval_recall": 0.5698554154828743,
"eval_para_mine_eval_threshold": 0.8585812747478485,
"eval_runtime": 47.1777,
"eval_samples_per_second": 230.639,
"eval_sequential_score": 0.8952610946722075,
"eval_steps_per_second": 1.823,
"step": 310
},
{
"epoch": 0.5478645066273933,
"grad_norm": 5.185989856719971,
"learning_rate": 4.3030459473412496e-05,
"loss": 0.5339,
"step": 372
},
{
"epoch": 0.5478645066273933,
"eval_info_retr_eval_dot_accuracy@1": 0.8665563826854149,
"eval_info_retr_eval_dot_accuracy@10": 0.9531293079680176,
"eval_info_retr_eval_dot_accuracy@3": 0.9180222406028857,
"eval_info_retr_eval_dot_accuracy@5": 0.9335539012958368,
"eval_info_retr_eval_dot_map@100": 0.8979226074859789,
"eval_info_retr_eval_dot_mrr@10": 0.8961890028198282,
"eval_info_retr_eval_dot_ndcg@10": 0.9099837143266869,
"eval_info_retr_eval_dot_precision@1": 0.8665563826854149,
"eval_info_retr_eval_dot_precision@10": 0.09531293079680178,
"eval_info_retr_eval_dot_precision@3": 0.3060074135342952,
"eval_info_retr_eval_dot_precision@5": 0.18671078025916735,
"eval_info_retr_eval_dot_recall@1": 0.8665563826854149,
"eval_info_retr_eval_dot_recall@10": 0.9531293079680176,
"eval_info_retr_eval_dot_recall@3": 0.9180222406028857,
"eval_info_retr_eval_dot_recall@5": 0.9335539012958368,
"eval_loss": 0.46397796273231506,
"eval_para_mine_eval_average_precision": 0.5171675614798505,
"eval_para_mine_eval_f1": 0.6460162421829887,
"eval_para_mine_eval_precision": 0.7083665639212813,
"eval_para_mine_eval_recall": 0.5937540933995203,
"eval_para_mine_eval_threshold": 0.8755151331424713,
"eval_runtime": 47.3437,
"eval_samples_per_second": 229.83,
"eval_sequential_score": 0.8979226074859789,
"eval_steps_per_second": 1.817,
"step": 372
},
{
"epoch": 0.6391752577319587,
"grad_norm": 5.517925262451172,
"learning_rate": 4.1430046463603515e-05,
"loss": 0.4712,
"step": 434
},
{
"epoch": 0.6391752577319587,
"eval_info_retr_eval_dot_accuracy@1": 0.876114327727231,
"eval_info_retr_eval_dot_accuracy@10": 0.9580001838066354,
"eval_info_retr_eval_dot_accuracy@3": 0.9218821799466961,
"eval_info_retr_eval_dot_accuracy@5": 0.9385166804521643,
"eval_info_retr_eval_dot_map@100": 0.9048794424295332,
"eval_info_retr_eval_dot_mrr@10": 0.9033319693713965,
"eval_info_retr_eval_dot_ndcg@10": 0.9165326554505013,
"eval_info_retr_eval_dot_precision@1": 0.876114327727231,
"eval_info_retr_eval_dot_precision@10": 0.09580001838066356,
"eval_info_retr_eval_dot_precision@3": 0.30729405998223197,
"eval_info_retr_eval_dot_precision@5": 0.18770333609043288,
"eval_info_retr_eval_dot_recall@1": 0.876114327727231,
"eval_info_retr_eval_dot_recall@10": 0.9580001838066354,
"eval_info_retr_eval_dot_recall@3": 0.9218821799466961,
"eval_info_retr_eval_dot_recall@5": 0.9385166804521643,
"eval_loss": 0.43524134159088135,
"eval_para_mine_eval_average_precision": 0.5120496793668291,
"eval_para_mine_eval_f1": 0.6373077701335491,
"eval_para_mine_eval_precision": 0.7241775739076951,
"eval_para_mine_eval_recall": 0.5690468985017593,
"eval_para_mine_eval_threshold": 0.8673346936702728,
"eval_runtime": 47.1044,
"eval_samples_per_second": 230.997,
"eval_sequential_score": 0.9048794424295332,
"eval_steps_per_second": 1.826,
"step": 434
},
{
"epoch": 0.7304860088365243,
"grad_norm": 5.404409408569336,
"learning_rate": 3.9829633453794526e-05,
"loss": 0.4551,
"step": 496
},
{
"epoch": 0.7304860088365243,
"eval_info_retr_eval_dot_accuracy@1": 0.8799742670710413,
"eval_info_retr_eval_dot_accuracy@10": 0.9583677970774745,
"eval_info_retr_eval_dot_accuracy@3": 0.9246392794779892,
"eval_info_retr_eval_dot_accuracy@5": 0.9411818766657476,
"eval_info_retr_eval_dot_map@100": 0.9077432063489332,
"eval_info_retr_eval_dot_mrr@10": 0.9062031821888451,
"eval_info_retr_eval_dot_ndcg@10": 0.9188197267902801,
"eval_info_retr_eval_dot_precision@1": 0.8799742670710413,
"eval_info_retr_eval_dot_precision@10": 0.09583677970774747,
"eval_info_retr_eval_dot_precision@3": 0.30821309315932965,
"eval_info_retr_eval_dot_precision@5": 0.18823637533314955,
"eval_info_retr_eval_dot_recall@1": 0.8799742670710413,
"eval_info_retr_eval_dot_recall@10": 0.9583677970774745,
"eval_info_retr_eval_dot_recall@3": 0.9246392794779892,
"eval_info_retr_eval_dot_recall@5": 0.9411818766657476,
"eval_loss": 0.43508002161979675,
"eval_para_mine_eval_average_precision": 0.5098966109274621,
"eval_para_mine_eval_f1": 0.6349388484094101,
"eval_para_mine_eval_precision": 0.7090408699915318,
"eval_para_mine_eval_recall": 0.5748600904274299,
"eval_para_mine_eval_threshold": 0.8756376802921295,
"eval_runtime": 46.9049,
"eval_samples_per_second": 231.98,
"eval_sequential_score": 0.9077432063489332,
"eval_steps_per_second": 1.833,
"step": 496
},
{
"epoch": 0.8217967599410898,
"grad_norm": 5.574550151824951,
"learning_rate": 3.8229220443985544e-05,
"loss": 0.5675,
"step": 558
},
{
"epoch": 0.8217967599410898,
"eval_info_retr_eval_dot_accuracy@1": 0.8838342064148516,
"eval_info_retr_eval_dot_accuracy@10": 0.9589192169837331,
"eval_info_retr_eval_dot_accuracy@3": 0.9250068927488282,
"eval_info_retr_eval_dot_accuracy@5": 0.9407223600771988,
"eval_info_retr_eval_dot_map@100": 0.9101926203565123,
"eval_info_retr_eval_dot_mrr@10": 0.9085925955101584,
"eval_info_retr_eval_dot_ndcg@10": 0.9207315014698775,
"eval_info_retr_eval_dot_precision@1": 0.8838342064148516,
"eval_info_retr_eval_dot_precision@10": 0.09589192169837332,
"eval_info_retr_eval_dot_precision@3": 0.3083356309162761,
"eval_info_retr_eval_dot_precision@5": 0.18814447201543977,
"eval_info_retr_eval_dot_recall@1": 0.8838342064148516,
"eval_info_retr_eval_dot_recall@10": 0.9589192169837331,
"eval_info_retr_eval_dot_recall@3": 0.9250068927488282,
"eval_info_retr_eval_dot_recall@5": 0.9407223600771988,
"eval_loss": 0.4080217182636261,
"eval_para_mine_eval_average_precision": 0.5334326202140158,
"eval_para_mine_eval_f1": 0.6571024883172905,
"eval_para_mine_eval_precision": 0.7344628039218969,
"eval_para_mine_eval_recall": 0.5944858238517027,
"eval_para_mine_eval_threshold": 0.8824244141578674,
"eval_runtime": 46.9444,
"eval_samples_per_second": 231.785,
"eval_sequential_score": 0.9101926203565123,
"eval_steps_per_second": 1.832,
"step": 558
},
{
"epoch": 0.9131075110456554,
"grad_norm": 7.1312103271484375,
"learning_rate": 3.662880743417656e-05,
"loss": 0.5189,
"step": 620
},
{
"epoch": 0.9131075110456554,
"eval_info_retr_eval_dot_accuracy@1": 0.8812609135189781,
"eval_info_retr_eval_dot_accuracy@10": 0.9581839904420549,
"eval_info_retr_eval_dot_accuracy@3": 0.9273963790092823,
"eval_info_retr_eval_dot_accuracy@5": 0.9409061667126183,
"eval_info_retr_eval_dot_map@100": 0.9088995825285359,
"eval_info_retr_eval_dot_mrr@10": 0.907332134213855,
"eval_info_retr_eval_dot_ndcg@10": 0.9196508765398915,
"eval_info_retr_eval_dot_precision@1": 0.8812609135189781,
"eval_info_retr_eval_dot_precision@10": 0.09581839904420549,
"eval_info_retr_eval_dot_precision@3": 0.3091321263364274,
"eval_info_retr_eval_dot_precision@5": 0.1881812333425237,
"eval_info_retr_eval_dot_recall@1": 0.8812609135189781,
"eval_info_retr_eval_dot_recall@10": 0.9581839904420549,
"eval_info_retr_eval_dot_recall@3": 0.9273963790092823,
"eval_info_retr_eval_dot_recall@5": 0.9409061667126183,
"eval_loss": 0.3979346752166748,
"eval_para_mine_eval_average_precision": 0.5429228832902425,
"eval_para_mine_eval_f1": 0.6632612084554468,
"eval_para_mine_eval_precision": 0.7405866363656618,
"eval_para_mine_eval_recall": 0.60055647649203,
"eval_para_mine_eval_threshold": 0.8737862706184387,
"eval_runtime": 47.0589,
"eval_samples_per_second": 231.221,
"eval_sequential_score": 0.9088995825285359,
"eval_steps_per_second": 1.827,
"step": 620
},
{
"epoch": 1.004418262150221,
"grad_norm": 2.313579559326172,
"learning_rate": 3.502839442436758e-05,
"loss": 0.4278,
"step": 682
},
{
"epoch": 1.004418262150221,
"eval_info_retr_eval_dot_accuracy@1": 0.886039886039886,
"eval_info_retr_eval_dot_accuracy@10": 0.9605734767025089,
"eval_info_retr_eval_dot_accuracy@3": 0.9296939619520265,
"eval_info_retr_eval_dot_accuracy@5": 0.9435713629262016,
"eval_info_retr_eval_dot_map@100": 0.912725086164855,
"eval_info_retr_eval_dot_mrr@10": 0.9111236201738,
"eval_info_retr_eval_dot_ndcg@10": 0.9230849032296308,
"eval_info_retr_eval_dot_precision@1": 0.886039886039886,
"eval_info_retr_eval_dot_precision@10": 0.0960573476702509,
"eval_info_retr_eval_dot_precision@3": 0.30989798731734214,
"eval_info_retr_eval_dot_precision@5": 0.18871427258524037,
"eval_info_retr_eval_dot_recall@1": 0.886039886039886,
"eval_info_retr_eval_dot_recall@10": 0.9605734767025089,
"eval_info_retr_eval_dot_recall@3": 0.9296939619520265,
"eval_info_retr_eval_dot_recall@5": 0.9435713629262016,
"eval_loss": 0.4062098264694214,
"eval_para_mine_eval_average_precision": 0.5569159802538414,
"eval_para_mine_eval_f1": 0.6778007972895148,
"eval_para_mine_eval_precision": 0.7563934207304859,
"eval_para_mine_eval_recall": 0.6140031527645409,
"eval_para_mine_eval_threshold": 0.8800513744354248,
"eval_runtime": 47.9405,
"eval_samples_per_second": 226.969,
"eval_sequential_score": 0.912725086164855,
"eval_steps_per_second": 1.794,
"step": 682
},
{
"epoch": 1.0559646539027983,
"grad_norm": 3.6702966690063477,
"learning_rate": 3.342798141455859e-05,
"loss": 0.337,
"step": 744
},
{
"epoch": 1.0559646539027983,
"eval_info_retr_eval_dot_accuracy@1": 0.8869589192169838,
"eval_info_retr_eval_dot_accuracy@10": 0.9636981895046411,
"eval_info_retr_eval_dot_accuracy@3": 0.9324510614833196,
"eval_info_retr_eval_dot_accuracy@5": 0.9460527525043654,
"eval_info_retr_eval_dot_map@100": 0.9139823556373721,
"eval_info_retr_eval_dot_mrr@10": 0.9125556343298289,
"eval_info_retr_eval_dot_ndcg@10": 0.924918869014723,
"eval_info_retr_eval_dot_precision@1": 0.8869589192169838,
"eval_info_retr_eval_dot_precision@10": 0.09636981895046412,
"eval_info_retr_eval_dot_precision@3": 0.31081702049443977,
"eval_info_retr_eval_dot_precision@5": 0.1892105505008731,
"eval_info_retr_eval_dot_recall@1": 0.8869589192169838,
"eval_info_retr_eval_dot_recall@10": 0.9636981895046411,
"eval_info_retr_eval_dot_recall@3": 0.9324510614833196,
"eval_info_retr_eval_dot_recall@5": 0.9460527525043654,
"eval_loss": 0.4025246500968933,
"eval_para_mine_eval_average_precision": 0.5442347943347751,
"eval_para_mine_eval_f1": 0.6641819581357237,
"eval_para_mine_eval_precision": 0.7375383953633291,
"eval_para_mine_eval_recall": 0.604097690532221,
"eval_para_mine_eval_threshold": 0.8758298754692078,
"eval_runtime": 47.2224,
"eval_samples_per_second": 230.42,
"eval_sequential_score": 0.9139823556373721,
"eval_steps_per_second": 1.821,
"step": 744
},
{
"epoch": 1.1472754050073637,
"grad_norm": 3.720041036605835,
"learning_rate": 3.182756840474961e-05,
"loss": 0.3788,
"step": 806
},
{
"epoch": 1.1472754050073637,
"eval_info_retr_eval_dot_accuracy@1": 0.882455656649205,
"eval_info_retr_eval_dot_accuracy@10": 0.9624115430567044,
"eval_info_retr_eval_dot_accuracy@3": 0.9284073155040897,
"eval_info_retr_eval_dot_accuracy@5": 0.9443984927855895,
"eval_info_retr_eval_dot_map@100": 0.9105324753022828,
"eval_info_retr_eval_dot_mrr@10": 0.9090466051935585,
"eval_info_retr_eval_dot_ndcg@10": 0.9219529245233927,
"eval_info_retr_eval_dot_precision@1": 0.882455656649205,
"eval_info_retr_eval_dot_precision@10": 0.09624115430567044,
"eval_info_retr_eval_dot_precision@3": 0.3094691051680299,
"eval_info_retr_eval_dot_precision@5": 0.18887969855711795,
"eval_info_retr_eval_dot_recall@1": 0.882455656649205,
"eval_info_retr_eval_dot_recall@10": 0.9624115430567044,
"eval_info_retr_eval_dot_recall@3": 0.9284073155040897,
"eval_info_retr_eval_dot_recall@5": 0.9443984927855895,
"eval_loss": 0.38206225633621216,
"eval_para_mine_eval_average_precision": 0.5650597252874483,
"eval_para_mine_eval_f1": 0.684371051800379,
"eval_para_mine_eval_precision": 0.7542356748524652,
"eval_para_mine_eval_recall": 0.6263522333587783,
"eval_para_mine_eval_threshold": 0.8642670810222626,
"eval_runtime": 47.1588,
"eval_samples_per_second": 230.731,
"eval_sequential_score": 0.9105324753022828,
"eval_steps_per_second": 1.824,
"step": 806
},
{
"epoch": 1.2385861561119293,
"grad_norm": 2.3984501361846924,
"learning_rate": 3.0227155394940632e-05,
"loss": 0.2921,
"step": 868
},
{
"epoch": 1.2385861561119293,
"eval_info_retr_eval_dot_accuracy@1": 0.8853046594982079,
"eval_info_retr_eval_dot_accuracy@10": 0.9623196397389946,
"eval_info_retr_eval_dot_accuracy@3": 0.9301534785405753,
"eval_info_retr_eval_dot_accuracy@5": 0.9438470728793309,
"eval_info_retr_eval_dot_map@100": 0.9123716441222456,
"eval_info_retr_eval_dot_mrr@10": 0.9109295291194935,
"eval_info_retr_eval_dot_ndcg@10": 0.9233517208473251,
"eval_info_retr_eval_dot_precision@1": 0.8853046594982079,
"eval_info_retr_eval_dot_precision@10": 0.09623196397389946,
"eval_info_retr_eval_dot_precision@3": 0.3100511595135251,
"eval_info_retr_eval_dot_precision@5": 0.18876941457586618,
"eval_info_retr_eval_dot_recall@1": 0.8853046594982079,
"eval_info_retr_eval_dot_recall@10": 0.9623196397389946,
"eval_info_retr_eval_dot_recall@3": 0.9301534785405753,
"eval_info_retr_eval_dot_recall@5": 0.9438470728793309,
"eval_loss": 0.38938164710998535,
"eval_para_mine_eval_average_precision": 0.562639634596526,
"eval_para_mine_eval_f1": 0.6812942943315669,
"eval_para_mine_eval_precision": 0.756277142164319,
"eval_para_mine_eval_recall": 0.6198389289634271,
"eval_para_mine_eval_threshold": 0.8650586903095245,
"eval_runtime": 47.164,
"eval_samples_per_second": 230.706,
"eval_sequential_score": 0.9123716441222456,
"eval_steps_per_second": 1.823,
"step": 868
},
{
"epoch": 1.3298969072164948,
"grad_norm": 2.1422321796417236,
"learning_rate": 2.862674238513165e-05,
"loss": 0.2719,
"step": 930
},
{
"epoch": 1.3298969072164948,
"eval_info_retr_eval_dot_accuracy@1": 0.8885212756180498,
"eval_info_retr_eval_dot_accuracy@10": 0.9656281591765463,
"eval_info_retr_eval_dot_accuracy@3": 0.9345648377906443,
"eval_info_retr_eval_dot_accuracy@5": 0.9500045951658855,
"eval_info_retr_eval_dot_map@100": 0.9159948831907755,
"eval_info_retr_eval_dot_mrr@10": 0.9146445748596291,
"eval_info_retr_eval_dot_ndcg@10": 0.9270088047632189,
"eval_info_retr_eval_dot_precision@1": 0.8885212756180498,
"eval_info_retr_eval_dot_precision@10": 0.09656281591765466,
"eval_info_retr_eval_dot_precision@3": 0.3115216125968814,
"eval_info_retr_eval_dot_precision@5": 0.19000091903317715,
"eval_info_retr_eval_dot_recall@1": 0.8885212756180498,
"eval_info_retr_eval_dot_recall@10": 0.9656281591765463,
"eval_info_retr_eval_dot_recall@3": 0.9345648377906443,
"eval_info_retr_eval_dot_recall@5": 0.9500045951658855,
"eval_loss": 0.3813144862651825,
"eval_para_mine_eval_average_precision": 0.5562771586743412,
"eval_para_mine_eval_f1": 0.6790739258140527,
"eval_para_mine_eval_precision": 0.7701738104240424,
"eval_para_mine_eval_recall": 0.6072459382184622,
"eval_para_mine_eval_threshold": 0.8749864101409912,
"eval_runtime": 46.8836,
"eval_samples_per_second": 232.085,
"eval_sequential_score": 0.9159948831907755,
"eval_steps_per_second": 1.834,
"step": 930
},
{
"epoch": 1.4212076583210604,
"grad_norm": 2.2384369373321533,
"learning_rate": 2.702632937532267e-05,
"loss": 0.2713,
"step": 992
},
{
"epoch": 1.4212076583210604,
"eval_info_retr_eval_dot_accuracy@1": 0.889256502159728,
"eval_info_retr_eval_dot_accuracy@10": 0.9640658027754802,
"eval_info_retr_eval_dot_accuracy@3": 0.9335539012958368,
"eval_info_retr_eval_dot_accuracy@5": 0.9473393989523021,
"eval_info_retr_eval_dot_map@100": 0.9160609261046996,
"eval_info_retr_eval_dot_mrr@10": 0.9146857125351749,
"eval_info_retr_eval_dot_ndcg@10": 0.9266566721638121,
"eval_info_retr_eval_dot_precision@1": 0.889256502159728,
"eval_info_retr_eval_dot_precision@10": 0.09640658027754802,
"eval_info_retr_eval_dot_precision@3": 0.3111846337652789,
"eval_info_retr_eval_dot_precision@5": 0.18946787979046048,
"eval_info_retr_eval_dot_recall@1": 0.889256502159728,
"eval_info_retr_eval_dot_recall@10": 0.9640658027754802,
"eval_info_retr_eval_dot_recall@3": 0.9335539012958368,
"eval_info_retr_eval_dot_recall@5": 0.9473393989523021,
"eval_loss": 0.379529744386673,
"eval_para_mine_eval_average_precision": 0.5652640358968563,
"eval_para_mine_eval_f1": 0.6830371726971242,
"eval_para_mine_eval_precision": 0.7554402272988553,
"eval_para_mine_eval_recall": 0.6232988396200422,
"eval_para_mine_eval_threshold": 0.8636217713356018,
"eval_runtime": 47.0681,
"eval_samples_per_second": 231.176,
"eval_sequential_score": 0.9160609261046996,
"eval_steps_per_second": 1.827,
"step": 992
},
{
"epoch": 1.5125184094256259,
"grad_norm": 1.37623131275177,
"learning_rate": 2.542591636551368e-05,
"loss": 0.2498,
"step": 1054
},
{
"epoch": 1.5125184094256259,
"eval_info_retr_eval_dot_accuracy@1": 0.8875103391232424,
"eval_info_retr_eval_dot_accuracy@10": 0.9651686425879974,
"eval_info_retr_eval_dot_accuracy@3": 0.9322672548479,
"eval_info_retr_eval_dot_accuracy@5": 0.9468798823637533,
"eval_info_retr_eval_dot_map@100": 0.9147389573171367,
"eval_info_retr_eval_dot_mrr@10": 0.9134388179191052,
"eval_info_retr_eval_dot_ndcg@10": 0.9259428646968195,
"eval_info_retr_eval_dot_precision@1": 0.8875103391232424,
"eval_info_retr_eval_dot_precision@10": 0.09651686425879975,
"eval_info_retr_eval_dot_precision@3": 0.31075575161596664,
"eval_info_retr_eval_dot_precision@5": 0.1893759764727507,
"eval_info_retr_eval_dot_recall@1": 0.8875103391232424,
"eval_info_retr_eval_dot_recall@10": 0.9651686425879974,
"eval_info_retr_eval_dot_recall@3": 0.9322672548479,
"eval_info_retr_eval_dot_recall@5": 0.9468798823637533,
"eval_loss": 0.3791400194168091,
"eval_para_mine_eval_average_precision": 0.5531609578399229,
"eval_para_mine_eval_f1": 0.6710056459938674,
"eval_para_mine_eval_precision": 0.7802172142925567,
"eval_para_mine_eval_recall": 0.5886139128156717,
"eval_para_mine_eval_threshold": 0.8832797706127167,
"eval_runtime": 46.8924,
"eval_samples_per_second": 232.042,
"eval_sequential_score": 0.9147389573171367,
"eval_steps_per_second": 1.834,
"step": 1054
},
{
"epoch": 1.6038291605301915,
"grad_norm": 3.7942512035369873,
"learning_rate": 2.38255033557047e-05,
"loss": 0.2785,
"step": 1116
},
{
"epoch": 1.6038291605301915,
"eval_info_retr_eval_dot_accuracy@1": 0.8900836320191159,
"eval_info_retr_eval_dot_accuracy@10": 0.9648929326348681,
"eval_info_retr_eval_dot_accuracy@3": 0.9332781913427075,
"eval_info_retr_eval_dot_accuracy@5": 0.9466960757283338,
"eval_info_retr_eval_dot_map@100": 0.9161105864746074,
"eval_info_retr_eval_dot_mrr@10": 0.9147435168044494,
"eval_info_retr_eval_dot_ndcg@10": 0.9268526071520827,
"eval_info_retr_eval_dot_precision@1": 0.8900836320191159,
"eval_info_retr_eval_dot_precision@10": 0.09648929326348682,
"eval_info_retr_eval_dot_precision@3": 0.31109273044756913,
"eval_info_retr_eval_dot_precision@5": 0.1893392151456668,
"eval_info_retr_eval_dot_recall@1": 0.8900836320191159,
"eval_info_retr_eval_dot_recall@10": 0.9648929326348681,
"eval_info_retr_eval_dot_recall@3": 0.9332781913427075,
"eval_info_retr_eval_dot_recall@5": 0.9466960757283338,
"eval_loss": 0.3756929337978363,
"eval_para_mine_eval_average_precision": 0.5534577957590571,
"eval_para_mine_eval_f1": 0.6721510117453017,
"eval_para_mine_eval_precision": 0.763900548546983,
"eval_para_mine_eval_recall": 0.6000776898998613,
"eval_para_mine_eval_threshold": 0.8725496828556061,
"eval_runtime": 47.1739,
"eval_samples_per_second": 230.657,
"eval_sequential_score": 0.9161105864746074,
"eval_steps_per_second": 1.823,
"step": 1116
},
{
"epoch": 1.695139911634757,
"grad_norm": 2.6778645515441895,
"learning_rate": 2.2225090345895717e-05,
"loss": 0.2428,
"step": 1178
},
{
"epoch": 1.695139911634757,
"eval_info_retr_eval_dot_accuracy@1": 0.8910945685139233,
"eval_info_retr_eval_dot_accuracy@10": 0.9671905155776124,
"eval_info_retr_eval_dot_accuracy@3": 0.9344729344729344,
"eval_info_retr_eval_dot_accuracy@5": 0.9494531752596269,
"eval_info_retr_eval_dot_map@100": 0.9174675014460509,
"eval_info_retr_eval_dot_mrr@10": 0.916212365226703,
"eval_info_retr_eval_dot_ndcg@10": 0.9285204933191614,
"eval_info_retr_eval_dot_precision@1": 0.8910945685139233,
"eval_info_retr_eval_dot_precision@10": 0.09671905155776124,
"eval_info_retr_eval_dot_precision@3": 0.3114909781576448,
"eval_info_retr_eval_dot_precision@5": 0.1898906350519254,
"eval_info_retr_eval_dot_recall@1": 0.8910945685139233,
"eval_info_retr_eval_dot_recall@10": 0.9671905155776124,
"eval_info_retr_eval_dot_recall@3": 0.9344729344729344,
"eval_info_retr_eval_dot_recall@5": 0.9494531752596269,
"eval_loss": 0.36561650037765503,
"eval_para_mine_eval_average_precision": 0.5544895514233957,
"eval_para_mine_eval_f1": 0.6734225611719457,
"eval_para_mine_eval_precision": 0.7675405136740874,
"eval_para_mine_eval_recall": 0.5998653977316356,
"eval_para_mine_eval_threshold": 0.8776430785655975,
"eval_runtime": 47.0859,
"eval_samples_per_second": 231.088,
"eval_sequential_score": 0.9174675014460509,
"eval_steps_per_second": 1.826,
"step": 1178
},
{
"epoch": 1.7864506627393224,
"grad_norm": 3.110546112060547,
"learning_rate": 2.0624677336086735e-05,
"loss": 0.2935,
"step": 1240
},
{
"epoch": 1.7864506627393224,
"eval_info_retr_eval_dot_accuracy@1": 0.8924731182795699,
"eval_info_retr_eval_dot_accuracy@10": 0.9664552890359343,
"eval_info_retr_eval_dot_accuracy@3": 0.9348405477437736,
"eval_info_retr_eval_dot_accuracy@5": 0.9497288852127562,
"eval_info_retr_eval_dot_map@100": 0.9183095474671825,
"eval_info_retr_eval_dot_mrr@10": 0.9169947469230629,
"eval_info_retr_eval_dot_ndcg@10": 0.9289448948774749,
"eval_info_retr_eval_dot_precision@1": 0.8924731182795699,
"eval_info_retr_eval_dot_precision@10": 0.09664552890359342,
"eval_info_retr_eval_dot_precision@3": 0.31161351591459113,
"eval_info_retr_eval_dot_precision@5": 0.18994577704255125,
"eval_info_retr_eval_dot_recall@1": 0.8924731182795699,
"eval_info_retr_eval_dot_recall@10": 0.9664552890359343,
"eval_info_retr_eval_dot_recall@3": 0.9348405477437736,
"eval_info_retr_eval_dot_recall@5": 0.9497288852127562,
"eval_loss": 0.36679840087890625,
"eval_para_mine_eval_average_precision": 0.5492627712847419,
"eval_para_mine_eval_f1": 0.6682617615424452,
"eval_para_mine_eval_precision": 0.7445174891126459,
"eval_para_mine_eval_recall": 0.6061754436680473,
"eval_para_mine_eval_threshold": 0.8671578168869019,
"eval_runtime": 47.2606,
"eval_samples_per_second": 230.234,
"eval_sequential_score": 0.9183095474671825,
"eval_steps_per_second": 1.82,
"step": 1240
},
{
"epoch": 1.877761413843888,
"grad_norm": 4.477660655975342,
"learning_rate": 1.902426432627775e-05,
"loss": 0.2823,
"step": 1302
},
{
"epoch": 1.877761413843888,
"eval_info_retr_eval_dot_accuracy@1": 0.8939435713629262,
"eval_info_retr_eval_dot_accuracy@10": 0.9648010293171584,
"eval_info_retr_eval_dot_accuracy@3": 0.9359433875562908,
"eval_info_retr_eval_dot_accuracy@5": 0.9485341420825292,
"eval_info_retr_eval_dot_map@100": 0.9191298943799292,
"eval_info_retr_eval_dot_mrr@10": 0.9177682665137863,
"eval_info_retr_eval_dot_ndcg@10": 0.9291509217029374,
"eval_info_retr_eval_dot_precision@1": 0.8939435713629262,
"eval_info_retr_eval_dot_precision@10": 0.09648010293171583,
"eval_info_retr_eval_dot_precision@3": 0.3119811291854302,
"eval_info_retr_eval_dot_precision@5": 0.18970682841650582,
"eval_info_retr_eval_dot_recall@1": 0.8939435713629262,
"eval_info_retr_eval_dot_recall@10": 0.9648010293171584,
"eval_info_retr_eval_dot_recall@3": 0.9359433875562908,
"eval_info_retr_eval_dot_recall@5": 0.9485341420825292,
"eval_loss": 0.3716655969619751,
"eval_para_mine_eval_average_precision": 0.557578455456071,
"eval_para_mine_eval_f1": 0.6753797157651423,
"eval_para_mine_eval_precision": 0.7440590076966561,
"eval_para_mine_eval_recall": 0.6183077152394159,
"eval_para_mine_eval_threshold": 0.863526463508606,
"eval_runtime": 46.6942,
"eval_samples_per_second": 233.027,
"eval_sequential_score": 0.9191298943799292,
"eval_steps_per_second": 1.842,
"step": 1302
},
{
"epoch": 1.9690721649484537,
"grad_norm": 4.546482563018799,
"learning_rate": 1.742385131646877e-05,
"loss": 0.2938,
"step": 1364
},
{
"epoch": 1.9690721649484537,
"eval_info_retr_eval_dot_accuracy@1": 0.8946787979046044,
"eval_info_retr_eval_dot_accuracy@10": 0.9646172226817388,
"eval_info_retr_eval_dot_accuracy@3": 0.9373219373219374,
"eval_info_retr_eval_dot_accuracy@5": 0.9487179487179487,
"eval_info_retr_eval_dot_map@100": 0.9200289882479742,
"eval_info_retr_eval_dot_mrr@10": 0.9186748635673371,
"eval_info_retr_eval_dot_ndcg@10": 0.9298216358313898,
"eval_info_retr_eval_dot_precision@1": 0.8946787979046044,
"eval_info_retr_eval_dot_precision@10": 0.09646172226817387,
"eval_info_retr_eval_dot_precision@3": 0.31244064577397906,
"eval_info_retr_eval_dot_precision@5": 0.18974358974358976,
"eval_info_retr_eval_dot_recall@1": 0.8946787979046044,
"eval_info_retr_eval_dot_recall@10": 0.9646172226817388,
"eval_info_retr_eval_dot_recall@3": 0.9373219373219374,
"eval_info_retr_eval_dot_recall@5": 0.9487179487179487,
"eval_loss": 0.3621634840965271,
"eval_para_mine_eval_average_precision": 0.5594570173517496,
"eval_para_mine_eval_f1": 0.6766163284568192,
"eval_para_mine_eval_precision": 0.7421746515327168,
"eval_para_mine_eval_recall": 0.6216998730763845,
"eval_para_mine_eval_threshold": 0.8676250278949738,
"eval_runtime": 47.3006,
"eval_samples_per_second": 230.039,
"eval_sequential_score": 0.9200289882479742,
"eval_steps_per_second": 1.818,
"step": 1364
},
{
"epoch": 2.020618556701031,
"grad_norm": 3.241508722305298,
"learning_rate": 1.5823438306659787e-05,
"loss": 0.216,
"step": 1426
},
{
"epoch": 2.020618556701031,
"eval_info_retr_eval_dot_accuracy@1": 0.893208344821248,
"eval_info_retr_eval_dot_accuracy@10": 0.9661795790828049,
"eval_info_retr_eval_dot_accuracy@3": 0.9362190975094201,
"eval_info_retr_eval_dot_accuracy@5": 0.9500964984835952,
"eval_info_retr_eval_dot_map@100": 0.9191773519681701,
"eval_info_retr_eval_dot_mrr@10": 0.9178556476047521,
"eval_info_retr_eval_dot_ndcg@10": 0.9295559143323862,
"eval_info_retr_eval_dot_precision@1": 0.893208344821248,
"eval_info_retr_eval_dot_precision@10": 0.09661795790828051,
"eval_info_retr_eval_dot_precision@3": 0.31207303250314,
"eval_info_retr_eval_dot_precision@5": 0.19001929969671905,
"eval_info_retr_eval_dot_recall@1": 0.893208344821248,
"eval_info_retr_eval_dot_recall@10": 0.9661795790828049,
"eval_info_retr_eval_dot_recall@3": 0.9362190975094201,
"eval_info_retr_eval_dot_recall@5": 0.9500964984835952,
"eval_loss": 0.3684485852718353,
"eval_para_mine_eval_average_precision": 0.5665176151429165,
"eval_para_mine_eval_f1": 0.6839674754190774,
"eval_para_mine_eval_precision": 0.7722483633387889,
"eval_para_mine_eval_recall": 0.6137998943056013,
"eval_para_mine_eval_threshold": 0.886872798204422,
"eval_runtime": 47.5509,
"eval_samples_per_second": 228.829,
"eval_sequential_score": 0.9191773519681701,
"eval_steps_per_second": 1.809,
"step": 1426
},
{
"epoch": 2.1119293078055965,
"grad_norm": 2.4362664222717285,
"learning_rate": 1.42230252968508e-05,
"loss": 0.2363,
"step": 1488
},
{
"epoch": 2.1119293078055965,
"eval_info_retr_eval_dot_accuracy@1": 0.8943111846337652,
"eval_info_retr_eval_dot_accuracy@10": 0.9664552890359343,
"eval_info_retr_eval_dot_accuracy@3": 0.9374138406396471,
"eval_info_retr_eval_dot_accuracy@5": 0.9490855619887878,
"eval_info_retr_eval_dot_map@100": 0.9197752678474642,
"eval_info_retr_eval_dot_mrr@10": 0.9185011954725225,
"eval_info_retr_eval_dot_ndcg@10": 0.9300922809925127,
"eval_info_retr_eval_dot_precision@1": 0.8943111846337652,
"eval_info_retr_eval_dot_precision@10": 0.09664552890359342,
"eval_info_retr_eval_dot_precision@3": 0.31247128021321563,
"eval_info_retr_eval_dot_precision@5": 0.18981711239775756,
"eval_info_retr_eval_dot_recall@1": 0.8943111846337652,
"eval_info_retr_eval_dot_recall@10": 0.9664552890359343,
"eval_info_retr_eval_dot_recall@3": 0.9374138406396471,
"eval_info_retr_eval_dot_recall@5": 0.9490855619887878,
"eval_loss": 0.36409991979599,
"eval_para_mine_eval_average_precision": 0.5680857985845322,
"eval_para_mine_eval_f1": 0.6845767174265878,
"eval_para_mine_eval_precision": 0.7527188630602916,
"eval_para_mine_eval_recall": 0.6277479414434964,
"eval_para_mine_eval_threshold": 0.874737024307251,
"eval_runtime": 46.8373,
"eval_samples_per_second": 232.315,
"eval_sequential_score": 0.9197752678474642,
"eval_steps_per_second": 1.836,
"step": 1488
},
{
"epoch": 2.203240058910162,
"grad_norm": 1.0034995079040527,
"learning_rate": 1.2622612287041818e-05,
"loss": 0.2336,
"step": 1550
},
{
"epoch": 2.203240058910162,
"eval_info_retr_eval_dot_accuracy@1": 0.8936678614097969,
"eval_info_retr_eval_dot_accuracy@10": 0.9655362558588365,
"eval_info_retr_eval_dot_accuracy@3": 0.9360352908740005,
"eval_info_retr_eval_dot_accuracy@5": 0.9495450785773366,
"eval_info_retr_eval_dot_map@100": 0.9191474148366734,
"eval_info_retr_eval_dot_mrr@10": 0.9178338388015818,
"eval_info_retr_eval_dot_ndcg@10": 0.9293775519635007,
"eval_info_retr_eval_dot_precision@1": 0.8936678614097969,
"eval_info_retr_eval_dot_precision@10": 0.09655362558588364,
"eval_info_retr_eval_dot_precision@3": 0.31201176362466687,
"eval_info_retr_eval_dot_precision@5": 0.18990901571546734,
"eval_info_retr_eval_dot_recall@1": 0.8936678614097969,
"eval_info_retr_eval_dot_recall@10": 0.9655362558588365,
"eval_info_retr_eval_dot_recall@3": 0.9360352908740005,
"eval_info_retr_eval_dot_recall@5": 0.9495450785773366,
"eval_loss": 0.3632822632789612,
"eval_para_mine_eval_average_precision": 0.5695600017649123,
"eval_para_mine_eval_f1": 0.6885810689948371,
"eval_para_mine_eval_precision": 0.7525360184242944,
"eval_para_mine_eval_recall": 0.6346451784835112,
"eval_para_mine_eval_threshold": 0.8695259690284729,
"eval_runtime": 46.9973,
"eval_samples_per_second": 231.524,
"eval_sequential_score": 0.9191474148366734,
"eval_steps_per_second": 1.83,
"step": 1550
},
{
"epoch": 2.2945508100147274,
"grad_norm": 1.5235002040863037,
"learning_rate": 1.1022199277232835e-05,
"loss": 0.2065,
"step": 1612
},
{
"epoch": 2.2945508100147274,
"eval_info_retr_eval_dot_accuracy@1": 0.8948626045400239,
"eval_info_retr_eval_dot_accuracy@10": 0.9658119658119658,
"eval_info_retr_eval_dot_accuracy@3": 0.9364029041448396,
"eval_info_retr_eval_dot_accuracy@5": 0.9495450785773366,
"eval_info_retr_eval_dot_map@100": 0.9201749271580272,
"eval_info_retr_eval_dot_mrr@10": 0.9188280722330898,
"eval_info_retr_eval_dot_ndcg@10": 0.9302018390100595,
"eval_info_retr_eval_dot_precision@1": 0.8948626045400239,
"eval_info_retr_eval_dot_precision@10": 0.09658119658119659,
"eval_info_retr_eval_dot_precision@3": 0.3121343013816132,
"eval_info_retr_eval_dot_precision@5": 0.18990901571546734,
"eval_info_retr_eval_dot_recall@1": 0.8948626045400239,
"eval_info_retr_eval_dot_recall@10": 0.9658119658119658,
"eval_info_retr_eval_dot_recall@3": 0.9364029041448396,
"eval_info_retr_eval_dot_recall@5": 0.9495450785773366,
"eval_loss": 0.36156603693962097,
"eval_para_mine_eval_average_precision": 0.5665696229109317,
"eval_para_mine_eval_f1": 0.6860915092192124,
"eval_para_mine_eval_precision": 0.7585999354355094,
"eval_para_mine_eval_recall": 0.6262347951380577,
"eval_para_mine_eval_threshold": 0.8720309436321259,
"eval_runtime": 47.7964,
"eval_samples_per_second": 227.653,
"eval_sequential_score": 0.9201749271580272,
"eval_steps_per_second": 1.799,
"step": 1612
},
{
"epoch": 2.385861561119293,
"grad_norm": 1.445999264717102,
"learning_rate": 9.421786267423851e-06,
"loss": 0.2083,
"step": 1674
},
{
"epoch": 2.385861561119293,
"eval_info_retr_eval_dot_accuracy@1": 0.8960573476702509,
"eval_info_retr_eval_dot_accuracy@10": 0.9659957724473853,
"eval_info_retr_eval_dot_accuracy@3": 0.9373219373219374,
"eval_info_retr_eval_dot_accuracy@5": 0.9503722084367245,
"eval_info_retr_eval_dot_map@100": 0.92104627411852,
"eval_info_retr_eval_dot_mrr@10": 0.9196911975585806,
"eval_info_retr_eval_dot_ndcg@10": 0.9309142349609268,
"eval_info_retr_eval_dot_precision@1": 0.8960573476702509,
"eval_info_retr_eval_dot_precision@10": 0.09659957724473853,
"eval_info_retr_eval_dot_precision@3": 0.3124406457739791,
"eval_info_retr_eval_dot_precision@5": 0.19007444168734494,
"eval_info_retr_eval_dot_recall@1": 0.8960573476702509,
"eval_info_retr_eval_dot_recall@10": 0.9659957724473853,
"eval_info_retr_eval_dot_recall@3": 0.9373219373219374,
"eval_info_retr_eval_dot_recall@5": 0.9503722084367245,
"eval_loss": 0.358325332403183,
"eval_para_mine_eval_average_precision": 0.5714132731149775,
"eval_para_mine_eval_f1": 0.6871263293961211,
"eval_para_mine_eval_precision": 0.7587332430898214,
"eval_para_mine_eval_recall": 0.6278698965188602,
"eval_para_mine_eval_threshold": 0.8729398548603058,
"eval_runtime": 47.2608,
"eval_samples_per_second": 230.233,
"eval_sequential_score": 0.92104627411852,
"eval_steps_per_second": 1.82,
"step": 1674
}
],
"logging_steps": 62,
"max_steps": 2037,
"num_input_tokens_seen": 0,
"num_train_epochs": 3,
"save_steps": 62,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 0.0,
"train_batch_size": 64,
"trial_name": null,
"trial_params": null
}