|
{ |
|
"best_metric": 0.9306620270961232, |
|
"best_model_checkpoint": "models/google-canine-c-typosquat-v3.1-mnrl/checkpoint-868", |
|
"epoch": 1.2385861561119293, |
|
"eval_steps": 62, |
|
"global_step": 868, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.09131075110456553, |
|
"grad_norm": 5.324620723724365, |
|
"learning_rate": 3e-05, |
|
"loss": 1.219, |
|
"step": 62 |
|
}, |
|
{ |
|
"epoch": 0.09131075110456553, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.9574487639003768, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.994026284348865, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9816193364580461, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9881444720154398, |
|
"eval_info_retr_eval_dot_map@100": 0.9710061189570759, |
|
"eval_info_retr_eval_dot_mrr@10": 0.970718399481841, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9764345312554475, |
|
"eval_info_retr_eval_dot_precision@1": 0.9574487639003768, |
|
"eval_info_retr_eval_dot_precision@10": 0.09940262843488651, |
|
"eval_info_retr_eval_dot_precision@3": 0.32720644548601535, |
|
"eval_info_retr_eval_dot_precision@5": 0.197628894403088, |
|
"eval_info_retr_eval_dot_recall@1": 0.9574487639003768, |
|
"eval_info_retr_eval_dot_recall@10": 0.994026284348865, |
|
"eval_info_retr_eval_dot_recall@3": 0.9816193364580461, |
|
"eval_info_retr_eval_dot_recall@5": 0.9881444720154398, |
|
"eval_loss": 0.11100412905216217, |
|
"eval_para_mine_eval_average_precision": 0.7672056895535211, |
|
"eval_para_mine_eval_f1": 0.7847944762520686, |
|
"eval_para_mine_eval_precision": 0.8285314095516364, |
|
"eval_para_mine_eval_recall": 0.7454436228787721, |
|
"eval_para_mine_eval_threshold": 0.7348841428756714, |
|
"eval_runtime": 44.8792, |
|
"eval_samples_per_second": 242.451, |
|
"eval_sequential_score": 0.9710061189570759, |
|
"eval_steps_per_second": 1.916, |
|
"step": 62 |
|
}, |
|
{ |
|
"epoch": 0.18262150220913106, |
|
"grad_norm": 3.005993604660034, |
|
"learning_rate": 4.943211151264843e-05, |
|
"loss": 0.1012, |
|
"step": 124 |
|
}, |
|
{ |
|
"epoch": 0.18262150220913106, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.9798731734215606, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9973348037864167, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9930153478540575, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9957724473853506, |
|
"eval_info_retr_eval_dot_map@100": 0.9868644025653387, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9867332819841785, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.989378667273856, |
|
"eval_info_retr_eval_dot_precision@1": 0.9798731734215606, |
|
"eval_info_retr_eval_dot_precision@10": 0.09973348037864167, |
|
"eval_info_retr_eval_dot_precision@3": 0.33100511595135246, |
|
"eval_info_retr_eval_dot_precision@5": 0.19915448947707012, |
|
"eval_info_retr_eval_dot_recall@1": 0.9798731734215606, |
|
"eval_info_retr_eval_dot_recall@10": 0.9973348037864167, |
|
"eval_info_retr_eval_dot_recall@3": 0.9930153478540575, |
|
"eval_info_retr_eval_dot_recall@5": 0.9957724473853506, |
|
"eval_loss": 0.04060104861855507, |
|
"eval_para_mine_eval_average_precision": 0.8585605463078829, |
|
"eval_para_mine_eval_f1": 0.8537043823665016, |
|
"eval_para_mine_eval_precision": 0.8957241803604032, |
|
"eval_para_mine_eval_recall": 0.8154503529921904, |
|
"eval_para_mine_eval_threshold": 0.6834436357021332, |
|
"eval_runtime": 44.147, |
|
"eval_samples_per_second": 246.472, |
|
"eval_sequential_score": 0.9868644025653387, |
|
"eval_steps_per_second": 1.948, |
|
"step": 124 |
|
}, |
|
{ |
|
"epoch": 0.27393225331369664, |
|
"grad_norm": 0.6856785416603088, |
|
"learning_rate": 4.783169850283944e-05, |
|
"loss": 0.0693, |
|
"step": 186 |
|
}, |
|
{ |
|
"epoch": 0.27393225331369664, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.9855711791195663, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9988971601874828, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9959562540207701, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9977943203749655, |
|
"eval_info_retr_eval_dot_map@100": 0.9910708474937577, |
|
"eval_info_retr_eval_dot_mrr@10": 0.991004780431304, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9929831934334958, |
|
"eval_info_retr_eval_dot_precision@1": 0.9855711791195663, |
|
"eval_info_retr_eval_dot_precision@10": 0.09988971601874828, |
|
"eval_info_retr_eval_dot_precision@3": 0.3319854180069234, |
|
"eval_info_retr_eval_dot_precision@5": 0.19955886407499313, |
|
"eval_info_retr_eval_dot_recall@1": 0.9855711791195663, |
|
"eval_info_retr_eval_dot_recall@10": 0.9988971601874828, |
|
"eval_info_retr_eval_dot_recall@3": 0.9959562540207701, |
|
"eval_info_retr_eval_dot_recall@5": 0.9977943203749655, |
|
"eval_loss": 0.024971680715680122, |
|
"eval_para_mine_eval_average_precision": 0.8878504879371486, |
|
"eval_para_mine_eval_f1": 0.8765703942488466, |
|
"eval_para_mine_eval_precision": 0.9063191861895322, |
|
"eval_para_mine_eval_recall": 0.8487124705839841, |
|
"eval_para_mine_eval_threshold": 0.6699230670928955, |
|
"eval_runtime": 44.4383, |
|
"eval_samples_per_second": 244.856, |
|
"eval_sequential_score": 0.9910708474937577, |
|
"eval_steps_per_second": 1.935, |
|
"step": 186 |
|
}, |
|
{ |
|
"epoch": 0.36524300441826213, |
|
"grad_norm": 0.5819792747497559, |
|
"learning_rate": 4.623128549303046e-05, |
|
"loss": 0.0424, |
|
"step": 248 |
|
}, |
|
{ |
|
"epoch": 0.36524300441826213, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.9887877952394082, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9994485800937414, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9978862236926753, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9986214502343534, |
|
"eval_info_retr_eval_dot_map@100": 0.9933887693878125, |
|
"eval_info_retr_eval_dot_mrr@10": 0.993345798632537, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.994887605721736, |
|
"eval_info_retr_eval_dot_precision@1": 0.9887877952394082, |
|
"eval_info_retr_eval_dot_precision@10": 0.09994485800937414, |
|
"eval_info_retr_eval_dot_precision@3": 0.33262874123089176, |
|
"eval_info_retr_eval_dot_precision@5": 0.19972429004687073, |
|
"eval_info_retr_eval_dot_recall@1": 0.9887877952394082, |
|
"eval_info_retr_eval_dot_recall@10": 0.9994485800937414, |
|
"eval_info_retr_eval_dot_recall@3": 0.9978862236926753, |
|
"eval_info_retr_eval_dot_recall@5": 0.9986214502343534, |
|
"eval_loss": 0.01834421418607235, |
|
"eval_para_mine_eval_average_precision": 0.8919509440660052, |
|
"eval_para_mine_eval_f1": 0.8783150608010457, |
|
"eval_para_mine_eval_precision": 0.8953218322315484, |
|
"eval_para_mine_eval_recall": 0.8619423378336262, |
|
"eval_para_mine_eval_threshold": 0.6646433770656586, |
|
"eval_runtime": 44.2865, |
|
"eval_samples_per_second": 245.696, |
|
"eval_sequential_score": 0.9933887693878125, |
|
"eval_steps_per_second": 1.942, |
|
"step": 248 |
|
}, |
|
{ |
|
"epoch": 0.4565537555228277, |
|
"grad_norm": 0.2500639259815216, |
|
"learning_rate": 4.463087248322148e-05, |
|
"loss": 0.0382, |
|
"step": 310 |
|
}, |
|
{ |
|
"epoch": 0.4565537555228277, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.9904420549581839, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9998161933645805, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9982538369635143, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.998805256869773, |
|
"eval_info_retr_eval_dot_map@100": 0.9944206662844655, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9944099442307328, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9957667469329782, |
|
"eval_info_retr_eval_dot_precision@1": 0.9904420549581839, |
|
"eval_info_retr_eval_dot_precision@10": 0.09998161933645805, |
|
"eval_info_retr_eval_dot_precision@3": 0.3327512789878381, |
|
"eval_info_retr_eval_dot_precision@5": 0.19976105137395464, |
|
"eval_info_retr_eval_dot_recall@1": 0.9904420549581839, |
|
"eval_info_retr_eval_dot_recall@10": 0.9998161933645805, |
|
"eval_info_retr_eval_dot_recall@3": 0.9982538369635143, |
|
"eval_info_retr_eval_dot_recall@5": 0.998805256869773, |
|
"eval_loss": 0.01802203245460987, |
|
"eval_para_mine_eval_average_precision": 0.8868720697863423, |
|
"eval_para_mine_eval_f1": 0.8749901834425858, |
|
"eval_para_mine_eval_precision": 0.8953481226571621, |
|
"eval_para_mine_eval_recall": 0.8555374379497094, |
|
"eval_para_mine_eval_threshold": 0.6635497808456421, |
|
"eval_runtime": 44.1381, |
|
"eval_samples_per_second": 246.521, |
|
"eval_sequential_score": 0.9944206662844655, |
|
"eval_steps_per_second": 1.948, |
|
"step": 310 |
|
}, |
|
{ |
|
"epoch": 0.5478645066273933, |
|
"grad_norm": 0.8567762970924377, |
|
"learning_rate": 4.3030459473412496e-05, |
|
"loss": 0.0475, |
|
"step": 372 |
|
}, |
|
{ |
|
"epoch": 0.5478645066273933, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.9909934748644426, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9995404834114512, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9974267071041265, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9978862236926753, |
|
"eval_info_retr_eval_dot_map@100": 0.9943151219822102, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9942822642643431, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9955792346109411, |
|
"eval_info_retr_eval_dot_precision@1": 0.9909934748644426, |
|
"eval_info_retr_eval_dot_precision@10": 0.09995404834114513, |
|
"eval_info_retr_eval_dot_precision@3": 0.33247556903470876, |
|
"eval_info_retr_eval_dot_precision@5": 0.19957724473853508, |
|
"eval_info_retr_eval_dot_recall@1": 0.9909934748644426, |
|
"eval_info_retr_eval_dot_recall@10": 0.9995404834114512, |
|
"eval_info_retr_eval_dot_recall@3": 0.9974267071041265, |
|
"eval_info_retr_eval_dot_recall@5": 0.9978862236926753, |
|
"eval_loss": 0.020289968699216843, |
|
"eval_para_mine_eval_average_precision": 0.9057199011076745, |
|
"eval_para_mine_eval_f1": 0.8932047816062182, |
|
"eval_para_mine_eval_precision": 0.9151715052081852, |
|
"eval_para_mine_eval_recall": 0.8722678675477544, |
|
"eval_para_mine_eval_threshold": 0.6722444593906403, |
|
"eval_runtime": 44.2598, |
|
"eval_samples_per_second": 245.844, |
|
"eval_sequential_score": 0.9943151219822102, |
|
"eval_steps_per_second": 1.943, |
|
"step": 372 |
|
}, |
|
{ |
|
"epoch": 0.6391752577319587, |
|
"grad_norm": 1.4318528175354004, |
|
"learning_rate": 4.1430046463603515e-05, |
|
"loss": 0.0377, |
|
"step": 434 |
|
}, |
|
{ |
|
"epoch": 0.6391752577319587, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.9912691848175719, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9997242900468707, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.998805256869773, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9995404834114512, |
|
"eval_info_retr_eval_dot_map@100": 0.9950291896321672, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9950066958131474, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.996211640167477, |
|
"eval_info_retr_eval_dot_precision@1": 0.9912691848175719, |
|
"eval_info_retr_eval_dot_precision@10": 0.09997242900468709, |
|
"eval_info_retr_eval_dot_precision@3": 0.33293508562325763, |
|
"eval_info_retr_eval_dot_precision@5": 0.1999080966822902, |
|
"eval_info_retr_eval_dot_recall@1": 0.9912691848175719, |
|
"eval_info_retr_eval_dot_recall@10": 0.9997242900468707, |
|
"eval_info_retr_eval_dot_recall@3": 0.998805256869773, |
|
"eval_info_retr_eval_dot_recall@5": 0.9995404834114512, |
|
"eval_loss": 0.015328879468142986, |
|
"eval_para_mine_eval_average_precision": 0.8941081769196199, |
|
"eval_para_mine_eval_f1": 0.8799847506361558, |
|
"eval_para_mine_eval_precision": 0.8951106127502512, |
|
"eval_para_mine_eval_recall": 0.8653615967984535, |
|
"eval_para_mine_eval_threshold": 0.6661731898784637, |
|
"eval_runtime": 44.1048, |
|
"eval_samples_per_second": 246.708, |
|
"eval_sequential_score": 0.9950291896321672, |
|
"eval_steps_per_second": 1.95, |
|
"step": 434 |
|
}, |
|
{ |
|
"epoch": 0.7304860088365243, |
|
"grad_norm": 0.5837889909744263, |
|
"learning_rate": 3.9829633453794526e-05, |
|
"loss": 0.0241, |
|
"step": 496 |
|
}, |
|
{ |
|
"epoch": 0.7304860088365243, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.9905339582758937, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9998161933645805, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9981619336458046, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9993566767760316, |
|
"eval_info_retr_eval_dot_map@100": 0.9944845062676603, |
|
"eval_info_retr_eval_dot_mrr@10": 0.994473656570431, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9958242906817244, |
|
"eval_info_retr_eval_dot_precision@1": 0.9905339582758937, |
|
"eval_info_retr_eval_dot_precision@10": 0.09998161933645805, |
|
"eval_info_retr_eval_dot_precision@3": 0.3327206445486015, |
|
"eval_info_retr_eval_dot_precision@5": 0.19987133535520635, |
|
"eval_info_retr_eval_dot_recall@1": 0.9905339582758937, |
|
"eval_info_retr_eval_dot_recall@10": 0.9998161933645805, |
|
"eval_info_retr_eval_dot_recall@3": 0.9981619336458046, |
|
"eval_info_retr_eval_dot_recall@5": 0.9993566767760316, |
|
"eval_loss": 0.016888538375496864, |
|
"eval_para_mine_eval_average_precision": 0.8920135475248205, |
|
"eval_para_mine_eval_f1": 0.8817566331198535, |
|
"eval_para_mine_eval_precision": 0.8931684329053274, |
|
"eval_para_mine_eval_recall": 0.870632766166952, |
|
"eval_para_mine_eval_threshold": 0.6506930291652679, |
|
"eval_runtime": 43.9952, |
|
"eval_samples_per_second": 247.322, |
|
"eval_sequential_score": 0.9944845062676603, |
|
"eval_steps_per_second": 1.955, |
|
"step": 496 |
|
}, |
|
{ |
|
"epoch": 0.8217967599410898, |
|
"grad_norm": 0.7147839069366455, |
|
"learning_rate": 3.8229220443985544e-05, |
|
"loss": 0.045, |
|
"step": 558 |
|
}, |
|
{ |
|
"epoch": 0.8217967599410898, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.9938424777134455, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9998161933645805, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9986214502343534, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9993566767760316, |
|
"eval_info_retr_eval_dot_map@100": 0.9963993172223115, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9963845891265246, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9972497507624225, |
|
"eval_info_retr_eval_dot_precision@1": 0.9938424777134455, |
|
"eval_info_retr_eval_dot_precision@10": 0.09998161933645805, |
|
"eval_info_retr_eval_dot_precision@3": 0.33287381674478445, |
|
"eval_info_retr_eval_dot_precision@5": 0.19987133535520635, |
|
"eval_info_retr_eval_dot_recall@1": 0.9938424777134455, |
|
"eval_info_retr_eval_dot_recall@10": 0.9998161933645805, |
|
"eval_info_retr_eval_dot_recall@3": 0.9986214502343534, |
|
"eval_info_retr_eval_dot_recall@5": 0.9993566767760316, |
|
"eval_loss": 0.013228075578808784, |
|
"eval_para_mine_eval_average_precision": 0.9111664137442287, |
|
"eval_para_mine_eval_f1": 0.8942790038822603, |
|
"eval_para_mine_eval_precision": 0.9093417624592629, |
|
"eval_para_mine_eval_recall": 0.8797071271449414, |
|
"eval_para_mine_eval_threshold": 0.6545680165290833, |
|
"eval_runtime": 44.1589, |
|
"eval_samples_per_second": 246.405, |
|
"eval_sequential_score": 0.9963993172223115, |
|
"eval_steps_per_second": 1.948, |
|
"step": 558 |
|
}, |
|
{ |
|
"epoch": 0.9131075110456554, |
|
"grad_norm": 1.6569366455078125, |
|
"learning_rate": 3.662880743417656e-05, |
|
"loss": 0.0302, |
|
"step": 620 |
|
}, |
|
{ |
|
"epoch": 0.9131075110456554, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.9913610881352817, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9992647734583219, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9980700303280948, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9987133535520633, |
|
"eval_info_retr_eval_dot_map@100": 0.9947594505678611, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9947092135264177, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9958603290565278, |
|
"eval_info_retr_eval_dot_precision@1": 0.9913610881352817, |
|
"eval_info_retr_eval_dot_precision@10": 0.0999264773458322, |
|
"eval_info_retr_eval_dot_precision@3": 0.33269001010936494, |
|
"eval_info_retr_eval_dot_precision@5": 0.19974267071041266, |
|
"eval_info_retr_eval_dot_recall@1": 0.9913610881352817, |
|
"eval_info_retr_eval_dot_recall@10": 0.9992647734583219, |
|
"eval_info_retr_eval_dot_recall@3": 0.9980700303280948, |
|
"eval_info_retr_eval_dot_recall@5": 0.9987133535520633, |
|
"eval_loss": 0.01584717258810997, |
|
"eval_para_mine_eval_average_precision": 0.9161096169142061, |
|
"eval_para_mine_eval_f1": 0.9015840220385676, |
|
"eval_para_mine_eval_precision": 0.9167067369413698, |
|
"eval_para_mine_eval_recall": 0.886952161992475, |
|
"eval_para_mine_eval_threshold": 0.6570625901222229, |
|
"eval_runtime": 44.3069, |
|
"eval_samples_per_second": 245.583, |
|
"eval_sequential_score": 0.9947594505678611, |
|
"eval_steps_per_second": 1.941, |
|
"step": 620 |
|
}, |
|
{ |
|
"epoch": 1.004418262150221, |
|
"grad_norm": 0.12535937130451202, |
|
"learning_rate": 3.502839442436758e-05, |
|
"loss": 0.0314, |
|
"step": 682 |
|
}, |
|
{ |
|
"epoch": 1.004418262150221, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.9902582483227644, |
|
"eval_info_retr_eval_dot_accuracy@10": 0.9998161933645805, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9983457402812241, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9994485800937414, |
|
"eval_info_retr_eval_dot_map@100": 0.9944195539625648, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9944061513953989, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9957806542116834, |
|
"eval_info_retr_eval_dot_precision@1": 0.9902582483227644, |
|
"eval_info_retr_eval_dot_precision@10": 0.09998161933645805, |
|
"eval_info_retr_eval_dot_precision@3": 0.3327819134270747, |
|
"eval_info_retr_eval_dot_precision@5": 0.19988971601874833, |
|
"eval_info_retr_eval_dot_recall@1": 0.9902582483227644, |
|
"eval_info_retr_eval_dot_recall@10": 0.9998161933645805, |
|
"eval_info_retr_eval_dot_recall@3": 0.9983457402812241, |
|
"eval_info_retr_eval_dot_recall@5": 0.9994485800937414, |
|
"eval_loss": 0.01480414904654026, |
|
"eval_para_mine_eval_average_precision": 0.9018706893922749, |
|
"eval_para_mine_eval_f1": 0.8877219600165349, |
|
"eval_para_mine_eval_precision": 0.8927995468022605, |
|
"eval_para_mine_eval_recall": 0.8827018017733171, |
|
"eval_para_mine_eval_threshold": 0.6474231779575348, |
|
"eval_runtime": 43.8665, |
|
"eval_samples_per_second": 248.048, |
|
"eval_sequential_score": 0.9944195539625648, |
|
"eval_steps_per_second": 1.96, |
|
"step": 682 |
|
}, |
|
{ |
|
"epoch": 1.0559646539027983, |
|
"grad_norm": 0.2109777331352234, |
|
"learning_rate": 3.342798141455859e-05, |
|
"loss": 0.0204, |
|
"step": 744 |
|
}, |
|
{ |
|
"epoch": 1.0559646539027983, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.9939343810311553, |
|
"eval_info_retr_eval_dot_accuracy@10": 1.0, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9992647734583219, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9999080966822902, |
|
"eval_info_retr_eval_dot_map@100": 0.996594216217872, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9965942162178723, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9974631239499567, |
|
"eval_info_retr_eval_dot_precision@1": 0.9939343810311553, |
|
"eval_info_retr_eval_dot_precision@10": 0.10000000000000002, |
|
"eval_info_retr_eval_dot_precision@3": 0.33308825781944057, |
|
"eval_info_retr_eval_dot_precision@5": 0.19998161933645806, |
|
"eval_info_retr_eval_dot_recall@1": 0.9939343810311553, |
|
"eval_info_retr_eval_dot_recall@10": 1.0, |
|
"eval_info_retr_eval_dot_recall@3": 0.9992647734583219, |
|
"eval_info_retr_eval_dot_recall@5": 0.9999080966822902, |
|
"eval_loss": 0.011477422900497913, |
|
"eval_para_mine_eval_average_precision": 0.9183526341973961, |
|
"eval_para_mine_eval_f1": 0.9008710021688987, |
|
"eval_para_mine_eval_precision": 0.9157536675501139, |
|
"eval_para_mine_eval_recall": 0.8864643416910201, |
|
"eval_para_mine_eval_threshold": 0.6480826139450073, |
|
"eval_runtime": 45.0423, |
|
"eval_samples_per_second": 241.573, |
|
"eval_sequential_score": 0.996594216217872, |
|
"eval_steps_per_second": 1.909, |
|
"step": 744 |
|
}, |
|
{ |
|
"epoch": 1.1472754050073637, |
|
"grad_norm": 0.43087926506996155, |
|
"learning_rate": 3.182756840474961e-05, |
|
"loss": 0.0193, |
|
"step": 806 |
|
}, |
|
{ |
|
"epoch": 1.1472754050073637, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.9939343810311553, |
|
"eval_info_retr_eval_dot_accuracy@10": 1.0, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9991728701406121, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9998161933645805, |
|
"eval_info_retr_eval_dot_map@100": 0.996541371810189, |
|
"eval_info_retr_eval_dot_mrr@10": 0.996541371810189, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9974193893555866, |
|
"eval_info_retr_eval_dot_precision@1": 0.9939343810311553, |
|
"eval_info_retr_eval_dot_precision@10": 0.10000000000000002, |
|
"eval_info_retr_eval_dot_precision@3": 0.333057623380204, |
|
"eval_info_retr_eval_dot_precision@5": 0.1999632386729161, |
|
"eval_info_retr_eval_dot_recall@1": 0.9939343810311553, |
|
"eval_info_retr_eval_dot_recall@10": 1.0, |
|
"eval_info_retr_eval_dot_recall@3": 0.9991728701406121, |
|
"eval_info_retr_eval_dot_recall@5": 0.9998161933645805, |
|
"eval_loss": 0.01137059461325407, |
|
"eval_para_mine_eval_average_precision": 0.9152930281344098, |
|
"eval_para_mine_eval_f1": 0.8996903771768937, |
|
"eval_para_mine_eval_precision": 0.9043090584686712, |
|
"eval_para_mine_eval_recall": 0.895118635187201, |
|
"eval_para_mine_eval_threshold": 0.6495572626590729, |
|
"eval_runtime": 43.8875, |
|
"eval_samples_per_second": 247.93, |
|
"eval_sequential_score": 0.996541371810189, |
|
"eval_steps_per_second": 1.96, |
|
"step": 806 |
|
}, |
|
{ |
|
"epoch": 1.2385861561119293, |
|
"grad_norm": 1.3790454864501953, |
|
"learning_rate": 3.0227155394940632e-05, |
|
"loss": 0.0164, |
|
"step": 868 |
|
}, |
|
{ |
|
"epoch": 1.2385861561119293, |
|
"eval_info_retr_eval_dot_accuracy@1": 0.9937505743957357, |
|
"eval_info_retr_eval_dot_accuracy@10": 1.0, |
|
"eval_info_retr_eval_dot_accuracy@3": 0.9990809668229023, |
|
"eval_info_retr_eval_dot_accuracy@5": 0.9999080966822902, |
|
"eval_info_retr_eval_dot_map@100": 0.9964954201513342, |
|
"eval_info_retr_eval_dot_mrr@10": 0.9964954201513342, |
|
"eval_info_retr_eval_dot_ndcg@10": 0.9973903161826975, |
|
"eval_info_retr_eval_dot_precision@1": 0.9937505743957357, |
|
"eval_info_retr_eval_dot_precision@10": 0.10000000000000002, |
|
"eval_info_retr_eval_dot_precision@3": 0.3330269889409674, |
|
"eval_info_retr_eval_dot_precision@5": 0.19998161933645806, |
|
"eval_info_retr_eval_dot_recall@1": 0.9937505743957357, |
|
"eval_info_retr_eval_dot_recall@10": 1.0, |
|
"eval_info_retr_eval_dot_recall@3": 0.9990809668229023, |
|
"eval_info_retr_eval_dot_recall@5": 0.9999080966822902, |
|
"eval_loss": 0.009216207079589367, |
|
"eval_para_mine_eval_average_precision": 0.9306620270961232, |
|
"eval_para_mine_eval_f1": 0.9113359207458677, |
|
"eval_para_mine_eval_precision": 0.9197094729482332, |
|
"eval_para_mine_eval_recall": 0.9031134679054893, |
|
"eval_para_mine_eval_threshold": 0.6408547163009644, |
|
"eval_runtime": 44.7336, |
|
"eval_samples_per_second": 243.24, |
|
"eval_sequential_score": 0.9964954201513342, |
|
"eval_steps_per_second": 1.922, |
|
"step": 868 |
|
} |
|
], |
|
"logging_steps": 62, |
|
"max_steps": 2037, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 3, |
|
"save_steps": 62, |
|
"stateful_callbacks": { |
|
"EarlyStoppingCallback": { |
|
"args": { |
|
"early_stopping_patience": 3, |
|
"early_stopping_threshold": 0.0 |
|
}, |
|
"attributes": { |
|
"early_stopping_patience_counter": 0 |
|
} |
|
}, |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": false |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 0.0, |
|
"train_batch_size": 64, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|