File size: 46,218 Bytes
02137df
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
1001
1002
1003
1004
1005
1006
{
  "best_metric": 0.5714132731149775,
  "best_model_checkpoint": "models/all-minilm-l6-v2-typosquat-v3.1-gist/checkpoint-1674",
  "epoch": 2.385861561119293,
  "eval_steps": 62,
  "global_step": 1674,
  "is_hyper_param_search": false,
  "is_local_process_zero": true,
  "is_world_process_zero": true,
  "log_history": [
    {
      "epoch": 0.09131075110456553,
      "grad_norm": 17.575565338134766,
      "learning_rate": 3e-05,
      "loss": 1.9075,
      "step": 62
    },
    {
      "epoch": 0.09131075110456553,
      "eval_info_retr_eval_dot_accuracy@1": 0.8306221854608952,
      "eval_info_retr_eval_dot_accuracy@10": 0.9250068927488282,
      "eval_info_retr_eval_dot_accuracy@3": 0.8876941457586619,
      "eval_info_retr_eval_dot_accuracy@5": 0.9032258064516129,
      "eval_info_retr_eval_dot_map@100": 0.8651529300165571,
      "eval_info_retr_eval_dot_mrr@10": 0.8627116876220815,
      "eval_info_retr_eval_dot_ndcg@10": 0.8777861364040704,
      "eval_info_retr_eval_dot_precision@1": 0.8306221854608952,
      "eval_info_retr_eval_dot_precision@10": 0.09250068927488282,
      "eval_info_retr_eval_dot_precision@3": 0.2958980485862206,
      "eval_info_retr_eval_dot_precision@5": 0.18064516129032257,
      "eval_info_retr_eval_dot_recall@1": 0.8306221854608952,
      "eval_info_retr_eval_dot_recall@10": 0.9250068927488282,
      "eval_info_retr_eval_dot_recall@3": 0.8876941457586619,
      "eval_info_retr_eval_dot_recall@5": 0.9032258064516129,
      "eval_loss": 0.8926403522491455,
      "eval_para_mine_eval_average_precision": 0.4175368476477107,
      "eval_para_mine_eval_f1": 0.5608786555511446,
      "eval_para_mine_eval_precision": 0.6772723495912615,
      "eval_para_mine_eval_recall": 0.4786239854015258,
      "eval_para_mine_eval_threshold": 0.7514148652553558,
      "eval_runtime": 46.7645,
      "eval_samples_per_second": 232.676,
      "eval_sequential_score": 0.8651529300165571,
      "eval_steps_per_second": 1.839,
      "step": 62
    },
    {
      "epoch": 0.18262150220913106,
      "grad_norm": 6.875263214111328,
      "learning_rate": 4.943211151264843e-05,
      "loss": 0.9074,
      "step": 124
    },
    {
      "epoch": 0.18262150220913106,
      "eval_info_retr_eval_dot_accuracy@1": 0.8424777134454554,
      "eval_info_retr_eval_dot_accuracy@10": 0.9359433875562908,
      "eval_info_retr_eval_dot_accuracy@3": 0.8946787979046044,
      "eval_info_retr_eval_dot_accuracy@5": 0.9126918481757191,
      "eval_info_retr_eval_dot_map@100": 0.8756277031952363,
      "eval_info_retr_eval_dot_mrr@10": 0.873614557485526,
      "eval_info_retr_eval_dot_ndcg@10": 0.8886439257445581,
      "eval_info_retr_eval_dot_precision@1": 0.8424777134454554,
      "eval_info_retr_eval_dot_precision@10": 0.09359433875562909,
      "eval_info_retr_eval_dot_precision@3": 0.2982262659682014,
      "eval_info_retr_eval_dot_precision@5": 0.18253836963514383,
      "eval_info_retr_eval_dot_recall@1": 0.8424777134454554,
      "eval_info_retr_eval_dot_recall@10": 0.9359433875562908,
      "eval_info_retr_eval_dot_recall@3": 0.8946787979046044,
      "eval_info_retr_eval_dot_recall@5": 0.9126918481757191,
      "eval_loss": 0.6083176732063293,
      "eval_para_mine_eval_average_precision": 0.458339002373722,
      "eval_para_mine_eval_f1": 0.5954711973336655,
      "eval_para_mine_eval_precision": 0.6810695759380306,
      "eval_para_mine_eval_recall": 0.5289869146720989,
      "eval_para_mine_eval_threshold": 0.8661167621612549,
      "eval_runtime": 47.222,
      "eval_samples_per_second": 230.422,
      "eval_sequential_score": 0.8756277031952363,
      "eval_steps_per_second": 1.821,
      "step": 124
    },
    {
      "epoch": 0.27393225331369664,
      "grad_norm": 5.694400787353516,
      "learning_rate": 4.783169850283944e-05,
      "loss": 0.6272,
      "step": 186
    },
    {
      "epoch": 0.27393225331369664,
      "eval_info_retr_eval_dot_accuracy@1": 0.8515761418987225,
      "eval_info_retr_eval_dot_accuracy@10": 0.9441227828324602,
      "eval_info_retr_eval_dot_accuracy@3": 0.903961032993291,
      "eval_info_retr_eval_dot_accuracy@5": 0.9217902766289863,
      "eval_info_retr_eval_dot_map@100": 0.8842285240457468,
      "eval_info_retr_eval_dot_mrr@10": 0.8822831920502171,
      "eval_info_retr_eval_dot_ndcg@10": 0.8972070930309096,
      "eval_info_retr_eval_dot_precision@1": 0.8515761418987225,
      "eval_info_retr_eval_dot_precision@10": 0.09441227828324604,
      "eval_info_retr_eval_dot_precision@3": 0.301320344331097,
      "eval_info_retr_eval_dot_precision@5": 0.18435805532579727,
      "eval_info_retr_eval_dot_recall@1": 0.8515761418987225,
      "eval_info_retr_eval_dot_recall@10": 0.9441227828324602,
      "eval_info_retr_eval_dot_recall@3": 0.903961032993291,
      "eval_info_retr_eval_dot_recall@5": 0.9217902766289863,
      "eval_loss": 0.5591671466827393,
      "eval_para_mine_eval_average_precision": 0.4831713388578378,
      "eval_para_mine_eval_f1": 0.6178009413060559,
      "eval_para_mine_eval_precision": 0.7009458839715662,
      "eval_para_mine_eval_recall": 0.5522893677758556,
      "eval_para_mine_eval_threshold": 0.860432505607605,
      "eval_runtime": 46.8519,
      "eval_samples_per_second": 232.242,
      "eval_sequential_score": 0.8842285240457468,
      "eval_steps_per_second": 1.836,
      "step": 186
    },
    {
      "epoch": 0.36524300441826213,
      "grad_norm": 5.078444004058838,
      "learning_rate": 4.623128549303046e-05,
      "loss": 0.5353,
      "step": 248
    },
    {
      "epoch": 0.36524300441826213,
      "eval_info_retr_eval_dot_accuracy@1": 0.8613178935759581,
      "eval_info_retr_eval_dot_accuracy@10": 0.9482584321293999,
      "eval_info_retr_eval_dot_accuracy@3": 0.9126918481757191,
      "eval_info_retr_eval_dot_accuracy@5": 0.9284073155040897,
      "eval_info_retr_eval_dot_map@100": 0.8925029461858842,
      "eval_info_retr_eval_dot_mrr@10": 0.8906325355250079,
      "eval_info_retr_eval_dot_ndcg@10": 0.9045724071765342,
      "eval_info_retr_eval_dot_precision@1": 0.8613178935759581,
      "eval_info_retr_eval_dot_precision@10": 0.09482584321294,
      "eval_info_retr_eval_dot_precision@3": 0.30423061605857304,
      "eval_info_retr_eval_dot_precision@5": 0.18568146310081796,
      "eval_info_retr_eval_dot_recall@1": 0.8613178935759581,
      "eval_info_retr_eval_dot_recall@10": 0.9482584321293999,
      "eval_info_retr_eval_dot_recall@3": 0.9126918481757191,
      "eval_info_retr_eval_dot_recall@5": 0.9284073155040897,
      "eval_loss": 0.49234136939048767,
      "eval_para_mine_eval_average_precision": 0.5057185080416585,
      "eval_para_mine_eval_f1": 0.634543585033742,
      "eval_para_mine_eval_precision": 0.7090381773055578,
      "eval_para_mine_eval_recall": 0.5742141802134666,
      "eval_para_mine_eval_threshold": 0.8692877888679504,
      "eval_runtime": 46.7669,
      "eval_samples_per_second": 232.665,
      "eval_sequential_score": 0.8925029461858842,
      "eval_steps_per_second": 1.839,
      "step": 248
    },
    {
      "epoch": 0.4565537555228277,
      "grad_norm": 3.5897247791290283,
      "learning_rate": 4.463087248322148e-05,
      "loss": 0.4993,
      "step": 310
    },
    {
      "epoch": 0.4565537555228277,
      "eval_info_retr_eval_dot_accuracy@1": 0.8651778329197684,
      "eval_info_retr_eval_dot_accuracy@10": 0.9506479183898539,
      "eval_info_retr_eval_dot_accuracy@3": 0.9142542045767852,
      "eval_info_retr_eval_dot_accuracy@5": 0.9308887050822535,
      "eval_info_retr_eval_dot_map@100": 0.8952610946722075,
      "eval_info_retr_eval_dot_mrr@10": 0.8935005390202521,
      "eval_info_retr_eval_dot_ndcg@10": 0.9073002136944609,
      "eval_info_retr_eval_dot_precision@1": 0.8651778329197684,
      "eval_info_retr_eval_dot_precision@10": 0.09506479183898539,
      "eval_info_retr_eval_dot_precision@3": 0.3047514015255951,
      "eval_info_retr_eval_dot_precision@5": 0.18617774101645068,
      "eval_info_retr_eval_dot_recall@1": 0.8651778329197684,
      "eval_info_retr_eval_dot_recall@10": 0.9506479183898539,
      "eval_info_retr_eval_dot_recall@3": 0.9142542045767852,
      "eval_info_retr_eval_dot_recall@5": 0.9308887050822535,
      "eval_loss": 0.49423983693122864,
      "eval_para_mine_eval_average_precision": 0.5094425990878857,
      "eval_para_mine_eval_f1": 0.6359308330329982,
      "eval_para_mine_eval_precision": 0.7193390578495433,
      "eval_para_mine_eval_recall": 0.5698554154828743,
      "eval_para_mine_eval_threshold": 0.8585812747478485,
      "eval_runtime": 47.1777,
      "eval_samples_per_second": 230.639,
      "eval_sequential_score": 0.8952610946722075,
      "eval_steps_per_second": 1.823,
      "step": 310
    },
    {
      "epoch": 0.5478645066273933,
      "grad_norm": 5.185989856719971,
      "learning_rate": 4.3030459473412496e-05,
      "loss": 0.5339,
      "step": 372
    },
    {
      "epoch": 0.5478645066273933,
      "eval_info_retr_eval_dot_accuracy@1": 0.8665563826854149,
      "eval_info_retr_eval_dot_accuracy@10": 0.9531293079680176,
      "eval_info_retr_eval_dot_accuracy@3": 0.9180222406028857,
      "eval_info_retr_eval_dot_accuracy@5": 0.9335539012958368,
      "eval_info_retr_eval_dot_map@100": 0.8979226074859789,
      "eval_info_retr_eval_dot_mrr@10": 0.8961890028198282,
      "eval_info_retr_eval_dot_ndcg@10": 0.9099837143266869,
      "eval_info_retr_eval_dot_precision@1": 0.8665563826854149,
      "eval_info_retr_eval_dot_precision@10": 0.09531293079680178,
      "eval_info_retr_eval_dot_precision@3": 0.3060074135342952,
      "eval_info_retr_eval_dot_precision@5": 0.18671078025916735,
      "eval_info_retr_eval_dot_recall@1": 0.8665563826854149,
      "eval_info_retr_eval_dot_recall@10": 0.9531293079680176,
      "eval_info_retr_eval_dot_recall@3": 0.9180222406028857,
      "eval_info_retr_eval_dot_recall@5": 0.9335539012958368,
      "eval_loss": 0.46397796273231506,
      "eval_para_mine_eval_average_precision": 0.5171675614798505,
      "eval_para_mine_eval_f1": 0.6460162421829887,
      "eval_para_mine_eval_precision": 0.7083665639212813,
      "eval_para_mine_eval_recall": 0.5937540933995203,
      "eval_para_mine_eval_threshold": 0.8755151331424713,
      "eval_runtime": 47.3437,
      "eval_samples_per_second": 229.83,
      "eval_sequential_score": 0.8979226074859789,
      "eval_steps_per_second": 1.817,
      "step": 372
    },
    {
      "epoch": 0.6391752577319587,
      "grad_norm": 5.517925262451172,
      "learning_rate": 4.1430046463603515e-05,
      "loss": 0.4712,
      "step": 434
    },
    {
      "epoch": 0.6391752577319587,
      "eval_info_retr_eval_dot_accuracy@1": 0.876114327727231,
      "eval_info_retr_eval_dot_accuracy@10": 0.9580001838066354,
      "eval_info_retr_eval_dot_accuracy@3": 0.9218821799466961,
      "eval_info_retr_eval_dot_accuracy@5": 0.9385166804521643,
      "eval_info_retr_eval_dot_map@100": 0.9048794424295332,
      "eval_info_retr_eval_dot_mrr@10": 0.9033319693713965,
      "eval_info_retr_eval_dot_ndcg@10": 0.9165326554505013,
      "eval_info_retr_eval_dot_precision@1": 0.876114327727231,
      "eval_info_retr_eval_dot_precision@10": 0.09580001838066356,
      "eval_info_retr_eval_dot_precision@3": 0.30729405998223197,
      "eval_info_retr_eval_dot_precision@5": 0.18770333609043288,
      "eval_info_retr_eval_dot_recall@1": 0.876114327727231,
      "eval_info_retr_eval_dot_recall@10": 0.9580001838066354,
      "eval_info_retr_eval_dot_recall@3": 0.9218821799466961,
      "eval_info_retr_eval_dot_recall@5": 0.9385166804521643,
      "eval_loss": 0.43524134159088135,
      "eval_para_mine_eval_average_precision": 0.5120496793668291,
      "eval_para_mine_eval_f1": 0.6373077701335491,
      "eval_para_mine_eval_precision": 0.7241775739076951,
      "eval_para_mine_eval_recall": 0.5690468985017593,
      "eval_para_mine_eval_threshold": 0.8673346936702728,
      "eval_runtime": 47.1044,
      "eval_samples_per_second": 230.997,
      "eval_sequential_score": 0.9048794424295332,
      "eval_steps_per_second": 1.826,
      "step": 434
    },
    {
      "epoch": 0.7304860088365243,
      "grad_norm": 5.404409408569336,
      "learning_rate": 3.9829633453794526e-05,
      "loss": 0.4551,
      "step": 496
    },
    {
      "epoch": 0.7304860088365243,
      "eval_info_retr_eval_dot_accuracy@1": 0.8799742670710413,
      "eval_info_retr_eval_dot_accuracy@10": 0.9583677970774745,
      "eval_info_retr_eval_dot_accuracy@3": 0.9246392794779892,
      "eval_info_retr_eval_dot_accuracy@5": 0.9411818766657476,
      "eval_info_retr_eval_dot_map@100": 0.9077432063489332,
      "eval_info_retr_eval_dot_mrr@10": 0.9062031821888451,
      "eval_info_retr_eval_dot_ndcg@10": 0.9188197267902801,
      "eval_info_retr_eval_dot_precision@1": 0.8799742670710413,
      "eval_info_retr_eval_dot_precision@10": 0.09583677970774747,
      "eval_info_retr_eval_dot_precision@3": 0.30821309315932965,
      "eval_info_retr_eval_dot_precision@5": 0.18823637533314955,
      "eval_info_retr_eval_dot_recall@1": 0.8799742670710413,
      "eval_info_retr_eval_dot_recall@10": 0.9583677970774745,
      "eval_info_retr_eval_dot_recall@3": 0.9246392794779892,
      "eval_info_retr_eval_dot_recall@5": 0.9411818766657476,
      "eval_loss": 0.43508002161979675,
      "eval_para_mine_eval_average_precision": 0.5098966109274621,
      "eval_para_mine_eval_f1": 0.6349388484094101,
      "eval_para_mine_eval_precision": 0.7090408699915318,
      "eval_para_mine_eval_recall": 0.5748600904274299,
      "eval_para_mine_eval_threshold": 0.8756376802921295,
      "eval_runtime": 46.9049,
      "eval_samples_per_second": 231.98,
      "eval_sequential_score": 0.9077432063489332,
      "eval_steps_per_second": 1.833,
      "step": 496
    },
    {
      "epoch": 0.8217967599410898,
      "grad_norm": 5.574550151824951,
      "learning_rate": 3.8229220443985544e-05,
      "loss": 0.5675,
      "step": 558
    },
    {
      "epoch": 0.8217967599410898,
      "eval_info_retr_eval_dot_accuracy@1": 0.8838342064148516,
      "eval_info_retr_eval_dot_accuracy@10": 0.9589192169837331,
      "eval_info_retr_eval_dot_accuracy@3": 0.9250068927488282,
      "eval_info_retr_eval_dot_accuracy@5": 0.9407223600771988,
      "eval_info_retr_eval_dot_map@100": 0.9101926203565123,
      "eval_info_retr_eval_dot_mrr@10": 0.9085925955101584,
      "eval_info_retr_eval_dot_ndcg@10": 0.9207315014698775,
      "eval_info_retr_eval_dot_precision@1": 0.8838342064148516,
      "eval_info_retr_eval_dot_precision@10": 0.09589192169837332,
      "eval_info_retr_eval_dot_precision@3": 0.3083356309162761,
      "eval_info_retr_eval_dot_precision@5": 0.18814447201543977,
      "eval_info_retr_eval_dot_recall@1": 0.8838342064148516,
      "eval_info_retr_eval_dot_recall@10": 0.9589192169837331,
      "eval_info_retr_eval_dot_recall@3": 0.9250068927488282,
      "eval_info_retr_eval_dot_recall@5": 0.9407223600771988,
      "eval_loss": 0.4080217182636261,
      "eval_para_mine_eval_average_precision": 0.5334326202140158,
      "eval_para_mine_eval_f1": 0.6571024883172905,
      "eval_para_mine_eval_precision": 0.7344628039218969,
      "eval_para_mine_eval_recall": 0.5944858238517027,
      "eval_para_mine_eval_threshold": 0.8824244141578674,
      "eval_runtime": 46.9444,
      "eval_samples_per_second": 231.785,
      "eval_sequential_score": 0.9101926203565123,
      "eval_steps_per_second": 1.832,
      "step": 558
    },
    {
      "epoch": 0.9131075110456554,
      "grad_norm": 7.1312103271484375,
      "learning_rate": 3.662880743417656e-05,
      "loss": 0.5189,
      "step": 620
    },
    {
      "epoch": 0.9131075110456554,
      "eval_info_retr_eval_dot_accuracy@1": 0.8812609135189781,
      "eval_info_retr_eval_dot_accuracy@10": 0.9581839904420549,
      "eval_info_retr_eval_dot_accuracy@3": 0.9273963790092823,
      "eval_info_retr_eval_dot_accuracy@5": 0.9409061667126183,
      "eval_info_retr_eval_dot_map@100": 0.9088995825285359,
      "eval_info_retr_eval_dot_mrr@10": 0.907332134213855,
      "eval_info_retr_eval_dot_ndcg@10": 0.9196508765398915,
      "eval_info_retr_eval_dot_precision@1": 0.8812609135189781,
      "eval_info_retr_eval_dot_precision@10": 0.09581839904420549,
      "eval_info_retr_eval_dot_precision@3": 0.3091321263364274,
      "eval_info_retr_eval_dot_precision@5": 0.1881812333425237,
      "eval_info_retr_eval_dot_recall@1": 0.8812609135189781,
      "eval_info_retr_eval_dot_recall@10": 0.9581839904420549,
      "eval_info_retr_eval_dot_recall@3": 0.9273963790092823,
      "eval_info_retr_eval_dot_recall@5": 0.9409061667126183,
      "eval_loss": 0.3979346752166748,
      "eval_para_mine_eval_average_precision": 0.5429228832902425,
      "eval_para_mine_eval_f1": 0.6632612084554468,
      "eval_para_mine_eval_precision": 0.7405866363656618,
      "eval_para_mine_eval_recall": 0.60055647649203,
      "eval_para_mine_eval_threshold": 0.8737862706184387,
      "eval_runtime": 47.0589,
      "eval_samples_per_second": 231.221,
      "eval_sequential_score": 0.9088995825285359,
      "eval_steps_per_second": 1.827,
      "step": 620
    },
    {
      "epoch": 1.004418262150221,
      "grad_norm": 2.313579559326172,
      "learning_rate": 3.502839442436758e-05,
      "loss": 0.4278,
      "step": 682
    },
    {
      "epoch": 1.004418262150221,
      "eval_info_retr_eval_dot_accuracy@1": 0.886039886039886,
      "eval_info_retr_eval_dot_accuracy@10": 0.9605734767025089,
      "eval_info_retr_eval_dot_accuracy@3": 0.9296939619520265,
      "eval_info_retr_eval_dot_accuracy@5": 0.9435713629262016,
      "eval_info_retr_eval_dot_map@100": 0.912725086164855,
      "eval_info_retr_eval_dot_mrr@10": 0.9111236201738,
      "eval_info_retr_eval_dot_ndcg@10": 0.9230849032296308,
      "eval_info_retr_eval_dot_precision@1": 0.886039886039886,
      "eval_info_retr_eval_dot_precision@10": 0.0960573476702509,
      "eval_info_retr_eval_dot_precision@3": 0.30989798731734214,
      "eval_info_retr_eval_dot_precision@5": 0.18871427258524037,
      "eval_info_retr_eval_dot_recall@1": 0.886039886039886,
      "eval_info_retr_eval_dot_recall@10": 0.9605734767025089,
      "eval_info_retr_eval_dot_recall@3": 0.9296939619520265,
      "eval_info_retr_eval_dot_recall@5": 0.9435713629262016,
      "eval_loss": 0.4062098264694214,
      "eval_para_mine_eval_average_precision": 0.5569159802538414,
      "eval_para_mine_eval_f1": 0.6778007972895148,
      "eval_para_mine_eval_precision": 0.7563934207304859,
      "eval_para_mine_eval_recall": 0.6140031527645409,
      "eval_para_mine_eval_threshold": 0.8800513744354248,
      "eval_runtime": 47.9405,
      "eval_samples_per_second": 226.969,
      "eval_sequential_score": 0.912725086164855,
      "eval_steps_per_second": 1.794,
      "step": 682
    },
    {
      "epoch": 1.0559646539027983,
      "grad_norm": 3.6702966690063477,
      "learning_rate": 3.342798141455859e-05,
      "loss": 0.337,
      "step": 744
    },
    {
      "epoch": 1.0559646539027983,
      "eval_info_retr_eval_dot_accuracy@1": 0.8869589192169838,
      "eval_info_retr_eval_dot_accuracy@10": 0.9636981895046411,
      "eval_info_retr_eval_dot_accuracy@3": 0.9324510614833196,
      "eval_info_retr_eval_dot_accuracy@5": 0.9460527525043654,
      "eval_info_retr_eval_dot_map@100": 0.9139823556373721,
      "eval_info_retr_eval_dot_mrr@10": 0.9125556343298289,
      "eval_info_retr_eval_dot_ndcg@10": 0.924918869014723,
      "eval_info_retr_eval_dot_precision@1": 0.8869589192169838,
      "eval_info_retr_eval_dot_precision@10": 0.09636981895046412,
      "eval_info_retr_eval_dot_precision@3": 0.31081702049443977,
      "eval_info_retr_eval_dot_precision@5": 0.1892105505008731,
      "eval_info_retr_eval_dot_recall@1": 0.8869589192169838,
      "eval_info_retr_eval_dot_recall@10": 0.9636981895046411,
      "eval_info_retr_eval_dot_recall@3": 0.9324510614833196,
      "eval_info_retr_eval_dot_recall@5": 0.9460527525043654,
      "eval_loss": 0.4025246500968933,
      "eval_para_mine_eval_average_precision": 0.5442347943347751,
      "eval_para_mine_eval_f1": 0.6641819581357237,
      "eval_para_mine_eval_precision": 0.7375383953633291,
      "eval_para_mine_eval_recall": 0.604097690532221,
      "eval_para_mine_eval_threshold": 0.8758298754692078,
      "eval_runtime": 47.2224,
      "eval_samples_per_second": 230.42,
      "eval_sequential_score": 0.9139823556373721,
      "eval_steps_per_second": 1.821,
      "step": 744
    },
    {
      "epoch": 1.1472754050073637,
      "grad_norm": 3.720041036605835,
      "learning_rate": 3.182756840474961e-05,
      "loss": 0.3788,
      "step": 806
    },
    {
      "epoch": 1.1472754050073637,
      "eval_info_retr_eval_dot_accuracy@1": 0.882455656649205,
      "eval_info_retr_eval_dot_accuracy@10": 0.9624115430567044,
      "eval_info_retr_eval_dot_accuracy@3": 0.9284073155040897,
      "eval_info_retr_eval_dot_accuracy@5": 0.9443984927855895,
      "eval_info_retr_eval_dot_map@100": 0.9105324753022828,
      "eval_info_retr_eval_dot_mrr@10": 0.9090466051935585,
      "eval_info_retr_eval_dot_ndcg@10": 0.9219529245233927,
      "eval_info_retr_eval_dot_precision@1": 0.882455656649205,
      "eval_info_retr_eval_dot_precision@10": 0.09624115430567044,
      "eval_info_retr_eval_dot_precision@3": 0.3094691051680299,
      "eval_info_retr_eval_dot_precision@5": 0.18887969855711795,
      "eval_info_retr_eval_dot_recall@1": 0.882455656649205,
      "eval_info_retr_eval_dot_recall@10": 0.9624115430567044,
      "eval_info_retr_eval_dot_recall@3": 0.9284073155040897,
      "eval_info_retr_eval_dot_recall@5": 0.9443984927855895,
      "eval_loss": 0.38206225633621216,
      "eval_para_mine_eval_average_precision": 0.5650597252874483,
      "eval_para_mine_eval_f1": 0.684371051800379,
      "eval_para_mine_eval_precision": 0.7542356748524652,
      "eval_para_mine_eval_recall": 0.6263522333587783,
      "eval_para_mine_eval_threshold": 0.8642670810222626,
      "eval_runtime": 47.1588,
      "eval_samples_per_second": 230.731,
      "eval_sequential_score": 0.9105324753022828,
      "eval_steps_per_second": 1.824,
      "step": 806
    },
    {
      "epoch": 1.2385861561119293,
      "grad_norm": 2.3984501361846924,
      "learning_rate": 3.0227155394940632e-05,
      "loss": 0.2921,
      "step": 868
    },
    {
      "epoch": 1.2385861561119293,
      "eval_info_retr_eval_dot_accuracy@1": 0.8853046594982079,
      "eval_info_retr_eval_dot_accuracy@10": 0.9623196397389946,
      "eval_info_retr_eval_dot_accuracy@3": 0.9301534785405753,
      "eval_info_retr_eval_dot_accuracy@5": 0.9438470728793309,
      "eval_info_retr_eval_dot_map@100": 0.9123716441222456,
      "eval_info_retr_eval_dot_mrr@10": 0.9109295291194935,
      "eval_info_retr_eval_dot_ndcg@10": 0.9233517208473251,
      "eval_info_retr_eval_dot_precision@1": 0.8853046594982079,
      "eval_info_retr_eval_dot_precision@10": 0.09623196397389946,
      "eval_info_retr_eval_dot_precision@3": 0.3100511595135251,
      "eval_info_retr_eval_dot_precision@5": 0.18876941457586618,
      "eval_info_retr_eval_dot_recall@1": 0.8853046594982079,
      "eval_info_retr_eval_dot_recall@10": 0.9623196397389946,
      "eval_info_retr_eval_dot_recall@3": 0.9301534785405753,
      "eval_info_retr_eval_dot_recall@5": 0.9438470728793309,
      "eval_loss": 0.38938164710998535,
      "eval_para_mine_eval_average_precision": 0.562639634596526,
      "eval_para_mine_eval_f1": 0.6812942943315669,
      "eval_para_mine_eval_precision": 0.756277142164319,
      "eval_para_mine_eval_recall": 0.6198389289634271,
      "eval_para_mine_eval_threshold": 0.8650586903095245,
      "eval_runtime": 47.164,
      "eval_samples_per_second": 230.706,
      "eval_sequential_score": 0.9123716441222456,
      "eval_steps_per_second": 1.823,
      "step": 868
    },
    {
      "epoch": 1.3298969072164948,
      "grad_norm": 2.1422321796417236,
      "learning_rate": 2.862674238513165e-05,
      "loss": 0.2719,
      "step": 930
    },
    {
      "epoch": 1.3298969072164948,
      "eval_info_retr_eval_dot_accuracy@1": 0.8885212756180498,
      "eval_info_retr_eval_dot_accuracy@10": 0.9656281591765463,
      "eval_info_retr_eval_dot_accuracy@3": 0.9345648377906443,
      "eval_info_retr_eval_dot_accuracy@5": 0.9500045951658855,
      "eval_info_retr_eval_dot_map@100": 0.9159948831907755,
      "eval_info_retr_eval_dot_mrr@10": 0.9146445748596291,
      "eval_info_retr_eval_dot_ndcg@10": 0.9270088047632189,
      "eval_info_retr_eval_dot_precision@1": 0.8885212756180498,
      "eval_info_retr_eval_dot_precision@10": 0.09656281591765466,
      "eval_info_retr_eval_dot_precision@3": 0.3115216125968814,
      "eval_info_retr_eval_dot_precision@5": 0.19000091903317715,
      "eval_info_retr_eval_dot_recall@1": 0.8885212756180498,
      "eval_info_retr_eval_dot_recall@10": 0.9656281591765463,
      "eval_info_retr_eval_dot_recall@3": 0.9345648377906443,
      "eval_info_retr_eval_dot_recall@5": 0.9500045951658855,
      "eval_loss": 0.3813144862651825,
      "eval_para_mine_eval_average_precision": 0.5562771586743412,
      "eval_para_mine_eval_f1": 0.6790739258140527,
      "eval_para_mine_eval_precision": 0.7701738104240424,
      "eval_para_mine_eval_recall": 0.6072459382184622,
      "eval_para_mine_eval_threshold": 0.8749864101409912,
      "eval_runtime": 46.8836,
      "eval_samples_per_second": 232.085,
      "eval_sequential_score": 0.9159948831907755,
      "eval_steps_per_second": 1.834,
      "step": 930
    },
    {
      "epoch": 1.4212076583210604,
      "grad_norm": 2.2384369373321533,
      "learning_rate": 2.702632937532267e-05,
      "loss": 0.2713,
      "step": 992
    },
    {
      "epoch": 1.4212076583210604,
      "eval_info_retr_eval_dot_accuracy@1": 0.889256502159728,
      "eval_info_retr_eval_dot_accuracy@10": 0.9640658027754802,
      "eval_info_retr_eval_dot_accuracy@3": 0.9335539012958368,
      "eval_info_retr_eval_dot_accuracy@5": 0.9473393989523021,
      "eval_info_retr_eval_dot_map@100": 0.9160609261046996,
      "eval_info_retr_eval_dot_mrr@10": 0.9146857125351749,
      "eval_info_retr_eval_dot_ndcg@10": 0.9266566721638121,
      "eval_info_retr_eval_dot_precision@1": 0.889256502159728,
      "eval_info_retr_eval_dot_precision@10": 0.09640658027754802,
      "eval_info_retr_eval_dot_precision@3": 0.3111846337652789,
      "eval_info_retr_eval_dot_precision@5": 0.18946787979046048,
      "eval_info_retr_eval_dot_recall@1": 0.889256502159728,
      "eval_info_retr_eval_dot_recall@10": 0.9640658027754802,
      "eval_info_retr_eval_dot_recall@3": 0.9335539012958368,
      "eval_info_retr_eval_dot_recall@5": 0.9473393989523021,
      "eval_loss": 0.379529744386673,
      "eval_para_mine_eval_average_precision": 0.5652640358968563,
      "eval_para_mine_eval_f1": 0.6830371726971242,
      "eval_para_mine_eval_precision": 0.7554402272988553,
      "eval_para_mine_eval_recall": 0.6232988396200422,
      "eval_para_mine_eval_threshold": 0.8636217713356018,
      "eval_runtime": 47.0681,
      "eval_samples_per_second": 231.176,
      "eval_sequential_score": 0.9160609261046996,
      "eval_steps_per_second": 1.827,
      "step": 992
    },
    {
      "epoch": 1.5125184094256259,
      "grad_norm": 1.37623131275177,
      "learning_rate": 2.542591636551368e-05,
      "loss": 0.2498,
      "step": 1054
    },
    {
      "epoch": 1.5125184094256259,
      "eval_info_retr_eval_dot_accuracy@1": 0.8875103391232424,
      "eval_info_retr_eval_dot_accuracy@10": 0.9651686425879974,
      "eval_info_retr_eval_dot_accuracy@3": 0.9322672548479,
      "eval_info_retr_eval_dot_accuracy@5": 0.9468798823637533,
      "eval_info_retr_eval_dot_map@100": 0.9147389573171367,
      "eval_info_retr_eval_dot_mrr@10": 0.9134388179191052,
      "eval_info_retr_eval_dot_ndcg@10": 0.9259428646968195,
      "eval_info_retr_eval_dot_precision@1": 0.8875103391232424,
      "eval_info_retr_eval_dot_precision@10": 0.09651686425879975,
      "eval_info_retr_eval_dot_precision@3": 0.31075575161596664,
      "eval_info_retr_eval_dot_precision@5": 0.1893759764727507,
      "eval_info_retr_eval_dot_recall@1": 0.8875103391232424,
      "eval_info_retr_eval_dot_recall@10": 0.9651686425879974,
      "eval_info_retr_eval_dot_recall@3": 0.9322672548479,
      "eval_info_retr_eval_dot_recall@5": 0.9468798823637533,
      "eval_loss": 0.3791400194168091,
      "eval_para_mine_eval_average_precision": 0.5531609578399229,
      "eval_para_mine_eval_f1": 0.6710056459938674,
      "eval_para_mine_eval_precision": 0.7802172142925567,
      "eval_para_mine_eval_recall": 0.5886139128156717,
      "eval_para_mine_eval_threshold": 0.8832797706127167,
      "eval_runtime": 46.8924,
      "eval_samples_per_second": 232.042,
      "eval_sequential_score": 0.9147389573171367,
      "eval_steps_per_second": 1.834,
      "step": 1054
    },
    {
      "epoch": 1.6038291605301915,
      "grad_norm": 3.7942512035369873,
      "learning_rate": 2.38255033557047e-05,
      "loss": 0.2785,
      "step": 1116
    },
    {
      "epoch": 1.6038291605301915,
      "eval_info_retr_eval_dot_accuracy@1": 0.8900836320191159,
      "eval_info_retr_eval_dot_accuracy@10": 0.9648929326348681,
      "eval_info_retr_eval_dot_accuracy@3": 0.9332781913427075,
      "eval_info_retr_eval_dot_accuracy@5": 0.9466960757283338,
      "eval_info_retr_eval_dot_map@100": 0.9161105864746074,
      "eval_info_retr_eval_dot_mrr@10": 0.9147435168044494,
      "eval_info_retr_eval_dot_ndcg@10": 0.9268526071520827,
      "eval_info_retr_eval_dot_precision@1": 0.8900836320191159,
      "eval_info_retr_eval_dot_precision@10": 0.09648929326348682,
      "eval_info_retr_eval_dot_precision@3": 0.31109273044756913,
      "eval_info_retr_eval_dot_precision@5": 0.1893392151456668,
      "eval_info_retr_eval_dot_recall@1": 0.8900836320191159,
      "eval_info_retr_eval_dot_recall@10": 0.9648929326348681,
      "eval_info_retr_eval_dot_recall@3": 0.9332781913427075,
      "eval_info_retr_eval_dot_recall@5": 0.9466960757283338,
      "eval_loss": 0.3756929337978363,
      "eval_para_mine_eval_average_precision": 0.5534577957590571,
      "eval_para_mine_eval_f1": 0.6721510117453017,
      "eval_para_mine_eval_precision": 0.763900548546983,
      "eval_para_mine_eval_recall": 0.6000776898998613,
      "eval_para_mine_eval_threshold": 0.8725496828556061,
      "eval_runtime": 47.1739,
      "eval_samples_per_second": 230.657,
      "eval_sequential_score": 0.9161105864746074,
      "eval_steps_per_second": 1.823,
      "step": 1116
    },
    {
      "epoch": 1.695139911634757,
      "grad_norm": 2.6778645515441895,
      "learning_rate": 2.2225090345895717e-05,
      "loss": 0.2428,
      "step": 1178
    },
    {
      "epoch": 1.695139911634757,
      "eval_info_retr_eval_dot_accuracy@1": 0.8910945685139233,
      "eval_info_retr_eval_dot_accuracy@10": 0.9671905155776124,
      "eval_info_retr_eval_dot_accuracy@3": 0.9344729344729344,
      "eval_info_retr_eval_dot_accuracy@5": 0.9494531752596269,
      "eval_info_retr_eval_dot_map@100": 0.9174675014460509,
      "eval_info_retr_eval_dot_mrr@10": 0.916212365226703,
      "eval_info_retr_eval_dot_ndcg@10": 0.9285204933191614,
      "eval_info_retr_eval_dot_precision@1": 0.8910945685139233,
      "eval_info_retr_eval_dot_precision@10": 0.09671905155776124,
      "eval_info_retr_eval_dot_precision@3": 0.3114909781576448,
      "eval_info_retr_eval_dot_precision@5": 0.1898906350519254,
      "eval_info_retr_eval_dot_recall@1": 0.8910945685139233,
      "eval_info_retr_eval_dot_recall@10": 0.9671905155776124,
      "eval_info_retr_eval_dot_recall@3": 0.9344729344729344,
      "eval_info_retr_eval_dot_recall@5": 0.9494531752596269,
      "eval_loss": 0.36561650037765503,
      "eval_para_mine_eval_average_precision": 0.5544895514233957,
      "eval_para_mine_eval_f1": 0.6734225611719457,
      "eval_para_mine_eval_precision": 0.7675405136740874,
      "eval_para_mine_eval_recall": 0.5998653977316356,
      "eval_para_mine_eval_threshold": 0.8776430785655975,
      "eval_runtime": 47.0859,
      "eval_samples_per_second": 231.088,
      "eval_sequential_score": 0.9174675014460509,
      "eval_steps_per_second": 1.826,
      "step": 1178
    },
    {
      "epoch": 1.7864506627393224,
      "grad_norm": 3.110546112060547,
      "learning_rate": 2.0624677336086735e-05,
      "loss": 0.2935,
      "step": 1240
    },
    {
      "epoch": 1.7864506627393224,
      "eval_info_retr_eval_dot_accuracy@1": 0.8924731182795699,
      "eval_info_retr_eval_dot_accuracy@10": 0.9664552890359343,
      "eval_info_retr_eval_dot_accuracy@3": 0.9348405477437736,
      "eval_info_retr_eval_dot_accuracy@5": 0.9497288852127562,
      "eval_info_retr_eval_dot_map@100": 0.9183095474671825,
      "eval_info_retr_eval_dot_mrr@10": 0.9169947469230629,
      "eval_info_retr_eval_dot_ndcg@10": 0.9289448948774749,
      "eval_info_retr_eval_dot_precision@1": 0.8924731182795699,
      "eval_info_retr_eval_dot_precision@10": 0.09664552890359342,
      "eval_info_retr_eval_dot_precision@3": 0.31161351591459113,
      "eval_info_retr_eval_dot_precision@5": 0.18994577704255125,
      "eval_info_retr_eval_dot_recall@1": 0.8924731182795699,
      "eval_info_retr_eval_dot_recall@10": 0.9664552890359343,
      "eval_info_retr_eval_dot_recall@3": 0.9348405477437736,
      "eval_info_retr_eval_dot_recall@5": 0.9497288852127562,
      "eval_loss": 0.36679840087890625,
      "eval_para_mine_eval_average_precision": 0.5492627712847419,
      "eval_para_mine_eval_f1": 0.6682617615424452,
      "eval_para_mine_eval_precision": 0.7445174891126459,
      "eval_para_mine_eval_recall": 0.6061754436680473,
      "eval_para_mine_eval_threshold": 0.8671578168869019,
      "eval_runtime": 47.2606,
      "eval_samples_per_second": 230.234,
      "eval_sequential_score": 0.9183095474671825,
      "eval_steps_per_second": 1.82,
      "step": 1240
    },
    {
      "epoch": 1.877761413843888,
      "grad_norm": 4.477660655975342,
      "learning_rate": 1.902426432627775e-05,
      "loss": 0.2823,
      "step": 1302
    },
    {
      "epoch": 1.877761413843888,
      "eval_info_retr_eval_dot_accuracy@1": 0.8939435713629262,
      "eval_info_retr_eval_dot_accuracy@10": 0.9648010293171584,
      "eval_info_retr_eval_dot_accuracy@3": 0.9359433875562908,
      "eval_info_retr_eval_dot_accuracy@5": 0.9485341420825292,
      "eval_info_retr_eval_dot_map@100": 0.9191298943799292,
      "eval_info_retr_eval_dot_mrr@10": 0.9177682665137863,
      "eval_info_retr_eval_dot_ndcg@10": 0.9291509217029374,
      "eval_info_retr_eval_dot_precision@1": 0.8939435713629262,
      "eval_info_retr_eval_dot_precision@10": 0.09648010293171583,
      "eval_info_retr_eval_dot_precision@3": 0.3119811291854302,
      "eval_info_retr_eval_dot_precision@5": 0.18970682841650582,
      "eval_info_retr_eval_dot_recall@1": 0.8939435713629262,
      "eval_info_retr_eval_dot_recall@10": 0.9648010293171584,
      "eval_info_retr_eval_dot_recall@3": 0.9359433875562908,
      "eval_info_retr_eval_dot_recall@5": 0.9485341420825292,
      "eval_loss": 0.3716655969619751,
      "eval_para_mine_eval_average_precision": 0.557578455456071,
      "eval_para_mine_eval_f1": 0.6753797157651423,
      "eval_para_mine_eval_precision": 0.7440590076966561,
      "eval_para_mine_eval_recall": 0.6183077152394159,
      "eval_para_mine_eval_threshold": 0.863526463508606,
      "eval_runtime": 46.6942,
      "eval_samples_per_second": 233.027,
      "eval_sequential_score": 0.9191298943799292,
      "eval_steps_per_second": 1.842,
      "step": 1302
    },
    {
      "epoch": 1.9690721649484537,
      "grad_norm": 4.546482563018799,
      "learning_rate": 1.742385131646877e-05,
      "loss": 0.2938,
      "step": 1364
    },
    {
      "epoch": 1.9690721649484537,
      "eval_info_retr_eval_dot_accuracy@1": 0.8946787979046044,
      "eval_info_retr_eval_dot_accuracy@10": 0.9646172226817388,
      "eval_info_retr_eval_dot_accuracy@3": 0.9373219373219374,
      "eval_info_retr_eval_dot_accuracy@5": 0.9487179487179487,
      "eval_info_retr_eval_dot_map@100": 0.9200289882479742,
      "eval_info_retr_eval_dot_mrr@10": 0.9186748635673371,
      "eval_info_retr_eval_dot_ndcg@10": 0.9298216358313898,
      "eval_info_retr_eval_dot_precision@1": 0.8946787979046044,
      "eval_info_retr_eval_dot_precision@10": 0.09646172226817387,
      "eval_info_retr_eval_dot_precision@3": 0.31244064577397906,
      "eval_info_retr_eval_dot_precision@5": 0.18974358974358976,
      "eval_info_retr_eval_dot_recall@1": 0.8946787979046044,
      "eval_info_retr_eval_dot_recall@10": 0.9646172226817388,
      "eval_info_retr_eval_dot_recall@3": 0.9373219373219374,
      "eval_info_retr_eval_dot_recall@5": 0.9487179487179487,
      "eval_loss": 0.3621634840965271,
      "eval_para_mine_eval_average_precision": 0.5594570173517496,
      "eval_para_mine_eval_f1": 0.6766163284568192,
      "eval_para_mine_eval_precision": 0.7421746515327168,
      "eval_para_mine_eval_recall": 0.6216998730763845,
      "eval_para_mine_eval_threshold": 0.8676250278949738,
      "eval_runtime": 47.3006,
      "eval_samples_per_second": 230.039,
      "eval_sequential_score": 0.9200289882479742,
      "eval_steps_per_second": 1.818,
      "step": 1364
    },
    {
      "epoch": 2.020618556701031,
      "grad_norm": 3.241508722305298,
      "learning_rate": 1.5823438306659787e-05,
      "loss": 0.216,
      "step": 1426
    },
    {
      "epoch": 2.020618556701031,
      "eval_info_retr_eval_dot_accuracy@1": 0.893208344821248,
      "eval_info_retr_eval_dot_accuracy@10": 0.9661795790828049,
      "eval_info_retr_eval_dot_accuracy@3": 0.9362190975094201,
      "eval_info_retr_eval_dot_accuracy@5": 0.9500964984835952,
      "eval_info_retr_eval_dot_map@100": 0.9191773519681701,
      "eval_info_retr_eval_dot_mrr@10": 0.9178556476047521,
      "eval_info_retr_eval_dot_ndcg@10": 0.9295559143323862,
      "eval_info_retr_eval_dot_precision@1": 0.893208344821248,
      "eval_info_retr_eval_dot_precision@10": 0.09661795790828051,
      "eval_info_retr_eval_dot_precision@3": 0.31207303250314,
      "eval_info_retr_eval_dot_precision@5": 0.19001929969671905,
      "eval_info_retr_eval_dot_recall@1": 0.893208344821248,
      "eval_info_retr_eval_dot_recall@10": 0.9661795790828049,
      "eval_info_retr_eval_dot_recall@3": 0.9362190975094201,
      "eval_info_retr_eval_dot_recall@5": 0.9500964984835952,
      "eval_loss": 0.3684485852718353,
      "eval_para_mine_eval_average_precision": 0.5665176151429165,
      "eval_para_mine_eval_f1": 0.6839674754190774,
      "eval_para_mine_eval_precision": 0.7722483633387889,
      "eval_para_mine_eval_recall": 0.6137998943056013,
      "eval_para_mine_eval_threshold": 0.886872798204422,
      "eval_runtime": 47.5509,
      "eval_samples_per_second": 228.829,
      "eval_sequential_score": 0.9191773519681701,
      "eval_steps_per_second": 1.809,
      "step": 1426
    },
    {
      "epoch": 2.1119293078055965,
      "grad_norm": 2.4362664222717285,
      "learning_rate": 1.42230252968508e-05,
      "loss": 0.2363,
      "step": 1488
    },
    {
      "epoch": 2.1119293078055965,
      "eval_info_retr_eval_dot_accuracy@1": 0.8943111846337652,
      "eval_info_retr_eval_dot_accuracy@10": 0.9664552890359343,
      "eval_info_retr_eval_dot_accuracy@3": 0.9374138406396471,
      "eval_info_retr_eval_dot_accuracy@5": 0.9490855619887878,
      "eval_info_retr_eval_dot_map@100": 0.9197752678474642,
      "eval_info_retr_eval_dot_mrr@10": 0.9185011954725225,
      "eval_info_retr_eval_dot_ndcg@10": 0.9300922809925127,
      "eval_info_retr_eval_dot_precision@1": 0.8943111846337652,
      "eval_info_retr_eval_dot_precision@10": 0.09664552890359342,
      "eval_info_retr_eval_dot_precision@3": 0.31247128021321563,
      "eval_info_retr_eval_dot_precision@5": 0.18981711239775756,
      "eval_info_retr_eval_dot_recall@1": 0.8943111846337652,
      "eval_info_retr_eval_dot_recall@10": 0.9664552890359343,
      "eval_info_retr_eval_dot_recall@3": 0.9374138406396471,
      "eval_info_retr_eval_dot_recall@5": 0.9490855619887878,
      "eval_loss": 0.36409991979599,
      "eval_para_mine_eval_average_precision": 0.5680857985845322,
      "eval_para_mine_eval_f1": 0.6845767174265878,
      "eval_para_mine_eval_precision": 0.7527188630602916,
      "eval_para_mine_eval_recall": 0.6277479414434964,
      "eval_para_mine_eval_threshold": 0.874737024307251,
      "eval_runtime": 46.8373,
      "eval_samples_per_second": 232.315,
      "eval_sequential_score": 0.9197752678474642,
      "eval_steps_per_second": 1.836,
      "step": 1488
    },
    {
      "epoch": 2.203240058910162,
      "grad_norm": 1.0034995079040527,
      "learning_rate": 1.2622612287041818e-05,
      "loss": 0.2336,
      "step": 1550
    },
    {
      "epoch": 2.203240058910162,
      "eval_info_retr_eval_dot_accuracy@1": 0.8936678614097969,
      "eval_info_retr_eval_dot_accuracy@10": 0.9655362558588365,
      "eval_info_retr_eval_dot_accuracy@3": 0.9360352908740005,
      "eval_info_retr_eval_dot_accuracy@5": 0.9495450785773366,
      "eval_info_retr_eval_dot_map@100": 0.9191474148366734,
      "eval_info_retr_eval_dot_mrr@10": 0.9178338388015818,
      "eval_info_retr_eval_dot_ndcg@10": 0.9293775519635007,
      "eval_info_retr_eval_dot_precision@1": 0.8936678614097969,
      "eval_info_retr_eval_dot_precision@10": 0.09655362558588364,
      "eval_info_retr_eval_dot_precision@3": 0.31201176362466687,
      "eval_info_retr_eval_dot_precision@5": 0.18990901571546734,
      "eval_info_retr_eval_dot_recall@1": 0.8936678614097969,
      "eval_info_retr_eval_dot_recall@10": 0.9655362558588365,
      "eval_info_retr_eval_dot_recall@3": 0.9360352908740005,
      "eval_info_retr_eval_dot_recall@5": 0.9495450785773366,
      "eval_loss": 0.3632822632789612,
      "eval_para_mine_eval_average_precision": 0.5695600017649123,
      "eval_para_mine_eval_f1": 0.6885810689948371,
      "eval_para_mine_eval_precision": 0.7525360184242944,
      "eval_para_mine_eval_recall": 0.6346451784835112,
      "eval_para_mine_eval_threshold": 0.8695259690284729,
      "eval_runtime": 46.9973,
      "eval_samples_per_second": 231.524,
      "eval_sequential_score": 0.9191474148366734,
      "eval_steps_per_second": 1.83,
      "step": 1550
    },
    {
      "epoch": 2.2945508100147274,
      "grad_norm": 1.5235002040863037,
      "learning_rate": 1.1022199277232835e-05,
      "loss": 0.2065,
      "step": 1612
    },
    {
      "epoch": 2.2945508100147274,
      "eval_info_retr_eval_dot_accuracy@1": 0.8948626045400239,
      "eval_info_retr_eval_dot_accuracy@10": 0.9658119658119658,
      "eval_info_retr_eval_dot_accuracy@3": 0.9364029041448396,
      "eval_info_retr_eval_dot_accuracy@5": 0.9495450785773366,
      "eval_info_retr_eval_dot_map@100": 0.9201749271580272,
      "eval_info_retr_eval_dot_mrr@10": 0.9188280722330898,
      "eval_info_retr_eval_dot_ndcg@10": 0.9302018390100595,
      "eval_info_retr_eval_dot_precision@1": 0.8948626045400239,
      "eval_info_retr_eval_dot_precision@10": 0.09658119658119659,
      "eval_info_retr_eval_dot_precision@3": 0.3121343013816132,
      "eval_info_retr_eval_dot_precision@5": 0.18990901571546734,
      "eval_info_retr_eval_dot_recall@1": 0.8948626045400239,
      "eval_info_retr_eval_dot_recall@10": 0.9658119658119658,
      "eval_info_retr_eval_dot_recall@3": 0.9364029041448396,
      "eval_info_retr_eval_dot_recall@5": 0.9495450785773366,
      "eval_loss": 0.36156603693962097,
      "eval_para_mine_eval_average_precision": 0.5665696229109317,
      "eval_para_mine_eval_f1": 0.6860915092192124,
      "eval_para_mine_eval_precision": 0.7585999354355094,
      "eval_para_mine_eval_recall": 0.6262347951380577,
      "eval_para_mine_eval_threshold": 0.8720309436321259,
      "eval_runtime": 47.7964,
      "eval_samples_per_second": 227.653,
      "eval_sequential_score": 0.9201749271580272,
      "eval_steps_per_second": 1.799,
      "step": 1612
    },
    {
      "epoch": 2.385861561119293,
      "grad_norm": 1.445999264717102,
      "learning_rate": 9.421786267423851e-06,
      "loss": 0.2083,
      "step": 1674
    },
    {
      "epoch": 2.385861561119293,
      "eval_info_retr_eval_dot_accuracy@1": 0.8960573476702509,
      "eval_info_retr_eval_dot_accuracy@10": 0.9659957724473853,
      "eval_info_retr_eval_dot_accuracy@3": 0.9373219373219374,
      "eval_info_retr_eval_dot_accuracy@5": 0.9503722084367245,
      "eval_info_retr_eval_dot_map@100": 0.92104627411852,
      "eval_info_retr_eval_dot_mrr@10": 0.9196911975585806,
      "eval_info_retr_eval_dot_ndcg@10": 0.9309142349609268,
      "eval_info_retr_eval_dot_precision@1": 0.8960573476702509,
      "eval_info_retr_eval_dot_precision@10": 0.09659957724473853,
      "eval_info_retr_eval_dot_precision@3": 0.3124406457739791,
      "eval_info_retr_eval_dot_precision@5": 0.19007444168734494,
      "eval_info_retr_eval_dot_recall@1": 0.8960573476702509,
      "eval_info_retr_eval_dot_recall@10": 0.9659957724473853,
      "eval_info_retr_eval_dot_recall@3": 0.9373219373219374,
      "eval_info_retr_eval_dot_recall@5": 0.9503722084367245,
      "eval_loss": 0.358325332403183,
      "eval_para_mine_eval_average_precision": 0.5714132731149775,
      "eval_para_mine_eval_f1": 0.6871263293961211,
      "eval_para_mine_eval_precision": 0.7587332430898214,
      "eval_para_mine_eval_recall": 0.6278698965188602,
      "eval_para_mine_eval_threshold": 0.8729398548603058,
      "eval_runtime": 47.2608,
      "eval_samples_per_second": 230.233,
      "eval_sequential_score": 0.92104627411852,
      "eval_steps_per_second": 1.82,
      "step": 1674
    }
  ],
  "logging_steps": 62,
  "max_steps": 2037,
  "num_input_tokens_seen": 0,
  "num_train_epochs": 3,
  "save_steps": 62,
  "stateful_callbacks": {
    "TrainerControl": {
      "args": {
        "should_epoch_stop": false,
        "should_evaluate": false,
        "should_log": false,
        "should_save": true,
        "should_training_stop": false
      },
      "attributes": {}
    }
  },
  "total_flos": 0.0,
  "train_batch_size": 64,
  "trial_name": null,
  "trial_params": null
}