Shadman-Rohan commited on
Commit
ff24bac
·
1 Parent(s): 5378162

Training in progress, epoch 1

Browse files
all_results.json CHANGED
@@ -38,10 +38,10 @@
38
  "eval_ne_word_err_precision": 0.9970827762246263,
39
  "eval_ne_word_err_recall": 0.9946647265672366,
40
  "eval_overall_accuracy": 0.9993957202777317,
41
- "eval_runtime": 11.3466,
42
  "eval_samples": 18388,
43
- "eval_samples_per_second": 1620.567,
44
- "eval_steps_per_second": 101.352,
45
  "eval_unc_insert_err_f1": 0.9961218836565098,
46
  "eval_unc_insert_err_number": 902,
47
  "eval_unc_insert_err_precision": 0.9955703211517165,
@@ -51,8 +51,8 @@
51
  "eval_weighted_avg_precision": 0.9936401344515604,
52
  "eval_weighted_avg_recall": 0.9931156910287495,
53
  "train_loss": 0.06519987745561462,
54
- "train_runtime": 1743.5904,
55
  "train_samples": 18388,
56
- "train_samples_per_second": 316.382,
57
- "train_steps_per_second": 9.893
58
  }
 
38
  "eval_ne_word_err_precision": 0.9970827762246263,
39
  "eval_ne_word_err_recall": 0.9946647265672366,
40
  "eval_overall_accuracy": 0.9993957202777317,
41
+ "eval_runtime": 11.4329,
42
  "eval_samples": 18388,
43
+ "eval_samples_per_second": 1608.342,
44
+ "eval_steps_per_second": 100.587,
45
  "eval_unc_insert_err_f1": 0.9961218836565098,
46
  "eval_unc_insert_err_number": 902,
47
  "eval_unc_insert_err_precision": 0.9955703211517165,
 
51
  "eval_weighted_avg_precision": 0.9936401344515604,
52
  "eval_weighted_avg_recall": 0.9931156910287495,
53
  "train_loss": 0.06519987745561462,
54
+ "train_runtime": 1743.8633,
55
  "train_samples": 18388,
56
+ "train_samples_per_second": 316.332,
57
+ "train_steps_per_second": 9.892
58
  }
eval_results.json CHANGED
@@ -38,10 +38,10 @@
38
  "eval_ne_word_err_precision": 0.9970827762246263,
39
  "eval_ne_word_err_recall": 0.9946647265672366,
40
  "eval_overall_accuracy": 0.9993957202777317,
41
- "eval_runtime": 11.3466,
42
  "eval_samples": 18388,
43
- "eval_samples_per_second": 1620.567,
44
- "eval_steps_per_second": 101.352,
45
  "eval_unc_insert_err_f1": 0.9961218836565098,
46
  "eval_unc_insert_err_number": 902,
47
  "eval_unc_insert_err_precision": 0.9955703211517165,
 
38
  "eval_ne_word_err_precision": 0.9970827762246263,
39
  "eval_ne_word_err_recall": 0.9946647265672366,
40
  "eval_overall_accuracy": 0.9993957202777317,
41
+ "eval_runtime": 11.4329,
42
  "eval_samples": 18388,
43
+ "eval_samples_per_second": 1608.342,
44
+ "eval_steps_per_second": 100.587,
45
  "eval_unc_insert_err_f1": 0.9961218836565098,
46
  "eval_unc_insert_err_number": 902,
47
  "eval_unc_insert_err_precision": 0.9955703211517165,
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb8de0288b5a6e76feea0bd3fc8fd584ac1e2b3cae7999f2b363d2d1f1869015
3
  size 440204333
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:782a74d01c2012b5d99332313c0794974e8965c7c8027eb0901f5118df32f7f3
3
  size 440204333
runs/Mar03_01-20-39_home-3090/events.out.tfevents.1677786630.home-3090.52004.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39373ce231698dc357cc544e011a293aa1868f277921b0565725b850385cdef0
3
+ size 2994
runs/Mar03_15-28-56_home-3090/1677835755.4833965/events.out.tfevents.1677835755.home-3090.22403.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6e69d61ff4a983ba335c65dc90e26811b6900344b603bb5126edff8dd4be54f
3
+ size 5523
runs/Mar03_15-28-56_home-3090/events.out.tfevents.1677835755.home-3090.22403.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7b8e1128585d66a929bdb76df7bdece7d52108c15b5b3897af64bde3d519505
3
+ size 7325
train_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "epoch": 30.0,
3
  "train_loss": 0.06519987745561462,
4
- "train_runtime": 1743.5904,
5
  "train_samples": 18388,
6
- "train_samples_per_second": 316.382,
7
- "train_steps_per_second": 9.893
8
  }
 
1
  {
2
  "epoch": 30.0,
3
  "train_loss": 0.06519987745561462,
4
+ "train_runtime": 1743.8633,
5
  "train_samples": 18388,
6
+ "train_samples_per_second": 316.332,
7
+ "train_steps_per_second": 9.892
8
  }
trainer_state.json CHANGED
@@ -53,9 +53,9 @@
53
  "eval_ne_word_err_precision": 0.6340406114533425,
54
  "eval_ne_word_err_recall": 0.33697101976476296,
55
  "eval_overall_accuracy": 0.9313016896134979,
56
- "eval_runtime": 11.4511,
57
- "eval_samples_per_second": 1605.79,
58
- "eval_steps_per_second": 100.427,
59
  "eval_unc_insert_err_f1": 0.0,
60
  "eval_unc_insert_err_number": 902,
61
  "eval_unc_insert_err_precision": 0.0,
@@ -112,9 +112,9 @@
112
  "eval_ne_word_err_precision": 0.7050460865489767,
113
  "eval_ne_word_err_recall": 0.5472292955013944,
114
  "eval_overall_accuracy": 0.9455378089528188,
115
- "eval_runtime": 12.2219,
116
- "eval_samples_per_second": 1504.512,
117
- "eval_steps_per_second": 94.093,
118
  "eval_unc_insert_err_f1": 0.0022148394241417496,
119
  "eval_unc_insert_err_number": 902,
120
  "eval_unc_insert_err_precision": 1.0,
@@ -171,9 +171,9 @@
171
  "eval_ne_word_err_precision": 0.7622462787550744,
172
  "eval_ne_word_err_recall": 0.6830362556080999,
173
  "eval_overall_accuracy": 0.9567288324367876,
174
- "eval_runtime": 11.5134,
175
- "eval_samples_per_second": 1597.097,
176
- "eval_steps_per_second": 99.884,
177
  "eval_unc_insert_err_f1": 0.3054662379421222,
178
  "eval_unc_insert_err_number": 902,
179
  "eval_unc_insert_err_precision": 0.5555555555555556,
@@ -230,9 +230,9 @@
230
  "eval_ne_word_err_precision": 0.8228239366963402,
231
  "eval_ne_word_err_recall": 0.8069601067054687,
232
  "eval_overall_accuracy": 0.9701177753027322,
233
- "eval_runtime": 11.6132,
234
- "eval_samples_per_second": 1583.375,
235
- "eval_steps_per_second": 99.026,
236
  "eval_unc_insert_err_f1": 0.37326813365933176,
237
  "eval_unc_insert_err_number": 902,
238
  "eval_unc_insert_err_precision": 0.7046153846153846,
@@ -289,9 +289,9 @@
289
  "eval_ne_word_err_precision": 0.887815750371471,
290
  "eval_ne_word_err_recall": 0.869407057111677,
291
  "eval_overall_accuracy": 0.9797270077489988,
292
- "eval_runtime": 11.582,
293
- "eval_samples_per_second": 1587.637,
294
- "eval_steps_per_second": 99.292,
295
  "eval_unc_insert_err_f1": 0.5340674466620785,
296
  "eval_unc_insert_err_number": 902,
297
  "eval_unc_insert_err_precision": 0.7041742286751361,
@@ -348,9 +348,9 @@
348
  "eval_ne_word_err_precision": 0.918532634587899,
349
  "eval_ne_word_err_recall": 0.935127925306172,
350
  "eval_overall_accuracy": 0.9874049148084078,
351
- "eval_runtime": 11.5539,
352
- "eval_samples_per_second": 1591.493,
353
- "eval_steps_per_second": 99.533,
354
  "eval_unc_insert_err_f1": 0.7559591373439274,
355
  "eval_unc_insert_err_number": 902,
356
  "eval_unc_insert_err_precision": 0.7744186046511627,
@@ -407,9 +407,9 @@
407
  "eval_ne_word_err_precision": 0.9517692680562287,
408
  "eval_ne_word_err_recall": 0.9523463077482721,
409
  "eval_overall_accuracy": 0.9913860518021754,
410
- "eval_runtime": 11.6281,
411
- "eval_samples_per_second": 1581.339,
412
- "eval_steps_per_second": 98.898,
413
  "eval_unc_insert_err_f1": 0.8407367280606717,
414
  "eval_unc_insert_err_number": 902,
415
  "eval_unc_insert_err_precision": 0.8220338983050848,
@@ -466,9 +466,9 @@
466
  "eval_ne_word_err_precision": 0.9697043435941112,
467
  "eval_ne_word_err_recall": 0.9664120286164666,
468
  "eval_overall_accuracy": 0.9938387165572644,
469
- "eval_runtime": 11.5399,
470
- "eval_samples_per_second": 1593.424,
471
- "eval_steps_per_second": 99.654,
472
  "eval_unc_insert_err_f1": 0.897196261682243,
473
  "eval_unc_insert_err_number": 902,
474
  "eval_unc_insert_err_precision": 0.8898582333696837,
@@ -525,9 +525,9 @@
525
  "eval_ne_word_err_precision": 0.9782503037667072,
526
  "eval_ne_word_err_recall": 0.9762337819813266,
527
  "eval_overall_accuracy": 0.9954619777719851,
528
- "eval_runtime": 11.5934,
529
- "eval_samples_per_second": 1586.069,
530
- "eval_steps_per_second": 99.194,
531
  "eval_unc_insert_err_f1": 0.934559221200649,
532
  "eval_unc_insert_err_number": 902,
533
  "eval_unc_insert_err_precision": 0.9123548046462513,
@@ -584,9 +584,9 @@
584
  "eval_ne_word_err_precision": 0.9809141745684415,
585
  "eval_ne_word_err_recall": 0.9784163938401843,
586
  "eval_overall_accuracy": 0.9963387758003744,
587
- "eval_runtime": 11.5919,
588
- "eval_samples_per_second": 1586.275,
589
- "eval_steps_per_second": 99.207,
590
  "eval_unc_insert_err_f1": 0.9537289058247141,
591
  "eval_unc_insert_err_number": 902,
592
  "eval_unc_insert_err_precision": 0.9368983957219251,
@@ -643,9 +643,9 @@
643
  "eval_ne_word_err_precision": 0.989462075726014,
644
  "eval_ne_word_err_recall": 0.9791439311264702,
645
  "eval_overall_accuracy": 0.9968541908576033,
646
- "eval_runtime": 11.5138,
647
- "eval_samples_per_second": 1597.044,
648
- "eval_steps_per_second": 99.88,
649
  "eval_unc_insert_err_f1": 0.9379310344827587,
650
  "eval_unc_insert_err_number": 902,
651
  "eval_unc_insert_err_precision": 0.8992878942014242,
@@ -702,9 +702,9 @@
702
  "eval_ne_word_err_precision": 0.9917153996101364,
703
  "eval_ne_word_err_recall": 0.9870255850612344,
704
  "eval_overall_accuracy": 0.9976184269769426,
705
- "eval_runtime": 11.5829,
706
- "eval_samples_per_second": 1587.51,
707
- "eval_steps_per_second": 99.284,
708
  "eval_unc_insert_err_f1": 0.9763866007688083,
709
  "eval_unc_insert_err_number": 902,
710
  "eval_unc_insert_err_precision": 0.9673558215451578,
@@ -761,9 +761,9 @@
761
  "eval_ne_word_err_precision": 0.991969826012897,
762
  "eval_ne_word_err_recall": 0.9886019158481872,
763
  "eval_overall_accuracy": 0.9980627503021399,
764
- "eval_runtime": 11.6079,
765
- "eval_samples_per_second": 1584.097,
766
- "eval_steps_per_second": 99.071,
767
  "eval_unc_insert_err_f1": 0.9796367638965328,
768
  "eval_unc_insert_err_number": 902,
769
  "eval_unc_insert_err_precision": 0.9726775956284153,
@@ -820,9 +820,9 @@
820
  "eval_ne_word_err_precision": 0.9943957115009746,
821
  "eval_ne_word_err_recall": 0.9896932217776161,
822
  "eval_overall_accuracy": 0.9983589658522714,
823
- "eval_runtime": 11.6047,
824
- "eval_samples_per_second": 1584.53,
825
- "eval_steps_per_second": 99.098,
826
  "eval_unc_insert_err_f1": 0.9839513004980631,
827
  "eval_unc_insert_err_number": 902,
828
  "eval_unc_insert_err_precision": 0.9823204419889503,
@@ -879,9 +879,9 @@
879
  "eval_ne_word_err_precision": 0.9951290793960058,
880
  "eval_ne_word_err_recall": 0.9909057839214259,
881
  "eval_overall_accuracy": 0.9986137112253844,
882
- "eval_runtime": 11.5772,
883
- "eval_samples_per_second": 1588.3,
884
- "eval_steps_per_second": 99.334,
885
  "eval_unc_insert_err_f1": 0.991111111111111,
886
  "eval_unc_insert_err_number": 902,
887
  "eval_unc_insert_err_precision": 0.9933184855233853,
@@ -938,9 +938,9 @@
938
  "eval_ne_word_err_precision": 0.9948998178506375,
939
  "eval_ne_word_err_recall": 0.9934521644234267,
940
  "eval_overall_accuracy": 0.998862532287495,
941
- "eval_runtime": 12.719,
942
- "eval_samples_per_second": 1445.712,
943
- "eval_steps_per_second": 90.416,
944
  "eval_unc_insert_err_f1": 0.9900662251655629,
945
  "eval_unc_insert_err_number": 902,
946
  "eval_unc_insert_err_precision": 0.9857142857142858,
@@ -997,9 +997,9 @@
997
  "eval_ne_word_err_precision": 0.9945454545454545,
998
  "eval_ne_word_err_recall": 0.9949072389959985,
999
  "eval_overall_accuracy": 0.9990106400625607,
1000
- "eval_runtime": 11.5897,
1001
- "eval_samples_per_second": 1586.578,
1002
- "eval_steps_per_second": 99.226,
1003
  "eval_unc_insert_err_f1": 0.9927897947864671,
1004
  "eval_unc_insert_err_number": 902,
1005
  "eval_unc_insert_err_precision": 0.9933407325194229,
@@ -1056,9 +1056,9 @@
1056
  "eval_ne_word_err_precision": 0.9949097079141922,
1057
  "eval_ne_word_err_recall": 0.9953922638535225,
1058
  "eval_overall_accuracy": 0.9991054290386028,
1059
- "eval_runtime": 11.5456,
1060
- "eval_samples_per_second": 1592.643,
1061
- "eval_steps_per_second": 99.605,
1062
  "eval_unc_insert_err_f1": 0.9927897947864671,
1063
  "eval_unc_insert_err_number": 902,
1064
  "eval_unc_insert_err_precision": 0.9933407325194229,
@@ -1115,9 +1115,9 @@
1115
  "eval_ne_word_err_precision": 0.9956300072833212,
1116
  "eval_ne_word_err_recall": 0.9945434703528556,
1117
  "eval_overall_accuracy": 0.9992179909476527,
1118
- "eval_runtime": 11.6822,
1119
- "eval_samples_per_second": 1574.022,
1120
- "eval_steps_per_second": 98.441,
1121
  "eval_unc_insert_err_f1": 0.9933701657458565,
1122
  "eval_unc_insert_err_number": 902,
1123
  "eval_unc_insert_err_precision": 0.9900881057268722,
@@ -1174,9 +1174,9 @@
1174
  "eval_ne_word_err_precision": 0.9959941733430444,
1175
  "eval_ne_word_err_recall": 0.9949072389959985,
1176
  "eval_overall_accuracy": 0.9992594611246712,
1177
- "eval_runtime": 11.3322,
1178
- "eval_samples_per_second": 1622.634,
1179
- "eval_steps_per_second": 101.481,
1180
  "eval_unc_insert_err_f1": 0.9944444444444444,
1181
  "eval_unc_insert_err_number": 902,
1182
  "eval_unc_insert_err_precision": 0.9966592427616926,
@@ -1233,9 +1233,9 @@
1233
  "eval_ne_word_err_precision": 0.9953922638535225,
1234
  "eval_ne_word_err_recall": 0.9953922638535225,
1235
  "eval_overall_accuracy": 0.999295006990687,
1236
- "eval_runtime": 11.5781,
1237
- "eval_samples_per_second": 1588.177,
1238
- "eval_steps_per_second": 99.326,
1239
  "eval_unc_insert_err_f1": 0.9944506104328523,
1240
  "eval_unc_insert_err_number": 902,
1241
  "eval_unc_insert_err_precision": 0.9955555555555555,
@@ -1292,9 +1292,9 @@
1292
  "eval_ne_word_err_precision": 0.996719319562576,
1293
  "eval_ne_word_err_recall": 0.9946647265672366,
1294
  "eval_overall_accuracy": 0.9993127799236948,
1295
- "eval_runtime": 11.7025,
1296
- "eval_samples_per_second": 1571.285,
1297
- "eval_steps_per_second": 98.269,
1298
  "eval_unc_insert_err_f1": 0.9939125622578859,
1299
  "eval_unc_insert_err_number": 902,
1300
  "eval_unc_insert_err_precision": 0.9922651933701657,
@@ -1351,9 +1351,9 @@
1351
  "eval_ne_word_err_precision": 0.9975666139433021,
1352
  "eval_ne_word_err_recall": 0.9941797017097126,
1353
  "eval_overall_accuracy": 0.9993601744117159,
1354
- "eval_runtime": 11.5685,
1355
- "eval_samples_per_second": 1589.49,
1356
- "eval_steps_per_second": 99.408,
1357
  "eval_unc_insert_err_f1": 0.9950193691200886,
1358
  "eval_unc_insert_err_number": 902,
1359
  "eval_unc_insert_err_precision": 0.9933701657458563,
@@ -1410,9 +1410,9 @@
1410
  "eval_ne_word_err_precision": 0.9959966031784544,
1411
  "eval_ne_word_err_recall": 0.9955135200679035,
1412
  "eval_overall_accuracy": 0.9993720230337212,
1413
- "eval_runtime": 11.5823,
1414
- "eval_samples_per_second": 1587.59,
1415
- "eval_steps_per_second": 99.289,
1416
  "eval_unc_insert_err_f1": 0.9950138504155125,
1417
  "eval_unc_insert_err_number": 902,
1418
  "eval_unc_insert_err_precision": 0.9944629014396457,
@@ -1469,9 +1469,9 @@
1469
  "eval_ne_word_err_precision": 0.9968412100595311,
1470
  "eval_ne_word_err_recall": 0.9949072389959985,
1471
  "eval_overall_accuracy": 0.9993720230337212,
1472
- "eval_runtime": 11.6443,
1473
- "eval_samples_per_second": 1579.141,
1474
- "eval_steps_per_second": 98.761,
1475
  "eval_unc_insert_err_f1": 0.9955654101995566,
1476
  "eval_unc_insert_err_number": 902,
1477
  "eval_unc_insert_err_precision": 0.9955654101995566,
@@ -1528,9 +1528,9 @@
1528
  "eval_ne_word_err_precision": 0.9957565470417071,
1529
  "eval_ne_word_err_recall": 0.9958772887110464,
1530
  "eval_overall_accuracy": 0.9993779473447238,
1531
- "eval_runtime": 11.6017,
1532
- "eval_samples_per_second": 1584.944,
1533
- "eval_steps_per_second": 99.124,
1534
  "eval_unc_insert_err_f1": 0.995575221238938,
1535
  "eval_unc_insert_err_number": 902,
1536
  "eval_unc_insert_err_precision": 0.9933774834437086,
@@ -1587,9 +1587,9 @@
1587
  "eval_ne_word_err_precision": 0.9964784456587735,
1588
  "eval_ne_word_err_recall": 0.9950284952103795,
1589
  "eval_overall_accuracy": 0.9993720230337212,
1590
- "eval_runtime": 11.6586,
1591
- "eval_samples_per_second": 1577.202,
1592
- "eval_steps_per_second": 98.639,
1593
  "eval_unc_insert_err_f1": 0.9955703211517165,
1594
  "eval_unc_insert_err_number": 902,
1595
  "eval_unc_insert_err_precision": 0.9944690265486725,
@@ -1646,9 +1646,9 @@
1646
  "eval_ne_word_err_precision": 0.9963578972927036,
1647
  "eval_ne_word_err_recall": 0.9951497514247605,
1648
  "eval_overall_accuracy": 0.9993838716557264,
1649
- "eval_runtime": 11.7106,
1650
- "eval_samples_per_second": 1570.205,
1651
- "eval_steps_per_second": 98.202,
1652
  "eval_unc_insert_err_f1": 0.9955703211517165,
1653
  "eval_unc_insert_err_number": 902,
1654
  "eval_unc_insert_err_precision": 0.9944690265486725,
@@ -1705,9 +1705,9 @@
1705
  "eval_ne_word_err_precision": 0.9962374074523607,
1706
  "eval_ne_word_err_recall": 0.9952710076391416,
1707
  "eval_overall_accuracy": 0.9993957202777317,
1708
- "eval_runtime": 11.6052,
1709
- "eval_samples_per_second": 1584.462,
1710
- "eval_steps_per_second": 99.094,
1711
  "eval_unc_insert_err_f1": 0.9961175818080976,
1712
  "eval_unc_insert_err_number": 902,
1713
  "eval_unc_insert_err_precision": 0.9966703662597114,
@@ -1764,9 +1764,9 @@
1764
  "eval_ne_word_err_precision": 0.9970827762246263,
1765
  "eval_ne_word_err_recall": 0.9946647265672366,
1766
  "eval_overall_accuracy": 0.9993957202777317,
1767
- "eval_runtime": 11.623,
1768
- "eval_samples_per_second": 1582.033,
1769
- "eval_steps_per_second": 98.942,
1770
  "eval_unc_insert_err_f1": 0.9961218836565098,
1771
  "eval_unc_insert_err_number": 902,
1772
  "eval_unc_insert_err_precision": 0.9955703211517165,
@@ -1782,9 +1782,9 @@
1782
  "step": 17250,
1783
  "total_flos": 7911429330344064.0,
1784
  "train_loss": 0.06519987745561462,
1785
- "train_runtime": 1743.5904,
1786
- "train_samples_per_second": 316.382,
1787
- "train_steps_per_second": 9.893
1788
  }
1789
  ],
1790
  "max_steps": 17250,
 
53
  "eval_ne_word_err_precision": 0.6340406114533425,
54
  "eval_ne_word_err_recall": 0.33697101976476296,
55
  "eval_overall_accuracy": 0.9313016896134979,
56
+ "eval_runtime": 11.367,
57
+ "eval_samples_per_second": 1617.671,
58
+ "eval_steps_per_second": 101.17,
59
  "eval_unc_insert_err_f1": 0.0,
60
  "eval_unc_insert_err_number": 902,
61
  "eval_unc_insert_err_precision": 0.0,
 
112
  "eval_ne_word_err_precision": 0.7050460865489767,
113
  "eval_ne_word_err_recall": 0.5472292955013944,
114
  "eval_overall_accuracy": 0.9455378089528188,
115
+ "eval_runtime": 11.0987,
116
+ "eval_samples_per_second": 1656.776,
117
+ "eval_steps_per_second": 103.616,
118
  "eval_unc_insert_err_f1": 0.0022148394241417496,
119
  "eval_unc_insert_err_number": 902,
120
  "eval_unc_insert_err_precision": 1.0,
 
171
  "eval_ne_word_err_precision": 0.7622462787550744,
172
  "eval_ne_word_err_recall": 0.6830362556080999,
173
  "eval_overall_accuracy": 0.9567288324367876,
174
+ "eval_runtime": 11.1567,
175
+ "eval_samples_per_second": 1648.155,
176
+ "eval_steps_per_second": 103.077,
177
  "eval_unc_insert_err_f1": 0.3054662379421222,
178
  "eval_unc_insert_err_number": 902,
179
  "eval_unc_insert_err_precision": 0.5555555555555556,
 
230
  "eval_ne_word_err_precision": 0.8228239366963402,
231
  "eval_ne_word_err_recall": 0.8069601067054687,
232
  "eval_overall_accuracy": 0.9701177753027322,
233
+ "eval_runtime": 11.5543,
234
+ "eval_samples_per_second": 1591.447,
235
+ "eval_steps_per_second": 99.53,
236
  "eval_unc_insert_err_f1": 0.37326813365933176,
237
  "eval_unc_insert_err_number": 902,
238
  "eval_unc_insert_err_precision": 0.7046153846153846,
 
289
  "eval_ne_word_err_precision": 0.887815750371471,
290
  "eval_ne_word_err_recall": 0.869407057111677,
291
  "eval_overall_accuracy": 0.9797270077489988,
292
+ "eval_runtime": 11.5559,
293
+ "eval_samples_per_second": 1591.224,
294
+ "eval_steps_per_second": 99.516,
295
  "eval_unc_insert_err_f1": 0.5340674466620785,
296
  "eval_unc_insert_err_number": 902,
297
  "eval_unc_insert_err_precision": 0.7041742286751361,
 
348
  "eval_ne_word_err_precision": 0.918532634587899,
349
  "eval_ne_word_err_recall": 0.935127925306172,
350
  "eval_overall_accuracy": 0.9874049148084078,
351
+ "eval_runtime": 11.4906,
352
+ "eval_samples_per_second": 1600.268,
353
+ "eval_steps_per_second": 100.082,
354
  "eval_unc_insert_err_f1": 0.7559591373439274,
355
  "eval_unc_insert_err_number": 902,
356
  "eval_unc_insert_err_precision": 0.7744186046511627,
 
407
  "eval_ne_word_err_precision": 0.9517692680562287,
408
  "eval_ne_word_err_recall": 0.9523463077482721,
409
  "eval_overall_accuracy": 0.9913860518021754,
410
+ "eval_runtime": 11.5809,
411
+ "eval_samples_per_second": 1587.783,
412
+ "eval_steps_per_second": 99.301,
413
  "eval_unc_insert_err_f1": 0.8407367280606717,
414
  "eval_unc_insert_err_number": 902,
415
  "eval_unc_insert_err_precision": 0.8220338983050848,
 
466
  "eval_ne_word_err_precision": 0.9697043435941112,
467
  "eval_ne_word_err_recall": 0.9664120286164666,
468
  "eval_overall_accuracy": 0.9938387165572644,
469
+ "eval_runtime": 11.5948,
470
+ "eval_samples_per_second": 1585.884,
471
+ "eval_steps_per_second": 99.182,
472
  "eval_unc_insert_err_f1": 0.897196261682243,
473
  "eval_unc_insert_err_number": 902,
474
  "eval_unc_insert_err_precision": 0.8898582333696837,
 
525
  "eval_ne_word_err_precision": 0.9782503037667072,
526
  "eval_ne_word_err_recall": 0.9762337819813266,
527
  "eval_overall_accuracy": 0.9954619777719851,
528
+ "eval_runtime": 11.4901,
529
+ "eval_samples_per_second": 1600.333,
530
+ "eval_steps_per_second": 100.086,
531
  "eval_unc_insert_err_f1": 0.934559221200649,
532
  "eval_unc_insert_err_number": 902,
533
  "eval_unc_insert_err_precision": 0.9123548046462513,
 
584
  "eval_ne_word_err_precision": 0.9809141745684415,
585
  "eval_ne_word_err_recall": 0.9784163938401843,
586
  "eval_overall_accuracy": 0.9963387758003744,
587
+ "eval_runtime": 11.5603,
588
+ "eval_samples_per_second": 1590.617,
589
+ "eval_steps_per_second": 99.478,
590
  "eval_unc_insert_err_f1": 0.9537289058247141,
591
  "eval_unc_insert_err_number": 902,
592
  "eval_unc_insert_err_precision": 0.9368983957219251,
 
643
  "eval_ne_word_err_precision": 0.989462075726014,
644
  "eval_ne_word_err_recall": 0.9791439311264702,
645
  "eval_overall_accuracy": 0.9968541908576033,
646
+ "eval_runtime": 11.4621,
647
+ "eval_samples_per_second": 1604.24,
648
+ "eval_steps_per_second": 100.33,
649
  "eval_unc_insert_err_f1": 0.9379310344827587,
650
  "eval_unc_insert_err_number": 902,
651
  "eval_unc_insert_err_precision": 0.8992878942014242,
 
702
  "eval_ne_word_err_precision": 0.9917153996101364,
703
  "eval_ne_word_err_recall": 0.9870255850612344,
704
  "eval_overall_accuracy": 0.9976184269769426,
705
+ "eval_runtime": 11.7351,
706
+ "eval_samples_per_second": 1566.929,
707
+ "eval_steps_per_second": 97.997,
708
  "eval_unc_insert_err_f1": 0.9763866007688083,
709
  "eval_unc_insert_err_number": 902,
710
  "eval_unc_insert_err_precision": 0.9673558215451578,
 
761
  "eval_ne_word_err_precision": 0.991969826012897,
762
  "eval_ne_word_err_recall": 0.9886019158481872,
763
  "eval_overall_accuracy": 0.9980627503021399,
764
+ "eval_runtime": 11.5718,
765
+ "eval_samples_per_second": 1589.041,
766
+ "eval_steps_per_second": 99.38,
767
  "eval_unc_insert_err_f1": 0.9796367638965328,
768
  "eval_unc_insert_err_number": 902,
769
  "eval_unc_insert_err_precision": 0.9726775956284153,
 
820
  "eval_ne_word_err_precision": 0.9943957115009746,
821
  "eval_ne_word_err_recall": 0.9896932217776161,
822
  "eval_overall_accuracy": 0.9983589658522714,
823
+ "eval_runtime": 11.4901,
824
+ "eval_samples_per_second": 1600.34,
825
+ "eval_steps_per_second": 100.087,
826
  "eval_unc_insert_err_f1": 0.9839513004980631,
827
  "eval_unc_insert_err_number": 902,
828
  "eval_unc_insert_err_precision": 0.9823204419889503,
 
879
  "eval_ne_word_err_precision": 0.9951290793960058,
880
  "eval_ne_word_err_recall": 0.9909057839214259,
881
  "eval_overall_accuracy": 0.9986137112253844,
882
+ "eval_runtime": 11.4842,
883
+ "eval_samples_per_second": 1601.155,
884
+ "eval_steps_per_second": 100.137,
885
  "eval_unc_insert_err_f1": 0.991111111111111,
886
  "eval_unc_insert_err_number": 902,
887
  "eval_unc_insert_err_precision": 0.9933184855233853,
 
938
  "eval_ne_word_err_precision": 0.9948998178506375,
939
  "eval_ne_word_err_recall": 0.9934521644234267,
940
  "eval_overall_accuracy": 0.998862532287495,
941
+ "eval_runtime": 11.5461,
942
+ "eval_samples_per_second": 1592.57,
943
+ "eval_steps_per_second": 99.601,
944
  "eval_unc_insert_err_f1": 0.9900662251655629,
945
  "eval_unc_insert_err_number": 902,
946
  "eval_unc_insert_err_precision": 0.9857142857142858,
 
997
  "eval_ne_word_err_precision": 0.9945454545454545,
998
  "eval_ne_word_err_recall": 0.9949072389959985,
999
  "eval_overall_accuracy": 0.9990106400625607,
1000
+ "eval_runtime": 11.5275,
1001
+ "eval_samples_per_second": 1595.144,
1002
+ "eval_steps_per_second": 99.762,
1003
  "eval_unc_insert_err_f1": 0.9927897947864671,
1004
  "eval_unc_insert_err_number": 902,
1005
  "eval_unc_insert_err_precision": 0.9933407325194229,
 
1056
  "eval_ne_word_err_precision": 0.9949097079141922,
1057
  "eval_ne_word_err_recall": 0.9953922638535225,
1058
  "eval_overall_accuracy": 0.9991054290386028,
1059
+ "eval_runtime": 11.4848,
1060
+ "eval_samples_per_second": 1601.066,
1061
+ "eval_steps_per_second": 100.132,
1062
  "eval_unc_insert_err_f1": 0.9927897947864671,
1063
  "eval_unc_insert_err_number": 902,
1064
  "eval_unc_insert_err_precision": 0.9933407325194229,
 
1115
  "eval_ne_word_err_precision": 0.9956300072833212,
1116
  "eval_ne_word_err_recall": 0.9945434703528556,
1117
  "eval_overall_accuracy": 0.9992179909476527,
1118
+ "eval_runtime": 11.5451,
1119
+ "eval_samples_per_second": 1592.714,
1120
+ "eval_steps_per_second": 99.61,
1121
  "eval_unc_insert_err_f1": 0.9933701657458565,
1122
  "eval_unc_insert_err_number": 902,
1123
  "eval_unc_insert_err_precision": 0.9900881057268722,
 
1174
  "eval_ne_word_err_precision": 0.9959941733430444,
1175
  "eval_ne_word_err_recall": 0.9949072389959985,
1176
  "eval_overall_accuracy": 0.9992594611246712,
1177
+ "eval_runtime": 11.5037,
1178
+ "eval_samples_per_second": 1598.447,
1179
+ "eval_steps_per_second": 99.968,
1180
  "eval_unc_insert_err_f1": 0.9944444444444444,
1181
  "eval_unc_insert_err_number": 902,
1182
  "eval_unc_insert_err_precision": 0.9966592427616926,
 
1233
  "eval_ne_word_err_precision": 0.9953922638535225,
1234
  "eval_ne_word_err_recall": 0.9953922638535225,
1235
  "eval_overall_accuracy": 0.999295006990687,
1236
+ "eval_runtime": 11.4631,
1237
+ "eval_samples_per_second": 1604.101,
1238
+ "eval_steps_per_second": 100.322,
1239
  "eval_unc_insert_err_f1": 0.9944506104328523,
1240
  "eval_unc_insert_err_number": 902,
1241
  "eval_unc_insert_err_precision": 0.9955555555555555,
 
1292
  "eval_ne_word_err_precision": 0.996719319562576,
1293
  "eval_ne_word_err_recall": 0.9946647265672366,
1294
  "eval_overall_accuracy": 0.9993127799236948,
1295
+ "eval_runtime": 11.5654,
1296
+ "eval_samples_per_second": 1589.911,
1297
+ "eval_steps_per_second": 99.434,
1298
  "eval_unc_insert_err_f1": 0.9939125622578859,
1299
  "eval_unc_insert_err_number": 902,
1300
  "eval_unc_insert_err_precision": 0.9922651933701657,
 
1351
  "eval_ne_word_err_precision": 0.9975666139433021,
1352
  "eval_ne_word_err_recall": 0.9941797017097126,
1353
  "eval_overall_accuracy": 0.9993601744117159,
1354
+ "eval_runtime": 11.5142,
1355
+ "eval_samples_per_second": 1596.978,
1356
+ "eval_steps_per_second": 99.876,
1357
  "eval_unc_insert_err_f1": 0.9950193691200886,
1358
  "eval_unc_insert_err_number": 902,
1359
  "eval_unc_insert_err_precision": 0.9933701657458563,
 
1410
  "eval_ne_word_err_precision": 0.9959966031784544,
1411
  "eval_ne_word_err_recall": 0.9955135200679035,
1412
  "eval_overall_accuracy": 0.9993720230337212,
1413
+ "eval_runtime": 11.4924,
1414
+ "eval_samples_per_second": 1600.014,
1415
+ "eval_steps_per_second": 100.066,
1416
  "eval_unc_insert_err_f1": 0.9950138504155125,
1417
  "eval_unc_insert_err_number": 902,
1418
  "eval_unc_insert_err_precision": 0.9944629014396457,
 
1469
  "eval_ne_word_err_precision": 0.9968412100595311,
1470
  "eval_ne_word_err_recall": 0.9949072389959985,
1471
  "eval_overall_accuracy": 0.9993720230337212,
1472
+ "eval_runtime": 11.6279,
1473
+ "eval_samples_per_second": 1581.368,
1474
+ "eval_steps_per_second": 98.9,
1475
  "eval_unc_insert_err_f1": 0.9955654101995566,
1476
  "eval_unc_insert_err_number": 902,
1477
  "eval_unc_insert_err_precision": 0.9955654101995566,
 
1528
  "eval_ne_word_err_precision": 0.9957565470417071,
1529
  "eval_ne_word_err_recall": 0.9958772887110464,
1530
  "eval_overall_accuracy": 0.9993779473447238,
1531
+ "eval_runtime": 11.5517,
1532
+ "eval_samples_per_second": 1591.803,
1533
+ "eval_steps_per_second": 99.553,
1534
  "eval_unc_insert_err_f1": 0.995575221238938,
1535
  "eval_unc_insert_err_number": 902,
1536
  "eval_unc_insert_err_precision": 0.9933774834437086,
 
1587
  "eval_ne_word_err_precision": 0.9964784456587735,
1588
  "eval_ne_word_err_recall": 0.9950284952103795,
1589
  "eval_overall_accuracy": 0.9993720230337212,
1590
+ "eval_runtime": 11.5195,
1591
+ "eval_samples_per_second": 1596.249,
1592
+ "eval_steps_per_second": 99.831,
1593
  "eval_unc_insert_err_f1": 0.9955703211517165,
1594
  "eval_unc_insert_err_number": 902,
1595
  "eval_unc_insert_err_precision": 0.9944690265486725,
 
1646
  "eval_ne_word_err_precision": 0.9963578972927036,
1647
  "eval_ne_word_err_recall": 0.9951497514247605,
1648
  "eval_overall_accuracy": 0.9993838716557264,
1649
+ "eval_runtime": 11.5765,
1650
+ "eval_samples_per_second": 1588.392,
1651
+ "eval_steps_per_second": 99.339,
1652
  "eval_unc_insert_err_f1": 0.9955703211517165,
1653
  "eval_unc_insert_err_number": 902,
1654
  "eval_unc_insert_err_precision": 0.9944690265486725,
 
1705
  "eval_ne_word_err_precision": 0.9962374074523607,
1706
  "eval_ne_word_err_recall": 0.9952710076391416,
1707
  "eval_overall_accuracy": 0.9993957202777317,
1708
+ "eval_runtime": 11.5017,
1709
+ "eval_samples_per_second": 1598.724,
1710
+ "eval_steps_per_second": 99.985,
1711
  "eval_unc_insert_err_f1": 0.9961175818080976,
1712
  "eval_unc_insert_err_number": 902,
1713
  "eval_unc_insert_err_precision": 0.9966703662597114,
 
1764
  "eval_ne_word_err_precision": 0.9970827762246263,
1765
  "eval_ne_word_err_recall": 0.9946647265672366,
1766
  "eval_overall_accuracy": 0.9993957202777317,
1767
+ "eval_runtime": 11.5014,
1768
+ "eval_samples_per_second": 1598.761,
1769
+ "eval_steps_per_second": 99.988,
1770
  "eval_unc_insert_err_f1": 0.9961218836565098,
1771
  "eval_unc_insert_err_number": 902,
1772
  "eval_unc_insert_err_precision": 0.9955703211517165,
 
1782
  "step": 17250,
1783
  "total_flos": 7911429330344064.0,
1784
  "train_loss": 0.06519987745561462,
1785
+ "train_runtime": 1743.8633,
1786
+ "train_samples_per_second": 316.332,
1787
+ "train_steps_per_second": 9.892
1788
  }
1789
  ],
1790
  "max_steps": 17250,
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b4c6b5e11b5bd25aac69af9ca386e301fbfbec9996b7dd5cb1ba740476d0951a
3
  size 3387
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:735e977a5aabe6e9dacf785770cbcf801ab51c2533de47ea8a4cedd007b5807f
3
  size 3387