Commit
·
ff24bac
1
Parent(s):
5378162
Training in progress, epoch 1
Browse files- all_results.json +6 -6
- eval_results.json +3 -3
- pytorch_model.bin +1 -1
- runs/Mar03_01-20-39_home-3090/events.out.tfevents.1677786630.home-3090.52004.2 +3 -0
- runs/Mar03_15-28-56_home-3090/1677835755.4833965/events.out.tfevents.1677835755.home-3090.22403.1 +3 -0
- runs/Mar03_15-28-56_home-3090/events.out.tfevents.1677835755.home-3090.22403.0 +3 -0
- train_results.json +3 -3
- trainer_state.json +93 -93
- training_args.bin +1 -1
all_results.json
CHANGED
@@ -38,10 +38,10 @@
|
|
38 |
"eval_ne_word_err_precision": 0.9970827762246263,
|
39 |
"eval_ne_word_err_recall": 0.9946647265672366,
|
40 |
"eval_overall_accuracy": 0.9993957202777317,
|
41 |
-
"eval_runtime": 11.
|
42 |
"eval_samples": 18388,
|
43 |
-
"eval_samples_per_second":
|
44 |
-
"eval_steps_per_second":
|
45 |
"eval_unc_insert_err_f1": 0.9961218836565098,
|
46 |
"eval_unc_insert_err_number": 902,
|
47 |
"eval_unc_insert_err_precision": 0.9955703211517165,
|
@@ -51,8 +51,8 @@
|
|
51 |
"eval_weighted_avg_precision": 0.9936401344515604,
|
52 |
"eval_weighted_avg_recall": 0.9931156910287495,
|
53 |
"train_loss": 0.06519987745561462,
|
54 |
-
"train_runtime": 1743.
|
55 |
"train_samples": 18388,
|
56 |
-
"train_samples_per_second": 316.
|
57 |
-
"train_steps_per_second": 9.
|
58 |
}
|
|
|
38 |
"eval_ne_word_err_precision": 0.9970827762246263,
|
39 |
"eval_ne_word_err_recall": 0.9946647265672366,
|
40 |
"eval_overall_accuracy": 0.9993957202777317,
|
41 |
+
"eval_runtime": 11.4329,
|
42 |
"eval_samples": 18388,
|
43 |
+
"eval_samples_per_second": 1608.342,
|
44 |
+
"eval_steps_per_second": 100.587,
|
45 |
"eval_unc_insert_err_f1": 0.9961218836565098,
|
46 |
"eval_unc_insert_err_number": 902,
|
47 |
"eval_unc_insert_err_precision": 0.9955703211517165,
|
|
|
51 |
"eval_weighted_avg_precision": 0.9936401344515604,
|
52 |
"eval_weighted_avg_recall": 0.9931156910287495,
|
53 |
"train_loss": 0.06519987745561462,
|
54 |
+
"train_runtime": 1743.8633,
|
55 |
"train_samples": 18388,
|
56 |
+
"train_samples_per_second": 316.332,
|
57 |
+
"train_steps_per_second": 9.892
|
58 |
}
|
eval_results.json
CHANGED
@@ -38,10 +38,10 @@
|
|
38 |
"eval_ne_word_err_precision": 0.9970827762246263,
|
39 |
"eval_ne_word_err_recall": 0.9946647265672366,
|
40 |
"eval_overall_accuracy": 0.9993957202777317,
|
41 |
-
"eval_runtime": 11.
|
42 |
"eval_samples": 18388,
|
43 |
-
"eval_samples_per_second":
|
44 |
-
"eval_steps_per_second":
|
45 |
"eval_unc_insert_err_f1": 0.9961218836565098,
|
46 |
"eval_unc_insert_err_number": 902,
|
47 |
"eval_unc_insert_err_precision": 0.9955703211517165,
|
|
|
38 |
"eval_ne_word_err_precision": 0.9970827762246263,
|
39 |
"eval_ne_word_err_recall": 0.9946647265672366,
|
40 |
"eval_overall_accuracy": 0.9993957202777317,
|
41 |
+
"eval_runtime": 11.4329,
|
42 |
"eval_samples": 18388,
|
43 |
+
"eval_samples_per_second": 1608.342,
|
44 |
+
"eval_steps_per_second": 100.587,
|
45 |
"eval_unc_insert_err_f1": 0.9961218836565098,
|
46 |
"eval_unc_insert_err_number": 902,
|
47 |
"eval_unc_insert_err_precision": 0.9955703211517165,
|
pytorch_model.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 440204333
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:782a74d01c2012b5d99332313c0794974e8965c7c8027eb0901f5118df32f7f3
|
3 |
size 440204333
|
runs/Mar03_01-20-39_home-3090/events.out.tfevents.1677786630.home-3090.52004.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39373ce231698dc357cc544e011a293aa1868f277921b0565725b850385cdef0
|
3 |
+
size 2994
|
runs/Mar03_15-28-56_home-3090/1677835755.4833965/events.out.tfevents.1677835755.home-3090.22403.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6e69d61ff4a983ba335c65dc90e26811b6900344b603bb5126edff8dd4be54f
|
3 |
+
size 5523
|
runs/Mar03_15-28-56_home-3090/events.out.tfevents.1677835755.home-3090.22403.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7b8e1128585d66a929bdb76df7bdece7d52108c15b5b3897af64bde3d519505
|
3 |
+
size 7325
|
train_results.json
CHANGED
@@ -1,8 +1,8 @@
|
|
1 |
{
|
2 |
"epoch": 30.0,
|
3 |
"train_loss": 0.06519987745561462,
|
4 |
-
"train_runtime": 1743.
|
5 |
"train_samples": 18388,
|
6 |
-
"train_samples_per_second": 316.
|
7 |
-
"train_steps_per_second": 9.
|
8 |
}
|
|
|
1 |
{
|
2 |
"epoch": 30.0,
|
3 |
"train_loss": 0.06519987745561462,
|
4 |
+
"train_runtime": 1743.8633,
|
5 |
"train_samples": 18388,
|
6 |
+
"train_samples_per_second": 316.332,
|
7 |
+
"train_steps_per_second": 9.892
|
8 |
}
|
trainer_state.json
CHANGED
@@ -53,9 +53,9 @@
|
|
53 |
"eval_ne_word_err_precision": 0.6340406114533425,
|
54 |
"eval_ne_word_err_recall": 0.33697101976476296,
|
55 |
"eval_overall_accuracy": 0.9313016896134979,
|
56 |
-
"eval_runtime": 11.
|
57 |
-
"eval_samples_per_second":
|
58 |
-
"eval_steps_per_second":
|
59 |
"eval_unc_insert_err_f1": 0.0,
|
60 |
"eval_unc_insert_err_number": 902,
|
61 |
"eval_unc_insert_err_precision": 0.0,
|
@@ -112,9 +112,9 @@
|
|
112 |
"eval_ne_word_err_precision": 0.7050460865489767,
|
113 |
"eval_ne_word_err_recall": 0.5472292955013944,
|
114 |
"eval_overall_accuracy": 0.9455378089528188,
|
115 |
-
"eval_runtime":
|
116 |
-
"eval_samples_per_second":
|
117 |
-
"eval_steps_per_second":
|
118 |
"eval_unc_insert_err_f1": 0.0022148394241417496,
|
119 |
"eval_unc_insert_err_number": 902,
|
120 |
"eval_unc_insert_err_precision": 1.0,
|
@@ -171,9 +171,9 @@
|
|
171 |
"eval_ne_word_err_precision": 0.7622462787550744,
|
172 |
"eval_ne_word_err_recall": 0.6830362556080999,
|
173 |
"eval_overall_accuracy": 0.9567288324367876,
|
174 |
-
"eval_runtime": 11.
|
175 |
-
"eval_samples_per_second":
|
176 |
-
"eval_steps_per_second":
|
177 |
"eval_unc_insert_err_f1": 0.3054662379421222,
|
178 |
"eval_unc_insert_err_number": 902,
|
179 |
"eval_unc_insert_err_precision": 0.5555555555555556,
|
@@ -230,9 +230,9 @@
|
|
230 |
"eval_ne_word_err_precision": 0.8228239366963402,
|
231 |
"eval_ne_word_err_recall": 0.8069601067054687,
|
232 |
"eval_overall_accuracy": 0.9701177753027322,
|
233 |
-
"eval_runtime": 11.
|
234 |
-
"eval_samples_per_second":
|
235 |
-
"eval_steps_per_second": 99.
|
236 |
"eval_unc_insert_err_f1": 0.37326813365933176,
|
237 |
"eval_unc_insert_err_number": 902,
|
238 |
"eval_unc_insert_err_precision": 0.7046153846153846,
|
@@ -289,9 +289,9 @@
|
|
289 |
"eval_ne_word_err_precision": 0.887815750371471,
|
290 |
"eval_ne_word_err_recall": 0.869407057111677,
|
291 |
"eval_overall_accuracy": 0.9797270077489988,
|
292 |
-
"eval_runtime": 11.
|
293 |
-
"eval_samples_per_second":
|
294 |
-
"eval_steps_per_second": 99.
|
295 |
"eval_unc_insert_err_f1": 0.5340674466620785,
|
296 |
"eval_unc_insert_err_number": 902,
|
297 |
"eval_unc_insert_err_precision": 0.7041742286751361,
|
@@ -348,9 +348,9 @@
|
|
348 |
"eval_ne_word_err_precision": 0.918532634587899,
|
349 |
"eval_ne_word_err_recall": 0.935127925306172,
|
350 |
"eval_overall_accuracy": 0.9874049148084078,
|
351 |
-
"eval_runtime": 11.
|
352 |
-
"eval_samples_per_second":
|
353 |
-
"eval_steps_per_second":
|
354 |
"eval_unc_insert_err_f1": 0.7559591373439274,
|
355 |
"eval_unc_insert_err_number": 902,
|
356 |
"eval_unc_insert_err_precision": 0.7744186046511627,
|
@@ -407,9 +407,9 @@
|
|
407 |
"eval_ne_word_err_precision": 0.9517692680562287,
|
408 |
"eval_ne_word_err_recall": 0.9523463077482721,
|
409 |
"eval_overall_accuracy": 0.9913860518021754,
|
410 |
-
"eval_runtime": 11.
|
411 |
-
"eval_samples_per_second":
|
412 |
-
"eval_steps_per_second":
|
413 |
"eval_unc_insert_err_f1": 0.8407367280606717,
|
414 |
"eval_unc_insert_err_number": 902,
|
415 |
"eval_unc_insert_err_precision": 0.8220338983050848,
|
@@ -466,9 +466,9 @@
|
|
466 |
"eval_ne_word_err_precision": 0.9697043435941112,
|
467 |
"eval_ne_word_err_recall": 0.9664120286164666,
|
468 |
"eval_overall_accuracy": 0.9938387165572644,
|
469 |
-
"eval_runtime": 11.
|
470 |
-
"eval_samples_per_second":
|
471 |
-
"eval_steps_per_second": 99.
|
472 |
"eval_unc_insert_err_f1": 0.897196261682243,
|
473 |
"eval_unc_insert_err_number": 902,
|
474 |
"eval_unc_insert_err_precision": 0.8898582333696837,
|
@@ -525,9 +525,9 @@
|
|
525 |
"eval_ne_word_err_precision": 0.9782503037667072,
|
526 |
"eval_ne_word_err_recall": 0.9762337819813266,
|
527 |
"eval_overall_accuracy": 0.9954619777719851,
|
528 |
-
"eval_runtime": 11.
|
529 |
-
"eval_samples_per_second":
|
530 |
-
"eval_steps_per_second":
|
531 |
"eval_unc_insert_err_f1": 0.934559221200649,
|
532 |
"eval_unc_insert_err_number": 902,
|
533 |
"eval_unc_insert_err_precision": 0.9123548046462513,
|
@@ -584,9 +584,9 @@
|
|
584 |
"eval_ne_word_err_precision": 0.9809141745684415,
|
585 |
"eval_ne_word_err_recall": 0.9784163938401843,
|
586 |
"eval_overall_accuracy": 0.9963387758003744,
|
587 |
-
"eval_runtime": 11.
|
588 |
-
"eval_samples_per_second":
|
589 |
-
"eval_steps_per_second": 99.
|
590 |
"eval_unc_insert_err_f1": 0.9537289058247141,
|
591 |
"eval_unc_insert_err_number": 902,
|
592 |
"eval_unc_insert_err_precision": 0.9368983957219251,
|
@@ -643,9 +643,9 @@
|
|
643 |
"eval_ne_word_err_precision": 0.989462075726014,
|
644 |
"eval_ne_word_err_recall": 0.9791439311264702,
|
645 |
"eval_overall_accuracy": 0.9968541908576033,
|
646 |
-
"eval_runtime": 11.
|
647 |
-
"eval_samples_per_second":
|
648 |
-
"eval_steps_per_second":
|
649 |
"eval_unc_insert_err_f1": 0.9379310344827587,
|
650 |
"eval_unc_insert_err_number": 902,
|
651 |
"eval_unc_insert_err_precision": 0.8992878942014242,
|
@@ -702,9 +702,9 @@
|
|
702 |
"eval_ne_word_err_precision": 0.9917153996101364,
|
703 |
"eval_ne_word_err_recall": 0.9870255850612344,
|
704 |
"eval_overall_accuracy": 0.9976184269769426,
|
705 |
-
"eval_runtime": 11.
|
706 |
-
"eval_samples_per_second":
|
707 |
-
"eval_steps_per_second":
|
708 |
"eval_unc_insert_err_f1": 0.9763866007688083,
|
709 |
"eval_unc_insert_err_number": 902,
|
710 |
"eval_unc_insert_err_precision": 0.9673558215451578,
|
@@ -761,9 +761,9 @@
|
|
761 |
"eval_ne_word_err_precision": 0.991969826012897,
|
762 |
"eval_ne_word_err_recall": 0.9886019158481872,
|
763 |
"eval_overall_accuracy": 0.9980627503021399,
|
764 |
-
"eval_runtime": 11.
|
765 |
-
"eval_samples_per_second":
|
766 |
-
"eval_steps_per_second": 99.
|
767 |
"eval_unc_insert_err_f1": 0.9796367638965328,
|
768 |
"eval_unc_insert_err_number": 902,
|
769 |
"eval_unc_insert_err_precision": 0.9726775956284153,
|
@@ -820,9 +820,9 @@
|
|
820 |
"eval_ne_word_err_precision": 0.9943957115009746,
|
821 |
"eval_ne_word_err_recall": 0.9896932217776161,
|
822 |
"eval_overall_accuracy": 0.9983589658522714,
|
823 |
-
"eval_runtime": 11.
|
824 |
-
"eval_samples_per_second":
|
825 |
-
"eval_steps_per_second":
|
826 |
"eval_unc_insert_err_f1": 0.9839513004980631,
|
827 |
"eval_unc_insert_err_number": 902,
|
828 |
"eval_unc_insert_err_precision": 0.9823204419889503,
|
@@ -879,9 +879,9 @@
|
|
879 |
"eval_ne_word_err_precision": 0.9951290793960058,
|
880 |
"eval_ne_word_err_recall": 0.9909057839214259,
|
881 |
"eval_overall_accuracy": 0.9986137112253844,
|
882 |
-
"eval_runtime": 11.
|
883 |
-
"eval_samples_per_second":
|
884 |
-
"eval_steps_per_second":
|
885 |
"eval_unc_insert_err_f1": 0.991111111111111,
|
886 |
"eval_unc_insert_err_number": 902,
|
887 |
"eval_unc_insert_err_precision": 0.9933184855233853,
|
@@ -938,9 +938,9 @@
|
|
938 |
"eval_ne_word_err_precision": 0.9948998178506375,
|
939 |
"eval_ne_word_err_recall": 0.9934521644234267,
|
940 |
"eval_overall_accuracy": 0.998862532287495,
|
941 |
-
"eval_runtime":
|
942 |
-
"eval_samples_per_second":
|
943 |
-
"eval_steps_per_second":
|
944 |
"eval_unc_insert_err_f1": 0.9900662251655629,
|
945 |
"eval_unc_insert_err_number": 902,
|
946 |
"eval_unc_insert_err_precision": 0.9857142857142858,
|
@@ -997,9 +997,9 @@
|
|
997 |
"eval_ne_word_err_precision": 0.9945454545454545,
|
998 |
"eval_ne_word_err_recall": 0.9949072389959985,
|
999 |
"eval_overall_accuracy": 0.9990106400625607,
|
1000 |
-
"eval_runtime": 11.
|
1001 |
-
"eval_samples_per_second":
|
1002 |
-
"eval_steps_per_second": 99.
|
1003 |
"eval_unc_insert_err_f1": 0.9927897947864671,
|
1004 |
"eval_unc_insert_err_number": 902,
|
1005 |
"eval_unc_insert_err_precision": 0.9933407325194229,
|
@@ -1056,9 +1056,9 @@
|
|
1056 |
"eval_ne_word_err_precision": 0.9949097079141922,
|
1057 |
"eval_ne_word_err_recall": 0.9953922638535225,
|
1058 |
"eval_overall_accuracy": 0.9991054290386028,
|
1059 |
-
"eval_runtime": 11.
|
1060 |
-
"eval_samples_per_second":
|
1061 |
-
"eval_steps_per_second":
|
1062 |
"eval_unc_insert_err_f1": 0.9927897947864671,
|
1063 |
"eval_unc_insert_err_number": 902,
|
1064 |
"eval_unc_insert_err_precision": 0.9933407325194229,
|
@@ -1115,9 +1115,9 @@
|
|
1115 |
"eval_ne_word_err_precision": 0.9956300072833212,
|
1116 |
"eval_ne_word_err_recall": 0.9945434703528556,
|
1117 |
"eval_overall_accuracy": 0.9992179909476527,
|
1118 |
-
"eval_runtime": 11.
|
1119 |
-
"eval_samples_per_second":
|
1120 |
-
"eval_steps_per_second":
|
1121 |
"eval_unc_insert_err_f1": 0.9933701657458565,
|
1122 |
"eval_unc_insert_err_number": 902,
|
1123 |
"eval_unc_insert_err_precision": 0.9900881057268722,
|
@@ -1174,9 +1174,9 @@
|
|
1174 |
"eval_ne_word_err_precision": 0.9959941733430444,
|
1175 |
"eval_ne_word_err_recall": 0.9949072389959985,
|
1176 |
"eval_overall_accuracy": 0.9992594611246712,
|
1177 |
-
"eval_runtime": 11.
|
1178 |
-
"eval_samples_per_second":
|
1179 |
-
"eval_steps_per_second":
|
1180 |
"eval_unc_insert_err_f1": 0.9944444444444444,
|
1181 |
"eval_unc_insert_err_number": 902,
|
1182 |
"eval_unc_insert_err_precision": 0.9966592427616926,
|
@@ -1233,9 +1233,9 @@
|
|
1233 |
"eval_ne_word_err_precision": 0.9953922638535225,
|
1234 |
"eval_ne_word_err_recall": 0.9953922638535225,
|
1235 |
"eval_overall_accuracy": 0.999295006990687,
|
1236 |
-
"eval_runtime": 11.
|
1237 |
-
"eval_samples_per_second":
|
1238 |
-
"eval_steps_per_second":
|
1239 |
"eval_unc_insert_err_f1": 0.9944506104328523,
|
1240 |
"eval_unc_insert_err_number": 902,
|
1241 |
"eval_unc_insert_err_precision": 0.9955555555555555,
|
@@ -1292,9 +1292,9 @@
|
|
1292 |
"eval_ne_word_err_precision": 0.996719319562576,
|
1293 |
"eval_ne_word_err_recall": 0.9946647265672366,
|
1294 |
"eval_overall_accuracy": 0.9993127799236948,
|
1295 |
-
"eval_runtime": 11.
|
1296 |
-
"eval_samples_per_second":
|
1297 |
-
"eval_steps_per_second":
|
1298 |
"eval_unc_insert_err_f1": 0.9939125622578859,
|
1299 |
"eval_unc_insert_err_number": 902,
|
1300 |
"eval_unc_insert_err_precision": 0.9922651933701657,
|
@@ -1351,9 +1351,9 @@
|
|
1351 |
"eval_ne_word_err_precision": 0.9975666139433021,
|
1352 |
"eval_ne_word_err_recall": 0.9941797017097126,
|
1353 |
"eval_overall_accuracy": 0.9993601744117159,
|
1354 |
-
"eval_runtime": 11.
|
1355 |
-
"eval_samples_per_second":
|
1356 |
-
"eval_steps_per_second": 99.
|
1357 |
"eval_unc_insert_err_f1": 0.9950193691200886,
|
1358 |
"eval_unc_insert_err_number": 902,
|
1359 |
"eval_unc_insert_err_precision": 0.9933701657458563,
|
@@ -1410,9 +1410,9 @@
|
|
1410 |
"eval_ne_word_err_precision": 0.9959966031784544,
|
1411 |
"eval_ne_word_err_recall": 0.9955135200679035,
|
1412 |
"eval_overall_accuracy": 0.9993720230337212,
|
1413 |
-
"eval_runtime": 11.
|
1414 |
-
"eval_samples_per_second":
|
1415 |
-
"eval_steps_per_second":
|
1416 |
"eval_unc_insert_err_f1": 0.9950138504155125,
|
1417 |
"eval_unc_insert_err_number": 902,
|
1418 |
"eval_unc_insert_err_precision": 0.9944629014396457,
|
@@ -1469,9 +1469,9 @@
|
|
1469 |
"eval_ne_word_err_precision": 0.9968412100595311,
|
1470 |
"eval_ne_word_err_recall": 0.9949072389959985,
|
1471 |
"eval_overall_accuracy": 0.9993720230337212,
|
1472 |
-
"eval_runtime": 11.
|
1473 |
-
"eval_samples_per_second":
|
1474 |
-
"eval_steps_per_second": 98.
|
1475 |
"eval_unc_insert_err_f1": 0.9955654101995566,
|
1476 |
"eval_unc_insert_err_number": 902,
|
1477 |
"eval_unc_insert_err_precision": 0.9955654101995566,
|
@@ -1528,9 +1528,9 @@
|
|
1528 |
"eval_ne_word_err_precision": 0.9957565470417071,
|
1529 |
"eval_ne_word_err_recall": 0.9958772887110464,
|
1530 |
"eval_overall_accuracy": 0.9993779473447238,
|
1531 |
-
"eval_runtime": 11.
|
1532 |
-
"eval_samples_per_second":
|
1533 |
-
"eval_steps_per_second": 99.
|
1534 |
"eval_unc_insert_err_f1": 0.995575221238938,
|
1535 |
"eval_unc_insert_err_number": 902,
|
1536 |
"eval_unc_insert_err_precision": 0.9933774834437086,
|
@@ -1587,9 +1587,9 @@
|
|
1587 |
"eval_ne_word_err_precision": 0.9964784456587735,
|
1588 |
"eval_ne_word_err_recall": 0.9950284952103795,
|
1589 |
"eval_overall_accuracy": 0.9993720230337212,
|
1590 |
-
"eval_runtime": 11.
|
1591 |
-
"eval_samples_per_second":
|
1592 |
-
"eval_steps_per_second":
|
1593 |
"eval_unc_insert_err_f1": 0.9955703211517165,
|
1594 |
"eval_unc_insert_err_number": 902,
|
1595 |
"eval_unc_insert_err_precision": 0.9944690265486725,
|
@@ -1646,9 +1646,9 @@
|
|
1646 |
"eval_ne_word_err_precision": 0.9963578972927036,
|
1647 |
"eval_ne_word_err_recall": 0.9951497514247605,
|
1648 |
"eval_overall_accuracy": 0.9993838716557264,
|
1649 |
-
"eval_runtime": 11.
|
1650 |
-
"eval_samples_per_second":
|
1651 |
-
"eval_steps_per_second":
|
1652 |
"eval_unc_insert_err_f1": 0.9955703211517165,
|
1653 |
"eval_unc_insert_err_number": 902,
|
1654 |
"eval_unc_insert_err_precision": 0.9944690265486725,
|
@@ -1705,9 +1705,9 @@
|
|
1705 |
"eval_ne_word_err_precision": 0.9962374074523607,
|
1706 |
"eval_ne_word_err_recall": 0.9952710076391416,
|
1707 |
"eval_overall_accuracy": 0.9993957202777317,
|
1708 |
-
"eval_runtime": 11.
|
1709 |
-
"eval_samples_per_second":
|
1710 |
-
"eval_steps_per_second": 99.
|
1711 |
"eval_unc_insert_err_f1": 0.9961175818080976,
|
1712 |
"eval_unc_insert_err_number": 902,
|
1713 |
"eval_unc_insert_err_precision": 0.9966703662597114,
|
@@ -1764,9 +1764,9 @@
|
|
1764 |
"eval_ne_word_err_precision": 0.9970827762246263,
|
1765 |
"eval_ne_word_err_recall": 0.9946647265672366,
|
1766 |
"eval_overall_accuracy": 0.9993957202777317,
|
1767 |
-
"eval_runtime": 11.
|
1768 |
-
"eval_samples_per_second":
|
1769 |
-
"eval_steps_per_second":
|
1770 |
"eval_unc_insert_err_f1": 0.9961218836565098,
|
1771 |
"eval_unc_insert_err_number": 902,
|
1772 |
"eval_unc_insert_err_precision": 0.9955703211517165,
|
@@ -1782,9 +1782,9 @@
|
|
1782 |
"step": 17250,
|
1783 |
"total_flos": 7911429330344064.0,
|
1784 |
"train_loss": 0.06519987745561462,
|
1785 |
-
"train_runtime": 1743.
|
1786 |
-
"train_samples_per_second": 316.
|
1787 |
-
"train_steps_per_second": 9.
|
1788 |
}
|
1789 |
],
|
1790 |
"max_steps": 17250,
|
|
|
53 |
"eval_ne_word_err_precision": 0.6340406114533425,
|
54 |
"eval_ne_word_err_recall": 0.33697101976476296,
|
55 |
"eval_overall_accuracy": 0.9313016896134979,
|
56 |
+
"eval_runtime": 11.367,
|
57 |
+
"eval_samples_per_second": 1617.671,
|
58 |
+
"eval_steps_per_second": 101.17,
|
59 |
"eval_unc_insert_err_f1": 0.0,
|
60 |
"eval_unc_insert_err_number": 902,
|
61 |
"eval_unc_insert_err_precision": 0.0,
|
|
|
112 |
"eval_ne_word_err_precision": 0.7050460865489767,
|
113 |
"eval_ne_word_err_recall": 0.5472292955013944,
|
114 |
"eval_overall_accuracy": 0.9455378089528188,
|
115 |
+
"eval_runtime": 11.0987,
|
116 |
+
"eval_samples_per_second": 1656.776,
|
117 |
+
"eval_steps_per_second": 103.616,
|
118 |
"eval_unc_insert_err_f1": 0.0022148394241417496,
|
119 |
"eval_unc_insert_err_number": 902,
|
120 |
"eval_unc_insert_err_precision": 1.0,
|
|
|
171 |
"eval_ne_word_err_precision": 0.7622462787550744,
|
172 |
"eval_ne_word_err_recall": 0.6830362556080999,
|
173 |
"eval_overall_accuracy": 0.9567288324367876,
|
174 |
+
"eval_runtime": 11.1567,
|
175 |
+
"eval_samples_per_second": 1648.155,
|
176 |
+
"eval_steps_per_second": 103.077,
|
177 |
"eval_unc_insert_err_f1": 0.3054662379421222,
|
178 |
"eval_unc_insert_err_number": 902,
|
179 |
"eval_unc_insert_err_precision": 0.5555555555555556,
|
|
|
230 |
"eval_ne_word_err_precision": 0.8228239366963402,
|
231 |
"eval_ne_word_err_recall": 0.8069601067054687,
|
232 |
"eval_overall_accuracy": 0.9701177753027322,
|
233 |
+
"eval_runtime": 11.5543,
|
234 |
+
"eval_samples_per_second": 1591.447,
|
235 |
+
"eval_steps_per_second": 99.53,
|
236 |
"eval_unc_insert_err_f1": 0.37326813365933176,
|
237 |
"eval_unc_insert_err_number": 902,
|
238 |
"eval_unc_insert_err_precision": 0.7046153846153846,
|
|
|
289 |
"eval_ne_word_err_precision": 0.887815750371471,
|
290 |
"eval_ne_word_err_recall": 0.869407057111677,
|
291 |
"eval_overall_accuracy": 0.9797270077489988,
|
292 |
+
"eval_runtime": 11.5559,
|
293 |
+
"eval_samples_per_second": 1591.224,
|
294 |
+
"eval_steps_per_second": 99.516,
|
295 |
"eval_unc_insert_err_f1": 0.5340674466620785,
|
296 |
"eval_unc_insert_err_number": 902,
|
297 |
"eval_unc_insert_err_precision": 0.7041742286751361,
|
|
|
348 |
"eval_ne_word_err_precision": 0.918532634587899,
|
349 |
"eval_ne_word_err_recall": 0.935127925306172,
|
350 |
"eval_overall_accuracy": 0.9874049148084078,
|
351 |
+
"eval_runtime": 11.4906,
|
352 |
+
"eval_samples_per_second": 1600.268,
|
353 |
+
"eval_steps_per_second": 100.082,
|
354 |
"eval_unc_insert_err_f1": 0.7559591373439274,
|
355 |
"eval_unc_insert_err_number": 902,
|
356 |
"eval_unc_insert_err_precision": 0.7744186046511627,
|
|
|
407 |
"eval_ne_word_err_precision": 0.9517692680562287,
|
408 |
"eval_ne_word_err_recall": 0.9523463077482721,
|
409 |
"eval_overall_accuracy": 0.9913860518021754,
|
410 |
+
"eval_runtime": 11.5809,
|
411 |
+
"eval_samples_per_second": 1587.783,
|
412 |
+
"eval_steps_per_second": 99.301,
|
413 |
"eval_unc_insert_err_f1": 0.8407367280606717,
|
414 |
"eval_unc_insert_err_number": 902,
|
415 |
"eval_unc_insert_err_precision": 0.8220338983050848,
|
|
|
466 |
"eval_ne_word_err_precision": 0.9697043435941112,
|
467 |
"eval_ne_word_err_recall": 0.9664120286164666,
|
468 |
"eval_overall_accuracy": 0.9938387165572644,
|
469 |
+
"eval_runtime": 11.5948,
|
470 |
+
"eval_samples_per_second": 1585.884,
|
471 |
+
"eval_steps_per_second": 99.182,
|
472 |
"eval_unc_insert_err_f1": 0.897196261682243,
|
473 |
"eval_unc_insert_err_number": 902,
|
474 |
"eval_unc_insert_err_precision": 0.8898582333696837,
|
|
|
525 |
"eval_ne_word_err_precision": 0.9782503037667072,
|
526 |
"eval_ne_word_err_recall": 0.9762337819813266,
|
527 |
"eval_overall_accuracy": 0.9954619777719851,
|
528 |
+
"eval_runtime": 11.4901,
|
529 |
+
"eval_samples_per_second": 1600.333,
|
530 |
+
"eval_steps_per_second": 100.086,
|
531 |
"eval_unc_insert_err_f1": 0.934559221200649,
|
532 |
"eval_unc_insert_err_number": 902,
|
533 |
"eval_unc_insert_err_precision": 0.9123548046462513,
|
|
|
584 |
"eval_ne_word_err_precision": 0.9809141745684415,
|
585 |
"eval_ne_word_err_recall": 0.9784163938401843,
|
586 |
"eval_overall_accuracy": 0.9963387758003744,
|
587 |
+
"eval_runtime": 11.5603,
|
588 |
+
"eval_samples_per_second": 1590.617,
|
589 |
+
"eval_steps_per_second": 99.478,
|
590 |
"eval_unc_insert_err_f1": 0.9537289058247141,
|
591 |
"eval_unc_insert_err_number": 902,
|
592 |
"eval_unc_insert_err_precision": 0.9368983957219251,
|
|
|
643 |
"eval_ne_word_err_precision": 0.989462075726014,
|
644 |
"eval_ne_word_err_recall": 0.9791439311264702,
|
645 |
"eval_overall_accuracy": 0.9968541908576033,
|
646 |
+
"eval_runtime": 11.4621,
|
647 |
+
"eval_samples_per_second": 1604.24,
|
648 |
+
"eval_steps_per_second": 100.33,
|
649 |
"eval_unc_insert_err_f1": 0.9379310344827587,
|
650 |
"eval_unc_insert_err_number": 902,
|
651 |
"eval_unc_insert_err_precision": 0.8992878942014242,
|
|
|
702 |
"eval_ne_word_err_precision": 0.9917153996101364,
|
703 |
"eval_ne_word_err_recall": 0.9870255850612344,
|
704 |
"eval_overall_accuracy": 0.9976184269769426,
|
705 |
+
"eval_runtime": 11.7351,
|
706 |
+
"eval_samples_per_second": 1566.929,
|
707 |
+
"eval_steps_per_second": 97.997,
|
708 |
"eval_unc_insert_err_f1": 0.9763866007688083,
|
709 |
"eval_unc_insert_err_number": 902,
|
710 |
"eval_unc_insert_err_precision": 0.9673558215451578,
|
|
|
761 |
"eval_ne_word_err_precision": 0.991969826012897,
|
762 |
"eval_ne_word_err_recall": 0.9886019158481872,
|
763 |
"eval_overall_accuracy": 0.9980627503021399,
|
764 |
+
"eval_runtime": 11.5718,
|
765 |
+
"eval_samples_per_second": 1589.041,
|
766 |
+
"eval_steps_per_second": 99.38,
|
767 |
"eval_unc_insert_err_f1": 0.9796367638965328,
|
768 |
"eval_unc_insert_err_number": 902,
|
769 |
"eval_unc_insert_err_precision": 0.9726775956284153,
|
|
|
820 |
"eval_ne_word_err_precision": 0.9943957115009746,
|
821 |
"eval_ne_word_err_recall": 0.9896932217776161,
|
822 |
"eval_overall_accuracy": 0.9983589658522714,
|
823 |
+
"eval_runtime": 11.4901,
|
824 |
+
"eval_samples_per_second": 1600.34,
|
825 |
+
"eval_steps_per_second": 100.087,
|
826 |
"eval_unc_insert_err_f1": 0.9839513004980631,
|
827 |
"eval_unc_insert_err_number": 902,
|
828 |
"eval_unc_insert_err_precision": 0.9823204419889503,
|
|
|
879 |
"eval_ne_word_err_precision": 0.9951290793960058,
|
880 |
"eval_ne_word_err_recall": 0.9909057839214259,
|
881 |
"eval_overall_accuracy": 0.9986137112253844,
|
882 |
+
"eval_runtime": 11.4842,
|
883 |
+
"eval_samples_per_second": 1601.155,
|
884 |
+
"eval_steps_per_second": 100.137,
|
885 |
"eval_unc_insert_err_f1": 0.991111111111111,
|
886 |
"eval_unc_insert_err_number": 902,
|
887 |
"eval_unc_insert_err_precision": 0.9933184855233853,
|
|
|
938 |
"eval_ne_word_err_precision": 0.9948998178506375,
|
939 |
"eval_ne_word_err_recall": 0.9934521644234267,
|
940 |
"eval_overall_accuracy": 0.998862532287495,
|
941 |
+
"eval_runtime": 11.5461,
|
942 |
+
"eval_samples_per_second": 1592.57,
|
943 |
+
"eval_steps_per_second": 99.601,
|
944 |
"eval_unc_insert_err_f1": 0.9900662251655629,
|
945 |
"eval_unc_insert_err_number": 902,
|
946 |
"eval_unc_insert_err_precision": 0.9857142857142858,
|
|
|
997 |
"eval_ne_word_err_precision": 0.9945454545454545,
|
998 |
"eval_ne_word_err_recall": 0.9949072389959985,
|
999 |
"eval_overall_accuracy": 0.9990106400625607,
|
1000 |
+
"eval_runtime": 11.5275,
|
1001 |
+
"eval_samples_per_second": 1595.144,
|
1002 |
+
"eval_steps_per_second": 99.762,
|
1003 |
"eval_unc_insert_err_f1": 0.9927897947864671,
|
1004 |
"eval_unc_insert_err_number": 902,
|
1005 |
"eval_unc_insert_err_precision": 0.9933407325194229,
|
|
|
1056 |
"eval_ne_word_err_precision": 0.9949097079141922,
|
1057 |
"eval_ne_word_err_recall": 0.9953922638535225,
|
1058 |
"eval_overall_accuracy": 0.9991054290386028,
|
1059 |
+
"eval_runtime": 11.4848,
|
1060 |
+
"eval_samples_per_second": 1601.066,
|
1061 |
+
"eval_steps_per_second": 100.132,
|
1062 |
"eval_unc_insert_err_f1": 0.9927897947864671,
|
1063 |
"eval_unc_insert_err_number": 902,
|
1064 |
"eval_unc_insert_err_precision": 0.9933407325194229,
|
|
|
1115 |
"eval_ne_word_err_precision": 0.9956300072833212,
|
1116 |
"eval_ne_word_err_recall": 0.9945434703528556,
|
1117 |
"eval_overall_accuracy": 0.9992179909476527,
|
1118 |
+
"eval_runtime": 11.5451,
|
1119 |
+
"eval_samples_per_second": 1592.714,
|
1120 |
+
"eval_steps_per_second": 99.61,
|
1121 |
"eval_unc_insert_err_f1": 0.9933701657458565,
|
1122 |
"eval_unc_insert_err_number": 902,
|
1123 |
"eval_unc_insert_err_precision": 0.9900881057268722,
|
|
|
1174 |
"eval_ne_word_err_precision": 0.9959941733430444,
|
1175 |
"eval_ne_word_err_recall": 0.9949072389959985,
|
1176 |
"eval_overall_accuracy": 0.9992594611246712,
|
1177 |
+
"eval_runtime": 11.5037,
|
1178 |
+
"eval_samples_per_second": 1598.447,
|
1179 |
+
"eval_steps_per_second": 99.968,
|
1180 |
"eval_unc_insert_err_f1": 0.9944444444444444,
|
1181 |
"eval_unc_insert_err_number": 902,
|
1182 |
"eval_unc_insert_err_precision": 0.9966592427616926,
|
|
|
1233 |
"eval_ne_word_err_precision": 0.9953922638535225,
|
1234 |
"eval_ne_word_err_recall": 0.9953922638535225,
|
1235 |
"eval_overall_accuracy": 0.999295006990687,
|
1236 |
+
"eval_runtime": 11.4631,
|
1237 |
+
"eval_samples_per_second": 1604.101,
|
1238 |
+
"eval_steps_per_second": 100.322,
|
1239 |
"eval_unc_insert_err_f1": 0.9944506104328523,
|
1240 |
"eval_unc_insert_err_number": 902,
|
1241 |
"eval_unc_insert_err_precision": 0.9955555555555555,
|
|
|
1292 |
"eval_ne_word_err_precision": 0.996719319562576,
|
1293 |
"eval_ne_word_err_recall": 0.9946647265672366,
|
1294 |
"eval_overall_accuracy": 0.9993127799236948,
|
1295 |
+
"eval_runtime": 11.5654,
|
1296 |
+
"eval_samples_per_second": 1589.911,
|
1297 |
+
"eval_steps_per_second": 99.434,
|
1298 |
"eval_unc_insert_err_f1": 0.9939125622578859,
|
1299 |
"eval_unc_insert_err_number": 902,
|
1300 |
"eval_unc_insert_err_precision": 0.9922651933701657,
|
|
|
1351 |
"eval_ne_word_err_precision": 0.9975666139433021,
|
1352 |
"eval_ne_word_err_recall": 0.9941797017097126,
|
1353 |
"eval_overall_accuracy": 0.9993601744117159,
|
1354 |
+
"eval_runtime": 11.5142,
|
1355 |
+
"eval_samples_per_second": 1596.978,
|
1356 |
+
"eval_steps_per_second": 99.876,
|
1357 |
"eval_unc_insert_err_f1": 0.9950193691200886,
|
1358 |
"eval_unc_insert_err_number": 902,
|
1359 |
"eval_unc_insert_err_precision": 0.9933701657458563,
|
|
|
1410 |
"eval_ne_word_err_precision": 0.9959966031784544,
|
1411 |
"eval_ne_word_err_recall": 0.9955135200679035,
|
1412 |
"eval_overall_accuracy": 0.9993720230337212,
|
1413 |
+
"eval_runtime": 11.4924,
|
1414 |
+
"eval_samples_per_second": 1600.014,
|
1415 |
+
"eval_steps_per_second": 100.066,
|
1416 |
"eval_unc_insert_err_f1": 0.9950138504155125,
|
1417 |
"eval_unc_insert_err_number": 902,
|
1418 |
"eval_unc_insert_err_precision": 0.9944629014396457,
|
|
|
1469 |
"eval_ne_word_err_precision": 0.9968412100595311,
|
1470 |
"eval_ne_word_err_recall": 0.9949072389959985,
|
1471 |
"eval_overall_accuracy": 0.9993720230337212,
|
1472 |
+
"eval_runtime": 11.6279,
|
1473 |
+
"eval_samples_per_second": 1581.368,
|
1474 |
+
"eval_steps_per_second": 98.9,
|
1475 |
"eval_unc_insert_err_f1": 0.9955654101995566,
|
1476 |
"eval_unc_insert_err_number": 902,
|
1477 |
"eval_unc_insert_err_precision": 0.9955654101995566,
|
|
|
1528 |
"eval_ne_word_err_precision": 0.9957565470417071,
|
1529 |
"eval_ne_word_err_recall": 0.9958772887110464,
|
1530 |
"eval_overall_accuracy": 0.9993779473447238,
|
1531 |
+
"eval_runtime": 11.5517,
|
1532 |
+
"eval_samples_per_second": 1591.803,
|
1533 |
+
"eval_steps_per_second": 99.553,
|
1534 |
"eval_unc_insert_err_f1": 0.995575221238938,
|
1535 |
"eval_unc_insert_err_number": 902,
|
1536 |
"eval_unc_insert_err_precision": 0.9933774834437086,
|
|
|
1587 |
"eval_ne_word_err_precision": 0.9964784456587735,
|
1588 |
"eval_ne_word_err_recall": 0.9950284952103795,
|
1589 |
"eval_overall_accuracy": 0.9993720230337212,
|
1590 |
+
"eval_runtime": 11.5195,
|
1591 |
+
"eval_samples_per_second": 1596.249,
|
1592 |
+
"eval_steps_per_second": 99.831,
|
1593 |
"eval_unc_insert_err_f1": 0.9955703211517165,
|
1594 |
"eval_unc_insert_err_number": 902,
|
1595 |
"eval_unc_insert_err_precision": 0.9944690265486725,
|
|
|
1646 |
"eval_ne_word_err_precision": 0.9963578972927036,
|
1647 |
"eval_ne_word_err_recall": 0.9951497514247605,
|
1648 |
"eval_overall_accuracy": 0.9993838716557264,
|
1649 |
+
"eval_runtime": 11.5765,
|
1650 |
+
"eval_samples_per_second": 1588.392,
|
1651 |
+
"eval_steps_per_second": 99.339,
|
1652 |
"eval_unc_insert_err_f1": 0.9955703211517165,
|
1653 |
"eval_unc_insert_err_number": 902,
|
1654 |
"eval_unc_insert_err_precision": 0.9944690265486725,
|
|
|
1705 |
"eval_ne_word_err_precision": 0.9962374074523607,
|
1706 |
"eval_ne_word_err_recall": 0.9952710076391416,
|
1707 |
"eval_overall_accuracy": 0.9993957202777317,
|
1708 |
+
"eval_runtime": 11.5017,
|
1709 |
+
"eval_samples_per_second": 1598.724,
|
1710 |
+
"eval_steps_per_second": 99.985,
|
1711 |
"eval_unc_insert_err_f1": 0.9961175818080976,
|
1712 |
"eval_unc_insert_err_number": 902,
|
1713 |
"eval_unc_insert_err_precision": 0.9966703662597114,
|
|
|
1764 |
"eval_ne_word_err_precision": 0.9970827762246263,
|
1765 |
"eval_ne_word_err_recall": 0.9946647265672366,
|
1766 |
"eval_overall_accuracy": 0.9993957202777317,
|
1767 |
+
"eval_runtime": 11.5014,
|
1768 |
+
"eval_samples_per_second": 1598.761,
|
1769 |
+
"eval_steps_per_second": 99.988,
|
1770 |
"eval_unc_insert_err_f1": 0.9961218836565098,
|
1771 |
"eval_unc_insert_err_number": 902,
|
1772 |
"eval_unc_insert_err_precision": 0.9955703211517165,
|
|
|
1782 |
"step": 17250,
|
1783 |
"total_flos": 7911429330344064.0,
|
1784 |
"train_loss": 0.06519987745561462,
|
1785 |
+
"train_runtime": 1743.8633,
|
1786 |
+
"train_samples_per_second": 316.332,
|
1787 |
+
"train_steps_per_second": 9.892
|
1788 |
}
|
1789 |
],
|
1790 |
"max_steps": 17250,
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3387
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:735e977a5aabe6e9dacf785770cbcf801ab51c2533de47ea8a4cedd007b5807f
|
3 |
size 3387
|