Shadman-Rohan commited on
Commit
3735434
·
1 Parent(s): ed3cd85

Training in progress, epoch 1

Browse files
all_results.json ADDED
@@ -0,0 +1,58 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 30.0,
3
+ "eval_5_err_f1": 0.9850746268656716,
4
+ "eval_5_err_number": 34,
5
+ "eval_5_err_precision": 1.0,
6
+ "eval_5_err_recall": 0.9705882352941176,
7
+ "eval___f1": 0.9912903388209234,
8
+ "eval___number": 9934,
9
+ "eval___precision": 0.9915399335280491,
10
+ "eval___recall": 0.9910408697402859,
11
+ "eval__err_f1": 0.9808695652173912,
12
+ "eval__err_number": 285,
13
+ "eval__err_precision": 0.9724137931034482,
14
+ "eval__err_recall": 0.9894736842105263,
15
+ "eval_egin_err_f1": 0.9933598937583,
16
+ "eval_egin_err_number": 1126,
17
+ "eval_egin_err_precision": 0.9902912621359223,
18
+ "eval_egin_err_recall": 0.9964476021314387,
19
+ "eval_el_err_f1": 0.9956584659913169,
20
+ "eval_el_err_number": 1380,
21
+ "eval_el_err_precision": 0.9942196531791907,
22
+ "eval_el_err_recall": 0.9971014492753624,
23
+ "eval_loss": 0.0013192046899348497,
24
+ "eval_macro_avg_f1": 0.9912800394235617,
25
+ "eval_macro_avg_number": 23096,
26
+ "eval_macro_avg_precision": 0.991795835558829,
27
+ "eval_macro_avg_recall": 0.990841420701172,
28
+ "eval_micro_avg_f1": 0.993373754872239,
29
+ "eval_micro_avg_number": 23096,
30
+ "eval_micro_avg_precision": 0.9936319528677872,
31
+ "eval_micro_avg_recall": 0.9931156910287495,
32
+ "eval_nd_err_f1": 0.9919932574799832,
33
+ "eval_nd_err_number": 1188,
34
+ "eval_nd_err_precision": 0.9932489451476794,
35
+ "eval_nd_err_recall": 0.9907407407407407,
36
+ "eval_ne_word_err_f1": 0.9958722835983974,
37
+ "eval_ne_word_err_number": 8247,
38
+ "eval_ne_word_err_precision": 0.9970827762246263,
39
+ "eval_ne_word_err_recall": 0.9946647265672366,
40
+ "eval_overall_accuracy": 0.9993957202777317,
41
+ "eval_runtime": 11.3466,
42
+ "eval_samples": 18388,
43
+ "eval_samples_per_second": 1620.567,
44
+ "eval_steps_per_second": 101.352,
45
+ "eval_unc_insert_err_f1": 0.9961218836565098,
46
+ "eval_unc_insert_err_number": 902,
47
+ "eval_unc_insert_err_precision": 0.9955703211517165,
48
+ "eval_unc_insert_err_recall": 0.9966740576496674,
49
+ "eval_weighted_avg_f1": 0.993375440096453,
50
+ "eval_weighted_avg_number": 23096,
51
+ "eval_weighted_avg_precision": 0.9936401344515604,
52
+ "eval_weighted_avg_recall": 0.9931156910287495,
53
+ "train_loss": 0.06519987745561462,
54
+ "train_runtime": 1743.5904,
55
+ "train_samples": 18388,
56
+ "train_samples_per_second": 316.382,
57
+ "train_steps_per_second": 9.893
58
+ }
eval_results.json ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 30.0,
3
+ "eval_5_err_f1": 0.9850746268656716,
4
+ "eval_5_err_number": 34,
5
+ "eval_5_err_precision": 1.0,
6
+ "eval_5_err_recall": 0.9705882352941176,
7
+ "eval___f1": 0.9912903388209234,
8
+ "eval___number": 9934,
9
+ "eval___precision": 0.9915399335280491,
10
+ "eval___recall": 0.9910408697402859,
11
+ "eval__err_f1": 0.9808695652173912,
12
+ "eval__err_number": 285,
13
+ "eval__err_precision": 0.9724137931034482,
14
+ "eval__err_recall": 0.9894736842105263,
15
+ "eval_egin_err_f1": 0.9933598937583,
16
+ "eval_egin_err_number": 1126,
17
+ "eval_egin_err_precision": 0.9902912621359223,
18
+ "eval_egin_err_recall": 0.9964476021314387,
19
+ "eval_el_err_f1": 0.9956584659913169,
20
+ "eval_el_err_number": 1380,
21
+ "eval_el_err_precision": 0.9942196531791907,
22
+ "eval_el_err_recall": 0.9971014492753624,
23
+ "eval_loss": 0.0013192046899348497,
24
+ "eval_macro_avg_f1": 0.9912800394235617,
25
+ "eval_macro_avg_number": 23096,
26
+ "eval_macro_avg_precision": 0.991795835558829,
27
+ "eval_macro_avg_recall": 0.990841420701172,
28
+ "eval_micro_avg_f1": 0.993373754872239,
29
+ "eval_micro_avg_number": 23096,
30
+ "eval_micro_avg_precision": 0.9936319528677872,
31
+ "eval_micro_avg_recall": 0.9931156910287495,
32
+ "eval_nd_err_f1": 0.9919932574799832,
33
+ "eval_nd_err_number": 1188,
34
+ "eval_nd_err_precision": 0.9932489451476794,
35
+ "eval_nd_err_recall": 0.9907407407407407,
36
+ "eval_ne_word_err_f1": 0.9958722835983974,
37
+ "eval_ne_word_err_number": 8247,
38
+ "eval_ne_word_err_precision": 0.9970827762246263,
39
+ "eval_ne_word_err_recall": 0.9946647265672366,
40
+ "eval_overall_accuracy": 0.9993957202777317,
41
+ "eval_runtime": 11.3466,
42
+ "eval_samples": 18388,
43
+ "eval_samples_per_second": 1620.567,
44
+ "eval_steps_per_second": 101.352,
45
+ "eval_unc_insert_err_f1": 0.9961218836565098,
46
+ "eval_unc_insert_err_number": 902,
47
+ "eval_unc_insert_err_precision": 0.9955703211517165,
48
+ "eval_unc_insert_err_recall": 0.9966740576496674,
49
+ "eval_weighted_avg_f1": 0.993375440096453,
50
+ "eval_weighted_avg_number": 23096,
51
+ "eval_weighted_avg_precision": 0.9936401344515604,
52
+ "eval_weighted_avg_recall": 0.9931156910287495
53
+ }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cb8de0288b5a6e76feea0bd3fc8fd584ac1e2b3cae7999f2b363d2d1f1869015
3
  size 440204333
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f97a01ef0c9cf5ab55573541c020f69350a7193a786138e1d42112eb77868c8c
3
  size 440204333
runs/Mar02_00-52-19_home-3090/events.out.tfevents.1677698625.home-3090.10497.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f80bf45c97d4bf7f9cd5f5b54374434516b794b4b6e0a1fb5c00b642fd552a87
3
+ size 2994
runs/Mar03_01-20-39_home-3090/1677784859.1870086/events.out.tfevents.1677784859.home-3090.52004.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be276b4ce297fe687e5ab6dc08cbfbc7b8e3ef647e3f55ee0ea58bac5371c68b
3
+ size 5523
runs/Mar03_01-20-39_home-3090/events.out.tfevents.1677784859.home-3090.52004.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00b7d5cc1bc54910f4e653ce177391178c3000bb10858458c2b6da0b017509f4
3
+ size 7325
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 30.0,
3
+ "train_loss": 0.06519987745561462,
4
+ "train_runtime": 1743.5904,
5
+ "train_samples": 18388,
6
+ "train_samples_per_second": 316.382,
7
+ "train_steps_per_second": 9.893
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,1795 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": null,
3
+ "best_model_checkpoint": null,
4
+ "epoch": 30.0,
5
+ "global_step": 17250,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 1.0,
12
+ "learning_rate": 6.666666666666667e-06,
13
+ "loss": 0.7818,
14
+ "step": 575
15
+ },
16
+ {
17
+ "epoch": 1.0,
18
+ "eval_5_err_f1": 0.0,
19
+ "eval_5_err_number": 34,
20
+ "eval_5_err_precision": 0.0,
21
+ "eval_5_err_recall": 0.0,
22
+ "eval___f1": 0.15277177825773938,
23
+ "eval___number": 9934,
24
+ "eval___precision": 0.26820020222446916,
25
+ "eval___recall": 0.1068049124219851,
26
+ "eval__err_f1": 0.0,
27
+ "eval__err_number": 285,
28
+ "eval__err_precision": 0.0,
29
+ "eval__err_recall": 0.0,
30
+ "eval_egin_err_f1": 0.0,
31
+ "eval_egin_err_number": 1126,
32
+ "eval_egin_err_precision": 0.0,
33
+ "eval_egin_err_recall": 0.0,
34
+ "eval_el_err_f1": 0.0,
35
+ "eval_el_err_number": 1380,
36
+ "eval_el_err_precision": 0.0,
37
+ "eval_el_err_recall": 0.0,
38
+ "eval_loss": 0.283189594745636,
39
+ "eval_macro_avg_f1": 0.07410438993859113,
40
+ "eval_macro_avg_number": 23096,
41
+ "eval_macro_avg_precision": 0.11278010170972645,
42
+ "eval_macro_avg_recall": 0.055471991523343506,
43
+ "eval_micro_avg_f1": 0.24431366311436298,
44
+ "eval_micro_avg_number": 23096,
45
+ "eval_micro_avg_precision": 0.4604868689291282,
46
+ "eval_micro_avg_recall": 0.16626255628680292,
47
+ "eval_nd_err_f1": 0.0,
48
+ "eval_nd_err_number": 1188,
49
+ "eval_nd_err_precision": 0.0,
50
+ "eval_nd_err_recall": 0.0,
51
+ "eval_ne_word_err_f1": 0.44006334125098967,
52
+ "eval_ne_word_err_number": 8247,
53
+ "eval_ne_word_err_precision": 0.6340406114533425,
54
+ "eval_ne_word_err_recall": 0.33697101976476296,
55
+ "eval_overall_accuracy": 0.9313016896134979,
56
+ "eval_runtime": 11.4511,
57
+ "eval_samples_per_second": 1605.79,
58
+ "eval_steps_per_second": 100.427,
59
+ "eval_unc_insert_err_f1": 0.0,
60
+ "eval_unc_insert_err_number": 902,
61
+ "eval_unc_insert_err_precision": 0.0,
62
+ "eval_unc_insert_err_recall": 0.0,
63
+ "eval_weighted_avg_f1": 0.22284539402967157,
64
+ "eval_weighted_avg_number": 23096,
65
+ "eval_weighted_avg_precision": 0.3417576087440939,
66
+ "eval_weighted_avg_recall": 0.16626255628680292,
67
+ "step": 575
68
+ },
69
+ {
70
+ "epoch": 2.0,
71
+ "learning_rate": 1.3333333333333333e-05,
72
+ "loss": 0.2475,
73
+ "step": 1150
74
+ },
75
+ {
76
+ "epoch": 2.0,
77
+ "eval_5_err_f1": 0.0,
78
+ "eval_5_err_number": 34,
79
+ "eval_5_err_precision": 0.0,
80
+ "eval_5_err_recall": 0.0,
81
+ "eval___f1": 0.2921747656106379,
82
+ "eval___number": 9934,
83
+ "eval___precision": 0.3733750978856695,
84
+ "eval___recall": 0.2399838936984095,
85
+ "eval__err_f1": 0.0,
86
+ "eval__err_number": 285,
87
+ "eval__err_precision": 0.0,
88
+ "eval__err_recall": 0.0,
89
+ "eval_egin_err_f1": 0.4211180124223602,
90
+ "eval_egin_err_number": 1126,
91
+ "eval_egin_err_precision": 0.7004132231404959,
92
+ "eval_egin_err_recall": 0.30106571936056836,
93
+ "eval_el_err_f1": 0.23684210526315788,
94
+ "eval_el_err_number": 1380,
95
+ "eval_el_err_precision": 0.875,
96
+ "eval_el_err_recall": 0.13695652173913042,
97
+ "eval_loss": 0.1883164346218109,
98
+ "eval_macro_avg_f1": 0.25811167808226654,
99
+ "eval_macro_avg_number": 23096,
100
+ "eval_macro_avg_precision": 0.5382361502619613,
101
+ "eval_macro_avg_recall": 0.2033771848028768,
102
+ "eval_micro_avg_f1": 0.42355211320451314,
103
+ "eval_micro_avg_number": 23096,
104
+ "eval_micro_avg_precision": 0.5558134627558556,
105
+ "eval_micro_avg_recall": 0.3421371666089366,
106
+ "eval_nd_err_f1": 0.49635036496350365,
107
+ "eval_nd_err_number": 1188,
108
+ "eval_nd_err_precision": 0.6520547945205479,
109
+ "eval_nd_err_recall": 0.4006734006734007,
110
+ "eval_ne_word_err_f1": 0.616193336974331,
111
+ "eval_ne_word_err_number": 8247,
112
+ "eval_ne_word_err_precision": 0.7050460865489767,
113
+ "eval_ne_word_err_recall": 0.5472292955013944,
114
+ "eval_overall_accuracy": 0.9455378089528188,
115
+ "eval_runtime": 12.2219,
116
+ "eval_samples_per_second": 1504.512,
117
+ "eval_steps_per_second": 94.093,
118
+ "eval_unc_insert_err_f1": 0.0022148394241417496,
119
+ "eval_unc_insert_err_number": 902,
120
+ "eval_unc_insert_err_precision": 1.0,
121
+ "eval_unc_insert_err_recall": 0.0011086474501108647,
122
+ "eval_weighted_avg_f1": 0.40599643131240637,
123
+ "eval_weighted_avg_number": 23096,
124
+ "eval_weighted_avg_precision": 0.571372951303787,
125
+ "eval_weighted_avg_recall": 0.3421371666089366,
126
+ "step": 1150
127
+ },
128
+ {
129
+ "epoch": 3.0,
130
+ "learning_rate": 2e-05,
131
+ "loss": 0.1897,
132
+ "step": 1725
133
+ },
134
+ {
135
+ "epoch": 3.0,
136
+ "eval_5_err_f1": 0.0,
137
+ "eval_5_err_number": 34,
138
+ "eval_5_err_precision": 0.0,
139
+ "eval_5_err_recall": 0.0,
140
+ "eval___f1": 0.4270756692512309,
141
+ "eval___number": 9934,
142
+ "eval___precision": 0.48778280542986424,
143
+ "eval___recall": 0.379806724380914,
144
+ "eval__err_f1": 0.0,
145
+ "eval__err_number": 285,
146
+ "eval__err_precision": 0.0,
147
+ "eval__err_recall": 0.0,
148
+ "eval_egin_err_f1": 0.6587155963302753,
149
+ "eval_egin_err_number": 1126,
150
+ "eval_egin_err_precision": 0.681214421252372,
151
+ "eval_egin_err_recall": 0.6376554174067496,
152
+ "eval_el_err_f1": 0.39977851605758585,
153
+ "eval_el_err_number": 1380,
154
+ "eval_el_err_precision": 0.8474178403755869,
155
+ "eval_el_err_recall": 0.26159420289855073,
156
+ "eval_loss": 0.1407451629638672,
157
+ "eval_macro_avg_f1": 0.393737200401998,
158
+ "eval_macro_avg_number": 23096,
159
+ "eval_macro_avg_precision": 0.4998071399685999,
160
+ "eval_macro_avg_recall": 0.3484017162866866,
161
+ "eval_micro_avg_f1": 0.5544212726654028,
162
+ "eval_micro_avg_number": 23096,
163
+ "eval_micro_avg_precision": 0.6319960101961654,
164
+ "eval_micro_avg_recall": 0.4938084516799446,
165
+ "eval_nd_err_f1": 0.6383909051158723,
166
+ "eval_nd_err_number": 1188,
167
+ "eval_nd_err_precision": 0.6642402183803457,
168
+ "eval_nd_err_recall": 0.6144781144781145,
169
+ "eval_ne_word_err_f1": 0.7204706785188976,
170
+ "eval_ne_word_err_number": 8247,
171
+ "eval_ne_word_err_precision": 0.7622462787550744,
172
+ "eval_ne_word_err_recall": 0.6830362556080999,
173
+ "eval_overall_accuracy": 0.9567288324367876,
174
+ "eval_runtime": 11.5134,
175
+ "eval_samples_per_second": 1597.097,
176
+ "eval_steps_per_second": 99.884,
177
+ "eval_unc_insert_err_f1": 0.3054662379421222,
178
+ "eval_unc_insert_err_number": 902,
179
+ "eval_unc_insert_err_precision": 0.5555555555555556,
180
+ "eval_unc_insert_err_recall": 0.2106430155210643,
181
+ "eval_weighted_avg_f1": 0.541723174559053,
182
+ "eval_weighted_avg_number": 23096,
183
+ "eval_weighted_avg_precision": 0.6216917214508492,
184
+ "eval_weighted_avg_recall": 0.4938084516799446,
185
+ "step": 1725
186
+ },
187
+ {
188
+ "epoch": 4.0,
189
+ "learning_rate": 1.925925925925926e-05,
190
+ "loss": 0.1506,
191
+ "step": 2300
192
+ },
193
+ {
194
+ "epoch": 4.0,
195
+ "eval_5_err_f1": 0.0,
196
+ "eval_5_err_number": 34,
197
+ "eval_5_err_precision": 0.0,
198
+ "eval_5_err_recall": 0.0,
199
+ "eval___f1": 0.5822524859489839,
200
+ "eval___number": 9934,
201
+ "eval___precision": 0.6285880980163361,
202
+ "eval___recall": 0.5422790416750554,
203
+ "eval__err_f1": 0.10526315789473685,
204
+ "eval__err_number": 285,
205
+ "eval__err_precision": 0.8421052631578947,
206
+ "eval__err_recall": 0.056140350877192984,
207
+ "eval_egin_err_f1": 0.7867298578199051,
208
+ "eval_egin_err_number": 1126,
209
+ "eval_egin_err_precision": 0.8434959349593496,
210
+ "eval_egin_err_recall": 0.7371225577264654,
211
+ "eval_el_err_f1": 0.5848513902205178,
212
+ "eval_el_err_number": 1380,
213
+ "eval_el_err_precision": 0.8640226628895185,
214
+ "eval_el_err_recall": 0.4420289855072464,
215
+ "eval_loss": 0.10146419703960419,
216
+ "eval_macro_avg_f1": 0.5028590528776729,
217
+ "eval_macro_avg_number": 23096,
218
+ "eval_macro_avg_precision": 0.6915397433751863,
219
+ "eval_macro_avg_recall": 0.4461313799008184,
220
+ "eval_micro_avg_f1": 0.6814043606144078,
221
+ "eval_micro_avg_number": 23096,
222
+ "eval_micro_avg_precision": 0.7392867997163408,
223
+ "eval_micro_avg_recall": 0.6319276065119501,
224
+ "eval_nd_err_f1": 0.7756925826630922,
225
+ "eval_nd_err_number": 1188,
226
+ "eval_nd_err_precision": 0.8266666666666667,
227
+ "eval_nd_err_recall": 0.7306397306397306,
228
+ "eval_ne_word_err_f1": 0.8148148148148148,
229
+ "eval_ne_word_err_number": 8247,
230
+ "eval_ne_word_err_precision": 0.8228239366963402,
231
+ "eval_ne_word_err_recall": 0.8069601067054687,
232
+ "eval_overall_accuracy": 0.9701177753027322,
233
+ "eval_runtime": 11.6132,
234
+ "eval_samples_per_second": 1583.375,
235
+ "eval_steps_per_second": 99.026,
236
+ "eval_unc_insert_err_f1": 0.37326813365933176,
237
+ "eval_unc_insert_err_number": 902,
238
+ "eval_unc_insert_err_precision": 0.7046153846153846,
239
+ "eval_unc_insert_err_recall": 0.25388026607538805,
240
+ "eval_weighted_avg_f1": 0.6704640351735791,
241
+ "eval_weighted_avg_number": 23096,
242
+ "eval_weighted_avg_precision": 0.7373568559968757,
243
+ "eval_weighted_avg_recall": 0.6319276065119501,
244
+ "step": 2300
245
+ },
246
+ {
247
+ "epoch": 5.0,
248
+ "learning_rate": 1.851851851851852e-05,
249
+ "loss": 0.1156,
250
+ "step": 2875
251
+ },
252
+ {
253
+ "epoch": 5.0,
254
+ "eval_5_err_f1": 0.0,
255
+ "eval_5_err_number": 34,
256
+ "eval_5_err_precision": 0.0,
257
+ "eval_5_err_recall": 0.0,
258
+ "eval___f1": 0.7171141287446875,
259
+ "eval___number": 9934,
260
+ "eval___precision": 0.7391025641025641,
261
+ "eval___recall": 0.6963962150191262,
262
+ "eval__err_f1": 0.3314917127071823,
263
+ "eval__err_number": 285,
264
+ "eval__err_precision": 0.7792207792207793,
265
+ "eval__err_recall": 0.21052631578947367,
266
+ "eval_egin_err_f1": 0.853273137697517,
267
+ "eval_egin_err_number": 1126,
268
+ "eval_egin_err_precision": 0.8677685950413223,
269
+ "eval_egin_err_recall": 0.8392539964476021,
270
+ "eval_el_err_f1": 0.7756132756132756,
271
+ "eval_el_err_number": 1380,
272
+ "eval_el_err_precision": 0.7722701149425287,
273
+ "eval_el_err_recall": 0.7789855072463768,
274
+ "eval_loss": 0.07168415188789368,
275
+ "eval_macro_avg_f1": 0.6164482191003791,
276
+ "eval_macro_avg_number": 23096,
277
+ "eval_macro_avg_precision": 0.7024262910397409,
278
+ "eval_macro_avg_recall": 0.5800476084892296,
279
+ "eval_micro_avg_f1": 0.7831352220931272,
280
+ "eval_micro_avg_number": 23096,
281
+ "eval_micro_avg_precision": 0.8090951061865189,
282
+ "eval_micro_avg_recall": 0.7587894007620367,
283
+ "eval_nd_err_f1": 0.841511072514112,
284
+ "eval_nd_err_number": 1188,
285
+ "eval_nd_err_precision": 0.8690582959641255,
286
+ "eval_nd_err_recall": 0.8156565656565656,
287
+ "eval_ne_word_err_f1": 0.8785149788641794,
288
+ "eval_ne_word_err_number": 8247,
289
+ "eval_ne_word_err_precision": 0.887815750371471,
290
+ "eval_ne_word_err_recall": 0.869407057111677,
291
+ "eval_overall_accuracy": 0.9797270077489988,
292
+ "eval_runtime": 11.582,
293
+ "eval_samples_per_second": 1587.637,
294
+ "eval_steps_per_second": 99.292,
295
+ "eval_unc_insert_err_f1": 0.5340674466620785,
296
+ "eval_unc_insert_err_number": 902,
297
+ "eval_unc_insert_err_precision": 0.7041742286751361,
298
+ "eval_unc_insert_err_recall": 0.43015521064301554,
299
+ "eval_weighted_avg_f1": 0.7783155433059336,
300
+ "eval_weighted_avg_number": 23096,
301
+ "eval_weighted_avg_precision": 0.8051864346074598,
302
+ "eval_weighted_avg_recall": 0.7587894007620367,
303
+ "step": 2875
304
+ },
305
+ {
306
+ "epoch": 6.0,
307
+ "learning_rate": 1.7777777777777777e-05,
308
+ "loss": 0.0872,
309
+ "step": 3450
310
+ },
311
+ {
312
+ "epoch": 6.0,
313
+ "eval_5_err_f1": 0.0,
314
+ "eval_5_err_number": 34,
315
+ "eval_5_err_precision": 0.0,
316
+ "eval_5_err_recall": 0.0,
317
+ "eval___f1": 0.8336382113821139,
318
+ "eval___number": 9934,
319
+ "eval___precision": 0.8416786373896984,
320
+ "eval___recall": 0.8257499496678076,
321
+ "eval__err_f1": 0.5062034739454094,
322
+ "eval__err_number": 285,
323
+ "eval__err_precision": 0.864406779661017,
324
+ "eval__err_recall": 0.35789473684210527,
325
+ "eval_egin_err_f1": 0.8927116342236305,
326
+ "eval_egin_err_number": 1126,
327
+ "eval_egin_err_precision": 0.9104339796860572,
328
+ "eval_egin_err_recall": 0.8756660746003553,
329
+ "eval_el_err_f1": 0.8574585635359115,
330
+ "eval_el_err_number": 1380,
331
+ "eval_el_err_precision": 0.8719101123595505,
332
+ "eval_el_err_recall": 0.8434782608695652,
333
+ "eval_loss": 0.048479896038770676,
334
+ "eval_macro_avg_f1": 0.7046115753196951,
335
+ "eval_macro_avg_number": 23096,
336
+ "eval_macro_avg_precision": 0.7584152991122148,
337
+ "eval_macro_avg_recall": 0.677463811561773,
338
+ "eval_micro_avg_f1": 0.8668196219818638,
339
+ "eval_micro_avg_number": 23096,
340
+ "eval_micro_avg_precision": 0.8749834575852485,
341
+ "eval_micro_avg_recall": 0.8588067197783166,
342
+ "eval_nd_err_f1": 0.8641655886157827,
343
+ "eval_nd_err_number": 1188,
344
+ "eval_nd_err_precision": 0.8859416445623343,
345
+ "eval_nd_err_recall": 0.8434343434343434,
346
+ "eval_ne_word_err_f1": 0.9267559935107854,
347
+ "eval_ne_word_err_number": 8247,
348
+ "eval_ne_word_err_precision": 0.918532634587899,
349
+ "eval_ne_word_err_recall": 0.935127925306172,
350
+ "eval_overall_accuracy": 0.9874049148084078,
351
+ "eval_runtime": 11.5539,
352
+ "eval_samples_per_second": 1591.493,
353
+ "eval_steps_per_second": 99.533,
354
+ "eval_unc_insert_err_f1": 0.7559591373439274,
355
+ "eval_unc_insert_err_number": 902,
356
+ "eval_unc_insert_err_precision": 0.7744186046511627,
357
+ "eval_unc_insert_err_recall": 0.738359201773836,
358
+ "eval_weighted_avg_f1": 0.8644603671372942,
359
+ "eval_weighted_avg_number": 23096,
360
+ "eval_weighted_avg_precision": 0.872971035018927,
361
+ "eval_weighted_avg_recall": 0.8588067197783166,
362
+ "step": 3450
363
+ },
364
+ {
365
+ "epoch": 7.0,
366
+ "learning_rate": 1.7037037037037038e-05,
367
+ "loss": 0.0675,
368
+ "step": 4025
369
+ },
370
+ {
371
+ "epoch": 7.0,
372
+ "eval_5_err_f1": 0.0,
373
+ "eval_5_err_number": 34,
374
+ "eval_5_err_precision": 0.0,
375
+ "eval_5_err_recall": 0.0,
376
+ "eval___f1": 0.8946004977904202,
377
+ "eval___number": 9934,
378
+ "eval___precision": 0.9029016712806316,
379
+ "eval___recall": 0.8864505737869942,
380
+ "eval__err_f1": 0.6258503401360545,
381
+ "eval__err_number": 285,
382
+ "eval__err_precision": 0.8846153846153846,
383
+ "eval__err_recall": 0.4842105263157895,
384
+ "eval_egin_err_f1": 0.8920105355575065,
385
+ "eval_egin_err_number": 1126,
386
+ "eval_egin_err_precision": 0.8819444444444444,
387
+ "eval_egin_err_recall": 0.9023090586145648,
388
+ "eval_el_err_f1": 0.8992424242424242,
389
+ "eval_el_err_number": 1380,
390
+ "eval_el_err_precision": 0.942063492063492,
391
+ "eval_el_err_recall": 0.8601449275362318,
392
+ "eval_loss": 0.035397969186306,
393
+ "eval_macro_avg_f1": 0.7470366372560805,
394
+ "eval_macro_avg_number": 23096,
395
+ "eval_macro_avg_precision": 0.7838431031789916,
396
+ "eval_macro_avg_recall": 0.7255447092342178,
397
+ "eval_micro_avg_f1": 0.9088604829017808,
398
+ "eval_micro_avg_number": 23096,
399
+ "eval_micro_avg_precision": 0.9174202655608982,
400
+ "eval_micro_avg_recall": 0.9004589539314167,
401
+ "eval_nd_err_f1": 0.8717948717948718,
402
+ "eval_nd_err_number": 1188,
403
+ "eval_nd_err_precision": 0.8854166666666666,
404
+ "eval_nd_err_recall": 0.8585858585858586,
405
+ "eval_ne_word_err_f1": 0.9520577004666949,
406
+ "eval_ne_word_err_number": 8247,
407
+ "eval_ne_word_err_precision": 0.9517692680562287,
408
+ "eval_ne_word_err_recall": 0.9523463077482721,
409
+ "eval_overall_accuracy": 0.9913860518021754,
410
+ "eval_runtime": 11.6281,
411
+ "eval_samples_per_second": 1581.339,
412
+ "eval_steps_per_second": 98.898,
413
+ "eval_unc_insert_err_f1": 0.8407367280606717,
414
+ "eval_unc_insert_err_number": 902,
415
+ "eval_unc_insert_err_precision": 0.8220338983050848,
416
+ "eval_unc_insert_err_recall": 0.8603104212860311,
417
+ "eval_weighted_avg_f1": 0.9073581482781856,
418
+ "eval_weighted_avg_number": 23096,
419
+ "eval_weighted_avg_precision": 0.9160568228498506,
420
+ "eval_weighted_avg_recall": 0.9004589539314167,
421
+ "step": 4025
422
+ },
423
+ {
424
+ "epoch": 8.0,
425
+ "learning_rate": 1.6296296296296297e-05,
426
+ "loss": 0.0532,
427
+ "step": 4600
428
+ },
429
+ {
430
+ "epoch": 8.0,
431
+ "eval_5_err_f1": 0.0,
432
+ "eval_5_err_number": 34,
433
+ "eval_5_err_precision": 0.0,
434
+ "eval_5_err_recall": 0.0,
435
+ "eval___f1": 0.9236796580848683,
436
+ "eval___number": 9934,
437
+ "eval___precision": 0.9338477366255145,
438
+ "eval___recall": 0.913730622105899,
439
+ "eval__err_f1": 0.7455621301775148,
440
+ "eval__err_number": 285,
441
+ "eval__err_precision": 0.8513513513513513,
442
+ "eval__err_recall": 0.6631578947368421,
443
+ "eval_egin_err_f1": 0.929652715939448,
444
+ "eval_egin_err_number": 1126,
445
+ "eval_egin_err_precision": 0.9321428571428572,
446
+ "eval_egin_err_recall": 0.9271758436944938,
447
+ "eval_el_err_f1": 0.9120669965740388,
448
+ "eval_el_err_number": 1380,
449
+ "eval_el_err_precision": 0.9607056936647955,
450
+ "eval_el_err_recall": 0.8681159420289855,
451
+ "eval_loss": 0.02567952871322632,
452
+ "eval_macro_avg_f1": 0.7841691959478824,
453
+ "eval_macro_avg_number": 23096,
454
+ "eval_macro_avg_precision": 0.805945865713128,
455
+ "eval_macro_avg_recall": 0.7659910981441609,
456
+ "eval_micro_avg_f1": 0.9342174369747899,
457
+ "eval_micro_avg_number": 23096,
458
+ "eval_micro_avg_precision": 0.9444690265486726,
459
+ "eval_micro_avg_recall": 0.9241860062348458,
460
+ "eval_nd_err_f1": 0.8971404182671789,
461
+ "eval_nd_err_number": 1188,
462
+ "eval_nd_err_precision": 0.90995670995671,
463
+ "eval_nd_err_recall": 0.8846801346801347,
464
+ "eval_ne_word_err_f1": 0.9680553868577675,
465
+ "eval_ne_word_err_number": 8247,
466
+ "eval_ne_word_err_precision": 0.9697043435941112,
467
+ "eval_ne_word_err_recall": 0.9664120286164666,
468
+ "eval_overall_accuracy": 0.9938387165572644,
469
+ "eval_runtime": 11.5399,
470
+ "eval_samples_per_second": 1593.424,
471
+ "eval_steps_per_second": 99.654,
472
+ "eval_unc_insert_err_f1": 0.897196261682243,
473
+ "eval_unc_insert_err_number": 902,
474
+ "eval_unc_insert_err_precision": 0.8898582333696837,
475
+ "eval_unc_insert_err_recall": 0.9046563192904656,
476
+ "eval_weighted_avg_f1": 0.9331653517617972,
477
+ "eval_weighted_avg_number": 23096,
478
+ "eval_weighted_avg_precision": 0.9428332908175411,
479
+ "eval_weighted_avg_recall": 0.9241860062348458,
480
+ "step": 4600
481
+ },
482
+ {
483
+ "epoch": 9.0,
484
+ "learning_rate": 1.555555555555556e-05,
485
+ "loss": 0.0418,
486
+ "step": 5175
487
+ },
488
+ {
489
+ "epoch": 9.0,
490
+ "eval_5_err_f1": 0.0,
491
+ "eval_5_err_number": 34,
492
+ "eval_5_err_precision": 0.0,
493
+ "eval_5_err_recall": 0.0,
494
+ "eval___f1": 0.9510765187506318,
495
+ "eval___number": 9934,
496
+ "eval___precision": 0.9550345107592367,
497
+ "eval___recall": 0.9471511979061807,
498
+ "eval__err_f1": 0.8208955223880597,
499
+ "eval__err_number": 285,
500
+ "eval__err_precision": 0.8764940239043825,
501
+ "eval__err_recall": 0.7719298245614035,
502
+ "eval_egin_err_f1": 0.9310954063604241,
503
+ "eval_egin_err_number": 1126,
504
+ "eval_egin_err_precision": 0.9261862917398945,
505
+ "eval_egin_err_recall": 0.9360568383658969,
506
+ "eval_el_err_f1": 0.9391495601173021,
507
+ "eval_el_err_number": 1380,
508
+ "eval_el_err_precision": 0.9502967359050445,
509
+ "eval_el_err_recall": 0.9282608695652174,
510
+ "eval_loss": 0.01935717649757862,
511
+ "eval_macro_avg_f1": 0.8072644057238675,
512
+ "eval_macro_avg_number": 23096,
513
+ "eval_macro_avg_precision": 0.8132706801082134,
514
+ "eval_macro_avg_recall": 0.8022721637436516,
515
+ "eval_micro_avg_f1": 0.9534545296583481,
516
+ "eval_micro_avg_number": 23096,
517
+ "eval_micro_avg_precision": 0.9565918500762693,
518
+ "eval_micro_avg_recall": 0.9503377208174576,
519
+ "eval_nd_err_f1": 0.9040980143641741,
520
+ "eval_nd_err_number": 1188,
521
+ "eval_nd_err_precision": 0.90754877014419,
522
+ "eval_nd_err_recall": 0.9006734006734006,
523
+ "eval_ne_word_err_f1": 0.9772410026096984,
524
+ "eval_ne_word_err_number": 8247,
525
+ "eval_ne_word_err_precision": 0.9782503037667072,
526
+ "eval_ne_word_err_recall": 0.9762337819813266,
527
+ "eval_overall_accuracy": 0.9954619777719851,
528
+ "eval_runtime": 11.5934,
529
+ "eval_samples_per_second": 1586.069,
530
+ "eval_steps_per_second": 99.194,
531
+ "eval_unc_insert_err_f1": 0.934559221200649,
532
+ "eval_unc_insert_err_number": 902,
533
+ "eval_unc_insert_err_precision": 0.9123548046462513,
534
+ "eval_unc_insert_err_recall": 0.9578713968957872,
535
+ "eval_weighted_avg_f1": 0.9526643829573475,
536
+ "eval_weighted_avg_number": 23096,
537
+ "eval_weighted_avg_precision": 0.9551502907269372,
538
+ "eval_weighted_avg_recall": 0.9503377208174576,
539
+ "step": 5175
540
+ },
541
+ {
542
+ "epoch": 10.0,
543
+ "learning_rate": 1.4814814814814815e-05,
544
+ "loss": 0.0329,
545
+ "step": 5750
546
+ },
547
+ {
548
+ "epoch": 10.0,
549
+ "eval_5_err_f1": 0.0,
550
+ "eval_5_err_number": 34,
551
+ "eval_5_err_precision": 0.0,
552
+ "eval_5_err_recall": 0.0,
553
+ "eval___f1": 0.9608594774538484,
554
+ "eval___number": 9934,
555
+ "eval___precision": 0.9628993125758188,
556
+ "eval___recall": 0.9588282665592913,
557
+ "eval__err_f1": 0.8358208955223881,
558
+ "eval__err_number": 285,
559
+ "eval__err_precision": 0.7924528301886793,
560
+ "eval__err_recall": 0.8842105263157894,
561
+ "eval_egin_err_f1": 0.9470899470899471,
562
+ "eval_egin_err_number": 1126,
563
+ "eval_egin_err_precision": 0.9404553415061296,
564
+ "eval_egin_err_recall": 0.9538188277087034,
565
+ "eval_el_err_f1": 0.9549150036954914,
566
+ "eval_el_err_number": 1380,
567
+ "eval_el_err_precision": 0.9743589743589743,
568
+ "eval_el_err_recall": 0.936231884057971,
569
+ "eval_loss": 0.015092139132320881,
570
+ "eval_macro_avg_f1": 0.8193214504048429,
571
+ "eval_macro_avg_number": 23096,
572
+ "eval_macro_avg_precision": 0.8139063162203923,
573
+ "eval_macro_avg_recall": 0.8255497795620286,
574
+ "eval_micro_avg_f1": 0.961947919602784,
575
+ "eval_micro_avg_number": 23096,
576
+ "eval_micro_avg_precision": 0.9634310532030401,
577
+ "eval_micro_avg_recall": 0.9604693453411847,
578
+ "eval_nd_err_f1": 0.9224936815501265,
579
+ "eval_nd_err_number": 1188,
580
+ "eval_nd_err_precision": 0.9232715008431703,
581
+ "eval_nd_err_recall": 0.9217171717171717,
582
+ "eval_ne_word_err_f1": 0.9796636921022278,
583
+ "eval_ne_word_err_number": 8247,
584
+ "eval_ne_word_err_precision": 0.9809141745684415,
585
+ "eval_ne_word_err_recall": 0.9784163938401843,
586
+ "eval_overall_accuracy": 0.9963387758003744,
587
+ "eval_runtime": 11.5919,
588
+ "eval_samples_per_second": 1586.275,
589
+ "eval_steps_per_second": 99.207,
590
+ "eval_unc_insert_err_f1": 0.9537289058247141,
591
+ "eval_unc_insert_err_number": 902,
592
+ "eval_unc_insert_err_precision": 0.9368983957219251,
593
+ "eval_unc_insert_err_recall": 0.9711751662971175,
594
+ "eval_weighted_avg_f1": 0.9613381289087282,
595
+ "eval_weighted_avg_number": 23096,
596
+ "eval_weighted_avg_precision": 0.9623478966267772,
597
+ "eval_weighted_avg_recall": 0.9604693453411847,
598
+ "step": 5750
599
+ },
600
+ {
601
+ "epoch": 11.0,
602
+ "learning_rate": 1.4074074074074075e-05,
603
+ "loss": 0.027,
604
+ "step": 6325
605
+ },
606
+ {
607
+ "epoch": 11.0,
608
+ "eval_5_err_f1": 0.0,
609
+ "eval_5_err_number": 34,
610
+ "eval_5_err_precision": 0.0,
611
+ "eval_5_err_recall": 0.0,
612
+ "eval___f1": 0.9646227605349483,
613
+ "eval___number": 9934,
614
+ "eval___precision": 0.9672097965792936,
615
+ "eval___recall": 0.9620495268773908,
616
+ "eval__err_f1": 0.8822495606326889,
617
+ "eval__err_number": 285,
618
+ "eval__err_precision": 0.8838028169014085,
619
+ "eval__err_recall": 0.8807017543859649,
620
+ "eval_egin_err_f1": 0.9626998223801065,
621
+ "eval_egin_err_number": 1126,
622
+ "eval_egin_err_precision": 0.9626998223801065,
623
+ "eval_egin_err_recall": 0.9626998223801065,
624
+ "eval_el_err_f1": 0.9632623071271125,
625
+ "eval_el_err_number": 1380,
626
+ "eval_el_err_precision": 0.9769001490312966,
627
+ "eval_el_err_recall": 0.95,
628
+ "eval_loss": 0.012891112826764584,
629
+ "eval_macro_avg_f1": 0.8290086444888856,
630
+ "eval_macro_avg_number": 23096,
631
+ "eval_macro_avg_precision": 0.8267544902067143,
632
+ "eval_macro_avg_recall": 0.8317541650077346,
633
+ "eval_micro_avg_f1": 0.967199947901969,
634
+ "eval_micro_avg_number": 23096,
635
+ "eval_micro_avg_precision": 0.9698315267075879,
636
+ "eval_micro_avg_recall": 0.964582611707655,
637
+ "eval_nd_err_f1": 0.9370277078085643,
638
+ "eval_nd_err_number": 1188,
639
+ "eval_nd_err_precision": 0.9346733668341709,
640
+ "eval_nd_err_recall": 0.9393939393939394,
641
+ "eval_ne_word_err_f1": 0.9842759629449049,
642
+ "eval_ne_word_err_number": 8247,
643
+ "eval_ne_word_err_precision": 0.989462075726014,
644
+ "eval_ne_word_err_recall": 0.9791439311264702,
645
+ "eval_overall_accuracy": 0.9968541908576033,
646
+ "eval_runtime": 11.5138,
647
+ "eval_samples_per_second": 1597.044,
648
+ "eval_steps_per_second": 99.88,
649
+ "eval_unc_insert_err_f1": 0.9379310344827587,
650
+ "eval_unc_insert_err_number": 902,
651
+ "eval_unc_insert_err_precision": 0.8992878942014242,
652
+ "eval_unc_insert_err_recall": 0.9800443458980045,
653
+ "eval_weighted_avg_f1": 0.9665670327397197,
654
+ "eval_weighted_avg_number": 23096,
655
+ "eval_weighted_avg_precision": 0.9687353440673672,
656
+ "eval_weighted_avg_recall": 0.964582611707655,
657
+ "step": 6325
658
+ },
659
+ {
660
+ "epoch": 12.0,
661
+ "learning_rate": 1.3333333333333333e-05,
662
+ "loss": 0.0228,
663
+ "step": 6900
664
+ },
665
+ {
666
+ "epoch": 12.0,
667
+ "eval_5_err_f1": 0.05714285714285715,
668
+ "eval_5_err_number": 34,
669
+ "eval_5_err_precision": 1.0,
670
+ "eval_5_err_recall": 0.029411764705882353,
671
+ "eval___f1": 0.9747602221100454,
672
+ "eval___number": 9934,
673
+ "eval___precision": 0.9776225192385581,
674
+ "eval___recall": 0.9719146366015704,
675
+ "eval__err_f1": 0.9033391915641477,
676
+ "eval__err_number": 285,
677
+ "eval__err_precision": 0.9049295774647887,
678
+ "eval__err_recall": 0.9017543859649123,
679
+ "eval_egin_err_f1": 0.957931638913234,
680
+ "eval_egin_err_number": 1126,
681
+ "eval_egin_err_precision": 0.9455017301038062,
682
+ "eval_egin_err_recall": 0.9706927175843695,
683
+ "eval_el_err_f1": 0.9700292397660818,
684
+ "eval_el_err_number": 1380,
685
+ "eval_el_err_precision": 0.9786135693215339,
686
+ "eval_el_err_recall": 0.9615942028985507,
687
+ "eval_loss": 0.00973260123282671,
688
+ "eval_macro_avg_f1": 0.8465241770192731,
689
+ "eval_macro_avg_number": 23096,
690
+ "eval_macro_avg_precision": 0.9626461351075175,
691
+ "eval_macro_avg_recall": 0.8448949158929412,
692
+ "eval_micro_avg_f1": 0.9757070969980912,
693
+ "eval_micro_avg_number": 23096,
694
+ "eval_micro_avg_precision": 0.9775730180806675,
695
+ "eval_micro_avg_recall": 0.9738482854173883,
696
+ "eval_nd_err_f1": 0.9432387312186977,
697
+ "eval_nd_err_number": 1188,
698
+ "eval_nd_err_precision": 0.9354304635761589,
699
+ "eval_nd_err_recall": 0.9511784511784511,
700
+ "eval_ne_word_err_f1": 0.989364934670313,
701
+ "eval_ne_word_err_number": 8247,
702
+ "eval_ne_word_err_precision": 0.9917153996101364,
703
+ "eval_ne_word_err_recall": 0.9870255850612344,
704
+ "eval_overall_accuracy": 0.9976184269769426,
705
+ "eval_runtime": 11.5829,
706
+ "eval_samples_per_second": 1587.51,
707
+ "eval_steps_per_second": 99.284,
708
+ "eval_unc_insert_err_f1": 0.9763866007688083,
709
+ "eval_unc_insert_err_number": 902,
710
+ "eval_unc_insert_err_precision": 0.9673558215451578,
711
+ "eval_unc_insert_err_recall": 0.9855875831485588,
712
+ "eval_weighted_avg_f1": 0.9750820441756441,
713
+ "eval_weighted_avg_number": 23096,
714
+ "eval_weighted_avg_precision": 0.9777126754330147,
715
+ "eval_weighted_avg_recall": 0.9738482854173883,
716
+ "step": 6900
717
+ },
718
+ {
719
+ "epoch": 13.0,
720
+ "learning_rate": 1.2592592592592593e-05,
721
+ "loss": 0.0187,
722
+ "step": 7475
723
+ },
724
+ {
725
+ "epoch": 13.0,
726
+ "eval_5_err_f1": 0.1111111111111111,
727
+ "eval_5_err_number": 34,
728
+ "eval_5_err_precision": 1.0,
729
+ "eval_5_err_recall": 0.058823529411764705,
730
+ "eval___f1": 0.9772773177135933,
731
+ "eval___number": 9934,
732
+ "eval___precision": 0.9804457953394123,
733
+ "eval___recall": 0.9741292530702638,
734
+ "eval__err_f1": 0.9159212880143113,
735
+ "eval__err_number": 285,
736
+ "eval__err_precision": 0.9343065693430657,
737
+ "eval__err_recall": 0.8982456140350877,
738
+ "eval_egin_err_f1": 0.9725420726306466,
739
+ "eval_egin_err_number": 1126,
740
+ "eval_egin_err_precision": 0.9699646643109541,
741
+ "eval_egin_err_recall": 0.9751332149200711,
742
+ "eval_el_err_f1": 0.9773391812865497,
743
+ "eval_el_err_number": 1380,
744
+ "eval_el_err_precision": 0.9859882005899705,
745
+ "eval_el_err_recall": 0.9688405797101449,
746
+ "eval_loss": 0.00791421253234148,
747
+ "eval_macro_avg_f1": 0.860476059382429,
748
+ "eval_macro_avg_number": 23096,
749
+ "eval_macro_avg_precision": 0.9740798854231898,
750
+ "eval_macro_avg_recall": 0.8515739437144252,
751
+ "eval_micro_avg_f1": 0.9794606800121586,
752
+ "eval_micro_avg_number": 23096,
753
+ "eval_micro_avg_precision": 0.9823186133612055,
754
+ "eval_micro_avg_recall": 0.9766193280221683,
755
+ "eval_nd_err_f1": 0.9596977329974811,
756
+ "eval_nd_err_number": 1188,
757
+ "eval_nd_err_precision": 0.957286432160804,
758
+ "eval_nd_err_recall": 0.9621212121212122,
759
+ "eval_ne_word_err_f1": 0.9902830074092069,
760
+ "eval_ne_word_err_number": 8247,
761
+ "eval_ne_word_err_precision": 0.991969826012897,
762
+ "eval_ne_word_err_recall": 0.9886019158481872,
763
+ "eval_overall_accuracy": 0.9980627503021399,
764
+ "eval_runtime": 11.6079,
765
+ "eval_samples_per_second": 1584.097,
766
+ "eval_steps_per_second": 99.071,
767
+ "eval_unc_insert_err_f1": 0.9796367638965328,
768
+ "eval_unc_insert_err_number": 902,
769
+ "eval_unc_insert_err_precision": 0.9726775956284153,
770
+ "eval_unc_insert_err_recall": 0.9866962305986696,
771
+ "eval_weighted_avg_f1": 0.9788498394927975,
772
+ "eval_weighted_avg_number": 23096,
773
+ "eval_weighted_avg_precision": 0.9823457074725067,
774
+ "eval_weighted_avg_recall": 0.9766193280221683,
775
+ "step": 7475
776
+ },
777
+ {
778
+ "epoch": 14.0,
779
+ "learning_rate": 1.1851851851851852e-05,
780
+ "loss": 0.0164,
781
+ "step": 8050
782
+ },
783
+ {
784
+ "epoch": 14.0,
785
+ "eval_5_err_f1": 0.21052631578947367,
786
+ "eval_5_err_number": 34,
787
+ "eval_5_err_precision": 1.0,
788
+ "eval_5_err_recall": 0.11764705882352941,
789
+ "eval___f1": 0.9825428859737638,
790
+ "eval___number": 9934,
791
+ "eval___precision": 0.9849281812664374,
792
+ "eval___recall": 0.9801691161667002,
793
+ "eval__err_f1": 0.9261261261261261,
794
+ "eval__err_number": 285,
795
+ "eval__err_precision": 0.9518518518518518,
796
+ "eval__err_recall": 0.9017543859649123,
797
+ "eval_egin_err_f1": 0.9721362229102167,
798
+ "eval_egin_err_number": 1126,
799
+ "eval_egin_err_precision": 0.9682819383259912,
800
+ "eval_egin_err_recall": 0.9760213143872114,
801
+ "eval_el_err_f1": 0.9807762060210373,
802
+ "eval_el_err_number": 1380,
803
+ "eval_el_err_precision": 0.9818445896877269,
804
+ "eval_el_err_recall": 0.9797101449275363,
805
+ "eval_loss": 0.006334466394037008,
806
+ "eval_macro_avg_f1": 0.876297239717871,
807
+ "eval_macro_avg_number": 23096,
808
+ "eval_macro_avg_precision": 0.9777358109471072,
809
+ "eval_macro_avg_recall": 0.8621140989407539,
810
+ "eval_micro_avg_f1": 0.9830074437379284,
811
+ "eval_micro_avg_number": 23096,
812
+ "eval_micro_avg_precision": 0.9854240090501675,
813
+ "eval_micro_avg_recall": 0.9806027017665396,
814
+ "eval_nd_err_f1": 0.9622799664710813,
815
+ "eval_nd_err_number": 1188,
816
+ "eval_nd_err_precision": 0.9582637729549248,
817
+ "eval_nd_err_recall": 0.9663299663299664,
818
+ "eval_ne_word_err_f1": 0.9920388939532057,
819
+ "eval_ne_word_err_number": 8247,
820
+ "eval_ne_word_err_precision": 0.9943957115009746,
821
+ "eval_ne_word_err_recall": 0.9896932217776161,
822
+ "eval_overall_accuracy": 0.9983589658522714,
823
+ "eval_runtime": 11.6047,
824
+ "eval_samples_per_second": 1584.53,
825
+ "eval_steps_per_second": 99.098,
826
+ "eval_unc_insert_err_f1": 0.9839513004980631,
827
+ "eval_unc_insert_err_number": 902,
828
+ "eval_unc_insert_err_precision": 0.9823204419889503,
829
+ "eval_unc_insert_err_recall": 0.9855875831485588,
830
+ "eval_weighted_avg_f1": 0.9825008162842519,
831
+ "eval_weighted_avg_number": 23096,
832
+ "eval_weighted_avg_precision": 0.9854536352829805,
833
+ "eval_weighted_avg_recall": 0.9806027017665396,
834
+ "step": 8050
835
+ },
836
+ {
837
+ "epoch": 15.0,
838
+ "learning_rate": 1.1111111111111113e-05,
839
+ "loss": 0.014,
840
+ "step": 8625
841
+ },
842
+ {
843
+ "epoch": 15.0,
844
+ "eval_5_err_f1": 0.45454545454545453,
845
+ "eval_5_err_number": 34,
846
+ "eval_5_err_precision": 1.0,
847
+ "eval_5_err_recall": 0.29411764705882354,
848
+ "eval___f1": 0.9852837415583107,
849
+ "eval___number": 9934,
850
+ "eval___precision": 0.9865765038352846,
851
+ "eval___recall": 0.9839943627944433,
852
+ "eval__err_f1": 0.9288135593220339,
853
+ "eval__err_number": 285,
854
+ "eval__err_precision": 0.898360655737705,
855
+ "eval__err_recall": 0.9614035087719298,
856
+ "eval_egin_err_f1": 0.9774635439681837,
857
+ "eval_egin_err_number": 1126,
858
+ "eval_egin_err_precision": 0.9727352682497801,
859
+ "eval_egin_err_recall": 0.9822380106571936,
860
+ "eval_el_err_f1": 0.9829524845846935,
861
+ "eval_el_err_number": 1380,
862
+ "eval_el_err_precision": 0.9840232389251997,
863
+ "eval_el_err_recall": 0.9818840579710145,
864
+ "eval_loss": 0.0052265021950006485,
865
+ "eval_macro_avg_f1": 0.9105764259707885,
866
+ "eval_macro_avg_number": 23096,
867
+ "eval_macro_avg_precision": 0.9749927361731852,
868
+ "eval_macro_avg_recall": 0.8945651087172118,
869
+ "eval_micro_avg_f1": 0.9858025360355478,
870
+ "eval_micro_avg_number": 23096,
871
+ "eval_micro_avg_precision": 0.9870220061634619,
872
+ "eval_micro_avg_recall": 0.9845860755109109,
873
+ "eval_nd_err_f1": 0.9714285714285714,
874
+ "eval_nd_err_number": 1188,
875
+ "eval_nd_err_precision": 0.9697986577181208,
876
+ "eval_nd_err_recall": 0.9730639730639731,
877
+ "eval_ne_word_err_f1": 0.9930129412479494,
878
+ "eval_ne_word_err_number": 8247,
879
+ "eval_ne_word_err_precision": 0.9951290793960058,
880
+ "eval_ne_word_err_recall": 0.9909057839214259,
881
+ "eval_overall_accuracy": 0.9986137112253844,
882
+ "eval_runtime": 11.5772,
883
+ "eval_samples_per_second": 1588.3,
884
+ "eval_steps_per_second": 99.334,
885
+ "eval_unc_insert_err_f1": 0.991111111111111,
886
+ "eval_unc_insert_err_number": 902,
887
+ "eval_unc_insert_err_precision": 0.9933184855233853,
888
+ "eval_unc_insert_err_recall": 0.9889135254988913,
889
+ "eval_weighted_avg_f1": 0.9855598618500103,
890
+ "eval_weighted_avg_number": 23096,
891
+ "eval_weighted_avg_precision": 0.9871345408226997,
892
+ "eval_weighted_avg_recall": 0.9845860755109109,
893
+ "step": 8625
894
+ },
895
+ {
896
+ "epoch": 16.0,
897
+ "learning_rate": 1.037037037037037e-05,
898
+ "loss": 0.0123,
899
+ "step": 9200
900
+ },
901
+ {
902
+ "epoch": 16.0,
903
+ "eval_5_err_f1": 0.6,
904
+ "eval_5_err_number": 34,
905
+ "eval_5_err_precision": 0.9375,
906
+ "eval_5_err_recall": 0.4411764705882353,
907
+ "eval___f1": 0.9873099002920738,
908
+ "eval___number": 9934,
909
+ "eval___precision": 0.987807335751713,
910
+ "eval___recall": 0.9868129655727803,
911
+ "eval__err_f1": 0.9515570934256056,
912
+ "eval__err_number": 285,
913
+ "eval__err_precision": 0.9385665529010239,
914
+ "eval__err_recall": 0.9649122807017544,
915
+ "eval_egin_err_f1": 0.9800973020787261,
916
+ "eval_egin_err_number": 1126,
917
+ "eval_egin_err_precision": 0.9762114537444934,
918
+ "eval_egin_err_recall": 0.9840142095914742,
919
+ "eval_el_err_f1": 0.988056460369164,
920
+ "eval_el_err_number": 1380,
921
+ "eval_el_err_precision": 0.9869848156182213,
922
+ "eval_el_err_recall": 0.9891304347826086,
923
+ "eval_loss": 0.004177143797278404,
924
+ "eval_macro_avg_f1": 0.9331542372543383,
925
+ "eval_macro_avg_number": 23096,
926
+ "eval_macro_avg_precision": 0.9724010687109472,
927
+ "eval_macro_avg_recall": 0.9162982831050877,
928
+ "eval_micro_avg_f1": 0.9880050231671935,
929
+ "eval_micro_avg_number": 23096,
930
+ "eval_micro_avg_precision": 0.9881333910783889,
931
+ "eval_micro_avg_recall": 0.9878766886040873,
932
+ "eval_nd_err_f1": 0.9739714525608731,
933
+ "eval_nd_err_number": 1188,
934
+ "eval_nd_err_precision": 0.9715242881072027,
935
+ "eval_nd_err_recall": 0.9764309764309764,
936
+ "eval_ne_word_err_f1": 0.9941754641427012,
937
+ "eval_ne_word_err_number": 8247,
938
+ "eval_ne_word_err_precision": 0.9948998178506375,
939
+ "eval_ne_word_err_recall": 0.9934521644234267,
940
+ "eval_overall_accuracy": 0.998862532287495,
941
+ "eval_runtime": 12.719,
942
+ "eval_samples_per_second": 1445.712,
943
+ "eval_steps_per_second": 90.416,
944
+ "eval_unc_insert_err_f1": 0.9900662251655629,
945
+ "eval_unc_insert_err_number": 902,
946
+ "eval_unc_insert_err_precision": 0.9857142857142858,
947
+ "eval_unc_insert_err_recall": 0.9944567627494457,
948
+ "eval_weighted_avg_f1": 0.9878645943931573,
949
+ "eval_weighted_avg_number": 23096,
950
+ "eval_weighted_avg_precision": 0.9881244207310185,
951
+ "eval_weighted_avg_recall": 0.9878766886040873,
952
+ "step": 9200
953
+ },
954
+ {
955
+ "epoch": 17.0,
956
+ "learning_rate": 9.62962962962963e-06,
957
+ "loss": 0.0105,
958
+ "step": 9775
959
+ },
960
+ {
961
+ "epoch": 17.0,
962
+ "eval_5_err_f1": 0.6909090909090908,
963
+ "eval_5_err_number": 34,
964
+ "eval_5_err_precision": 0.9047619047619048,
965
+ "eval_5_err_recall": 0.5588235294117647,
966
+ "eval___f1": 0.9881665743491614,
967
+ "eval___number": 9934,
968
+ "eval___precision": 0.9886146095717884,
969
+ "eval___recall": 0.9877189450372458,
970
+ "eval__err_f1": 0.9619377162629758,
971
+ "eval__err_number": 285,
972
+ "eval__err_precision": 0.9488054607508533,
973
+ "eval__err_recall": 0.9754385964912281,
974
+ "eval_egin_err_f1": 0.983111111111111,
975
+ "eval_egin_err_number": 1126,
976
+ "eval_egin_err_precision": 0.9839857651245552,
977
+ "eval_egin_err_recall": 0.9822380106571936,
978
+ "eval_el_err_f1": 0.9902491874322861,
979
+ "eval_el_err_number": 1380,
980
+ "eval_el_err_precision": 0.9870410367170627,
981
+ "eval_el_err_recall": 0.9934782608695653,
982
+ "eval_loss": 0.0035622185096144676,
983
+ "eval_macro_avg_f1": 0.9477625393802664,
984
+ "eval_macro_avg_number": 23096,
985
+ "eval_macro_avg_precision": 0.9727147980473216,
986
+ "eval_macro_avg_recall": 0.9330802536387749,
987
+ "eval_micro_avg_f1": 0.989477330792881,
988
+ "eval_micro_avg_number": 23096,
989
+ "eval_micro_avg_precision": 0.9896058899956691,
990
+ "eval_micro_avg_recall": 0.9893488049878767,
991
+ "eval_nd_err_f1": 0.9802105263157895,
992
+ "eval_nd_err_number": 1188,
993
+ "eval_nd_err_precision": 0.9806234203875316,
994
+ "eval_nd_err_recall": 0.9797979797979798,
995
+ "eval_ne_word_err_f1": 0.99472631387525,
996
+ "eval_ne_word_err_number": 8247,
997
+ "eval_ne_word_err_precision": 0.9945454545454545,
998
+ "eval_ne_word_err_recall": 0.9949072389959985,
999
+ "eval_overall_accuracy": 0.9990106400625607,
1000
+ "eval_runtime": 11.5897,
1001
+ "eval_samples_per_second": 1586.578,
1002
+ "eval_steps_per_second": 99.226,
1003
+ "eval_unc_insert_err_f1": 0.9927897947864671,
1004
+ "eval_unc_insert_err_number": 902,
1005
+ "eval_unc_insert_err_precision": 0.9933407325194229,
1006
+ "eval_unc_insert_err_recall": 0.9922394678492239,
1007
+ "eval_weighted_avg_f1": 0.9893969219028329,
1008
+ "eval_weighted_avg_number": 23096,
1009
+ "eval_weighted_avg_precision": 0.9895715241838893,
1010
+ "eval_weighted_avg_recall": 0.9893488049878767,
1011
+ "step": 9775
1012
+ },
1013
+ {
1014
+ "epoch": 18.0,
1015
+ "learning_rate": 8.888888888888888e-06,
1016
+ "loss": 0.0093,
1017
+ "step": 10350
1018
+ },
1019
+ {
1020
+ "epoch": 18.0,
1021
+ "eval_5_err_f1": 0.7169811320754718,
1022
+ "eval_5_err_number": 34,
1023
+ "eval_5_err_precision": 1.0,
1024
+ "eval_5_err_recall": 0.5588235294117647,
1025
+ "eval___f1": 0.9897851356111308,
1026
+ "eval___number": 9934,
1027
+ "eval___precision": 0.9895361706409096,
1028
+ "eval___recall": 0.9900342258908799,
1029
+ "eval__err_f1": 0.9686411149825784,
1030
+ "eval__err_number": 285,
1031
+ "eval__err_precision": 0.9619377162629758,
1032
+ "eval__err_recall": 0.9754385964912281,
1033
+ "eval_egin_err_f1": 0.984982332155477,
1034
+ "eval_egin_err_number": 1126,
1035
+ "eval_egin_err_precision": 0.9797891036906854,
1036
+ "eval_egin_err_recall": 0.9902309058614565,
1037
+ "eval_el_err_f1": 0.993128390596745,
1038
+ "eval_el_err_number": 1380,
1039
+ "eval_el_err_precision": 0.9913357400722022,
1040
+ "eval_el_err_recall": 0.994927536231884,
1041
+ "eval_loss": 0.003151776734739542,
1042
+ "eval_macro_avg_f1": 0.9528278117999003,
1043
+ "eval_macro_avg_number": 23096,
1044
+ "eval_macro_avg_precision": 0.9858378283192721,
1045
+ "eval_macro_avg_recall": 0.9354523140152433,
1046
+ "eval_micro_avg_f1": 0.9907613751920207,
1047
+ "eval_micro_avg_number": 23096,
1048
+ "eval_micro_avg_precision": 0.9901829347403018,
1049
+ "eval_micro_avg_recall": 0.9913404918600623,
1050
+ "eval_nd_err_f1": 0.981163666806195,
1051
+ "eval_nd_err_number": 1188,
1052
+ "eval_nd_err_precision": 0.9758534554537885,
1053
+ "eval_nd_err_recall": 0.9865319865319865,
1054
+ "eval_ne_word_err_f1": 0.9951509273851376,
1055
+ "eval_ne_word_err_number": 8247,
1056
+ "eval_ne_word_err_precision": 0.9949097079141922,
1057
+ "eval_ne_word_err_recall": 0.9953922638535225,
1058
+ "eval_overall_accuracy": 0.9991054290386028,
1059
+ "eval_runtime": 11.5456,
1060
+ "eval_samples_per_second": 1592.643,
1061
+ "eval_steps_per_second": 99.605,
1062
+ "eval_unc_insert_err_f1": 0.9927897947864671,
1063
+ "eval_unc_insert_err_number": 902,
1064
+ "eval_unc_insert_err_precision": 0.9933407325194229,
1065
+ "eval_unc_insert_err_recall": 0.9922394678492239,
1066
+ "eval_weighted_avg_f1": 0.9906781013015472,
1067
+ "eval_weighted_avg_number": 23096,
1068
+ "eval_weighted_avg_precision": 0.9902068768322245,
1069
+ "eval_weighted_avg_recall": 0.9913404918600623,
1070
+ "step": 10350
1071
+ },
1072
+ {
1073
+ "epoch": 19.0,
1074
+ "learning_rate": 8.148148148148148e-06,
1075
+ "loss": 0.0077,
1076
+ "step": 10925
1077
+ },
1078
+ {
1079
+ "epoch": 19.0,
1080
+ "eval_5_err_f1": 0.8135593220338982,
1081
+ "eval_5_err_number": 34,
1082
+ "eval_5_err_precision": 0.96,
1083
+ "eval_5_err_recall": 0.7058823529411765,
1084
+ "eval___f1": 0.9900820621255602,
1085
+ "eval___number": 9934,
1086
+ "eval___precision": 0.9903313526034847,
1087
+ "eval___recall": 0.9898328971209986,
1088
+ "eval__err_f1": 0.9705372616984402,
1089
+ "eval__err_number": 285,
1090
+ "eval__err_precision": 0.958904109589041,
1091
+ "eval__err_recall": 0.9824561403508771,
1092
+ "eval_egin_err_f1": 0.9897913892587662,
1093
+ "eval_egin_err_number": 1126,
1094
+ "eval_egin_err_precision": 0.9893522626441881,
1095
+ "eval_egin_err_recall": 0.9902309058614565,
1096
+ "eval_el_err_f1": 0.9934829833454019,
1097
+ "eval_el_err_number": 1380,
1098
+ "eval_el_err_precision": 0.9927641099855282,
1099
+ "eval_el_err_recall": 0.9942028985507246,
1100
+ "eval_loss": 0.0027081461157649755,
1101
+ "eval_macro_avg_f1": 0.9666657167263342,
1102
+ "eval_macro_avg_number": 23096,
1103
+ "eval_macro_avg_precision": 0.9826479575258772,
1104
+ "eval_macro_avg_recall": 0.9555704329460621,
1105
+ "eval_micro_avg_f1": 0.9915788106423051,
1106
+ "eval_micro_avg_number": 23096,
1107
+ "eval_micro_avg_precision": 0.9915573451097545,
1108
+ "eval_micro_avg_recall": 0.9916002771042605,
1109
+ "eval_nd_err_f1": 0.9874161073825503,
1110
+ "eval_nd_err_number": 1188,
1111
+ "eval_nd_err_precision": 0.9841137123745819,
1112
+ "eval_nd_err_recall": 0.9907407407407407,
1113
+ "eval_ne_word_err_f1": 0.9950864422202002,
1114
+ "eval_ne_word_err_number": 8247,
1115
+ "eval_ne_word_err_precision": 0.9956300072833212,
1116
+ "eval_ne_word_err_recall": 0.9945434703528556,
1117
+ "eval_overall_accuracy": 0.9992179909476527,
1118
+ "eval_runtime": 11.6822,
1119
+ "eval_samples_per_second": 1574.022,
1120
+ "eval_steps_per_second": 98.441,
1121
+ "eval_unc_insert_err_f1": 0.9933701657458565,
1122
+ "eval_unc_insert_err_number": 902,
1123
+ "eval_unc_insert_err_precision": 0.9900881057268722,
1124
+ "eval_unc_insert_err_recall": 0.9966740576496674,
1125
+ "eval_weighted_avg_f1": 0.9915482800949849,
1126
+ "eval_weighted_avg_number": 23096,
1127
+ "eval_weighted_avg_precision": 0.9915592171477948,
1128
+ "eval_weighted_avg_recall": 0.9916002771042605,
1129
+ "step": 10925
1130
+ },
1131
+ {
1132
+ "epoch": 20.0,
1133
+ "learning_rate": 7.4074074074074075e-06,
1134
+ "loss": 0.0072,
1135
+ "step": 11500
1136
+ },
1137
+ {
1138
+ "epoch": 20.0,
1139
+ "eval_5_err_f1": 0.8474576271186441,
1140
+ "eval_5_err_number": 34,
1141
+ "eval_5_err_precision": 1.0,
1142
+ "eval_5_err_recall": 0.7352941176470589,
1143
+ "eval___f1": 0.9909347300564061,
1144
+ "eval___number": 9934,
1145
+ "eval___precision": 0.9915339649264261,
1146
+ "eval___recall": 0.9903362190457017,
1147
+ "eval__err_f1": 0.9738219895287958,
1148
+ "eval__err_number": 285,
1149
+ "eval__err_precision": 0.96875,
1150
+ "eval__err_recall": 0.9789473684210527,
1151
+ "eval_egin_err_f1": 0.9871738168951791,
1152
+ "eval_egin_err_number": 1126,
1153
+ "eval_egin_err_precision": 0.9832599118942731,
1154
+ "eval_egin_err_recall": 0.9911190053285968,
1155
+ "eval_el_err_f1": 0.9942154736080984,
1156
+ "eval_el_err_number": 1380,
1157
+ "eval_el_err_precision": 0.9920634920634921,
1158
+ "eval_el_err_recall": 0.9963768115942029,
1159
+ "eval_loss": 0.0023903592955321074,
1160
+ "eval_macro_avg_f1": 0.97173084894704,
1161
+ "eval_macro_avg_number": 23096,
1162
+ "eval_macro_avg_precision": 0.9894635604667124,
1163
+ "eval_macro_avg_recall": 0.9590607777684785,
1164
+ "eval_micro_avg_f1": 0.9922698828573284,
1165
+ "eval_micro_avg_number": 23096,
1166
+ "eval_micro_avg_precision": 0.9924632910295837,
1167
+ "eval_micro_avg_recall": 0.992076550051957,
1168
+ "eval_nd_err_f1": 0.9903483004616032,
1169
+ "eval_nd_err_number": 1188,
1170
+ "eval_nd_err_precision": 0.9874476987447699,
1171
+ "eval_nd_err_recall": 0.9932659932659933,
1172
+ "eval_ne_word_err_f1": 0.9954504094631482,
1173
+ "eval_ne_word_err_number": 8247,
1174
+ "eval_ne_word_err_precision": 0.9959941733430444,
1175
+ "eval_ne_word_err_recall": 0.9949072389959985,
1176
+ "eval_overall_accuracy": 0.9992594611246712,
1177
+ "eval_runtime": 11.3322,
1178
+ "eval_samples_per_second": 1622.634,
1179
+ "eval_steps_per_second": 101.481,
1180
+ "eval_unc_insert_err_f1": 0.9944444444444444,
1181
+ "eval_unc_insert_err_number": 902,
1182
+ "eval_unc_insert_err_precision": 0.9966592427616926,
1183
+ "eval_unc_insert_err_recall": 0.9922394678492239,
1184
+ "eval_weighted_avg_f1": 0.9922443584517268,
1185
+ "eval_weighted_avg_number": 23096,
1186
+ "eval_weighted_avg_precision": 0.9924761382083309,
1187
+ "eval_weighted_avg_recall": 0.992076550051957,
1188
+ "step": 11500
1189
+ },
1190
+ {
1191
+ "epoch": 21.0,
1192
+ "learning_rate": 6.666666666666667e-06,
1193
+ "loss": 0.0065,
1194
+ "step": 12075
1195
+ },
1196
+ {
1197
+ "epoch": 21.0,
1198
+ "eval_5_err_f1": 0.9206349206349206,
1199
+ "eval_5_err_number": 34,
1200
+ "eval_5_err_precision": 1.0,
1201
+ "eval_5_err_recall": 0.8529411764705882,
1202
+ "eval___f1": 0.9908903316724545,
1203
+ "eval___number": 9934,
1204
+ "eval___precision": 0.9908404630095622,
1205
+ "eval___recall": 0.9909402053553453,
1206
+ "eval__err_f1": 0.979020979020979,
1207
+ "eval__err_number": 285,
1208
+ "eval__err_precision": 0.975609756097561,
1209
+ "eval__err_recall": 0.9824561403508771,
1210
+ "eval_egin_err_f1": 0.9907038512616202,
1211
+ "eval_egin_err_number": 1126,
1212
+ "eval_egin_err_precision": 0.9876434245366285,
1213
+ "eval_egin_err_recall": 0.9937833037300178,
1214
+ "eval_el_err_f1": 0.9934876989869754,
1215
+ "eval_el_err_number": 1380,
1216
+ "eval_el_err_precision": 0.9920520231213873,
1217
+ "eval_el_err_recall": 0.994927536231884,
1218
+ "eval_loss": 0.002177101792767644,
1219
+ "eval_macro_avg_f1": 0.981866119540616,
1220
+ "eval_macro_avg_number": 23096,
1221
+ "eval_macro_avg_precision": 0.9905676481148733,
1222
+ "eval_macro_avg_recall": 0.9746318418196954,
1223
+ "eval_micro_avg_f1": 0.9925117950049778,
1224
+ "eval_micro_avg_number": 23096,
1225
+ "eval_micro_avg_precision": 0.9922111639982691,
1226
+ "eval_micro_avg_recall": 0.9928126082438518,
1227
+ "eval_nd_err_f1": 0.9903483004616032,
1228
+ "eval_nd_err_number": 1188,
1229
+ "eval_nd_err_precision": 0.9874476987447699,
1230
+ "eval_nd_err_recall": 0.9932659932659933,
1231
+ "eval_ne_word_err_f1": 0.9953922638535225,
1232
+ "eval_ne_word_err_number": 8247,
1233
+ "eval_ne_word_err_precision": 0.9953922638535225,
1234
+ "eval_ne_word_err_recall": 0.9953922638535225,
1235
+ "eval_overall_accuracy": 0.999295006990687,
1236
+ "eval_runtime": 11.5781,
1237
+ "eval_samples_per_second": 1588.177,
1238
+ "eval_steps_per_second": 99.326,
1239
+ "eval_unc_insert_err_f1": 0.9944506104328523,
1240
+ "eval_unc_insert_err_number": 902,
1241
+ "eval_unc_insert_err_precision": 0.9955555555555555,
1242
+ "eval_unc_insert_err_recall": 0.9933481152993349,
1243
+ "eval_weighted_avg_f1": 0.9925052352718289,
1244
+ "eval_weighted_avg_number": 23096,
1245
+ "eval_weighted_avg_precision": 0.9922174924307435,
1246
+ "eval_weighted_avg_recall": 0.9928126082438518,
1247
+ "step": 12075
1248
+ },
1249
+ {
1250
+ "epoch": 22.0,
1251
+ "learning_rate": 5.925925925925926e-06,
1252
+ "loss": 0.0056,
1253
+ "step": 12650
1254
+ },
1255
+ {
1256
+ "epoch": 22.0,
1257
+ "eval_5_err_f1": 0.9032258064516129,
1258
+ "eval_5_err_number": 34,
1259
+ "eval_5_err_precision": 1.0,
1260
+ "eval_5_err_recall": 0.8235294117647058,
1261
+ "eval___f1": 0.9906862004732417,
1262
+ "eval___number": 9934,
1263
+ "eval___precision": 0.990935643065767,
1264
+ "eval___recall": 0.9904368834306423,
1265
+ "eval__err_f1": 0.9791666666666666,
1266
+ "eval__err_number": 285,
1267
+ "eval__err_precision": 0.9690721649484536,
1268
+ "eval__err_recall": 0.9894736842105263,
1269
+ "eval_egin_err_f1": 0.9915817456801064,
1270
+ "eval_egin_err_number": 1126,
1271
+ "eval_egin_err_precision": 0.9893899204244032,
1272
+ "eval_egin_err_recall": 0.9937833037300178,
1273
+ "eval_el_err_f1": 0.9942154736080984,
1274
+ "eval_el_err_number": 1380,
1275
+ "eval_el_err_precision": 0.9920634920634921,
1276
+ "eval_el_err_recall": 0.9963768115942029,
1277
+ "eval_loss": 0.0019981798250228167,
1278
+ "eval_macro_avg_f1": 0.9798494009715082,
1279
+ "eval_macro_avg_number": 23096,
1280
+ "eval_macro_avg_precision": 0.9901473342025248,
1281
+ "eval_macro_avg_recall": 0.9717161526744847,
1282
+ "eval_micro_avg_f1": 0.9925730247060607,
1283
+ "eval_micro_avg_number": 23096,
1284
+ "eval_micro_avg_precision": 0.9927664919651752,
1285
+ "eval_micro_avg_recall": 0.9923796328368548,
1286
+ "eval_nd_err_f1": 0.9903157894736843,
1287
+ "eval_nd_err_number": 1188,
1288
+ "eval_nd_err_precision": 0.9907329401853412,
1289
+ "eval_nd_err_recall": 0.98989898989899,
1290
+ "eval_ne_word_err_f1": 0.9956909631607697,
1291
+ "eval_ne_word_err_number": 8247,
1292
+ "eval_ne_word_err_precision": 0.996719319562576,
1293
+ "eval_ne_word_err_recall": 0.9946647265672366,
1294
+ "eval_overall_accuracy": 0.9993127799236948,
1295
+ "eval_runtime": 11.7025,
1296
+ "eval_samples_per_second": 1571.285,
1297
+ "eval_steps_per_second": 98.269,
1298
+ "eval_unc_insert_err_f1": 0.9939125622578859,
1299
+ "eval_unc_insert_err_number": 902,
1300
+ "eval_unc_insert_err_precision": 0.9922651933701657,
1301
+ "eval_unc_insert_err_recall": 0.9955654101995566,
1302
+ "eval_weighted_avg_f1": 0.9925638618970269,
1303
+ "eval_weighted_avg_number": 23096,
1304
+ "eval_weighted_avg_precision": 0.9927779303976348,
1305
+ "eval_weighted_avg_recall": 0.9923796328368548,
1306
+ "step": 12650
1307
+ },
1308
+ {
1309
+ "epoch": 23.0,
1310
+ "learning_rate": 5.185185185185185e-06,
1311
+ "loss": 0.005,
1312
+ "step": 13225
1313
+ },
1314
+ {
1315
+ "epoch": 23.0,
1316
+ "eval_5_err_f1": 0.9375,
1317
+ "eval_5_err_number": 34,
1318
+ "eval_5_err_precision": 1.0,
1319
+ "eval_5_err_recall": 0.8823529411764706,
1320
+ "eval___f1": 0.9914409425032725,
1321
+ "eval___number": 9934,
1322
+ "eval___precision": 0.99174053182917,
1323
+ "eval___recall": 0.9911415341252265,
1324
+ "eval__err_f1": 0.9791666666666666,
1325
+ "eval__err_number": 285,
1326
+ "eval__err_precision": 0.9690721649484536,
1327
+ "eval__err_recall": 0.9894736842105263,
1328
+ "eval_egin_err_f1": 0.9924745462594068,
1329
+ "eval_egin_err_number": 1126,
1330
+ "eval_egin_err_precision": 0.9894086496028244,
1331
+ "eval_egin_err_recall": 0.9955595026642984,
1332
+ "eval_el_err_f1": 0.9945828819068254,
1333
+ "eval_el_err_number": 1380,
1334
+ "eval_el_err_precision": 0.9913606911447084,
1335
+ "eval_el_err_recall": 0.9978260869565218,
1336
+ "eval_loss": 0.0018450135830789804,
1337
+ "eval_macro_avg_f1": 0.9846004015975137,
1338
+ "eval_macro_avg_number": 23096,
1339
+ "eval_macro_avg_precision": 0.9903043479501087,
1340
+ "eval_macro_avg_recall": 0.9798487500093644,
1341
+ "eval_micro_avg_f1": 0.9931357051601308,
1342
+ "eval_micro_avg_number": 23096,
1343
+ "eval_micro_avg_precision": 0.9933723196881091,
1344
+ "eval_micro_avg_recall": 0.9928992033252512,
1345
+ "eval_nd_err_f1": 0.9907485281749369,
1346
+ "eval_nd_err_number": 1188,
1347
+ "eval_nd_err_precision": 0.9899159663865547,
1348
+ "eval_nd_err_recall": 0.9915824915824916,
1349
+ "eval_ne_word_err_f1": 0.9958702781489128,
1350
+ "eval_ne_word_err_number": 8247,
1351
+ "eval_ne_word_err_precision": 0.9975666139433021,
1352
+ "eval_ne_word_err_recall": 0.9941797017097126,
1353
+ "eval_overall_accuracy": 0.9993601744117159,
1354
+ "eval_runtime": 11.5685,
1355
+ "eval_samples_per_second": 1589.49,
1356
+ "eval_steps_per_second": 99.408,
1357
+ "eval_unc_insert_err_f1": 0.9950193691200886,
1358
+ "eval_unc_insert_err_number": 902,
1359
+ "eval_unc_insert_err_precision": 0.9933701657458563,
1360
+ "eval_unc_insert_err_recall": 0.9966740576496674,
1361
+ "eval_weighted_avg_f1": 0.9931339385720146,
1362
+ "eval_weighted_avg_number": 23096,
1363
+ "eval_weighted_avg_precision": 0.9933867261081645,
1364
+ "eval_weighted_avg_recall": 0.9928992033252512,
1365
+ "step": 13225
1366
+ },
1367
+ {
1368
+ "epoch": 24.0,
1369
+ "learning_rate": 4.444444444444444e-06,
1370
+ "loss": 0.0044,
1371
+ "step": 13800
1372
+ },
1373
+ {
1374
+ "epoch": 24.0,
1375
+ "eval_5_err_f1": 0.9538461538461539,
1376
+ "eval_5_err_number": 34,
1377
+ "eval_5_err_precision": 1.0,
1378
+ "eval_5_err_recall": 0.9117647058823529,
1379
+ "eval___f1": 0.9912947214814068,
1380
+ "eval___number": 9934,
1381
+ "eval___precision": 0.9910453767984707,
1382
+ "eval___recall": 0.991544191664989,
1383
+ "eval__err_f1": 0.9807355516637477,
1384
+ "eval__err_number": 285,
1385
+ "eval__err_precision": 0.9790209790209791,
1386
+ "eval__err_recall": 0.9824561403508771,
1387
+ "eval_egin_err_f1": 0.9924745462594068,
1388
+ "eval_egin_err_number": 1126,
1389
+ "eval_egin_err_precision": 0.9894086496028244,
1390
+ "eval_egin_err_recall": 0.9955595026642984,
1391
+ "eval_el_err_f1": 0.9953051643192489,
1392
+ "eval_el_err_number": 1380,
1393
+ "eval_el_err_precision": 0.9920806335493161,
1394
+ "eval_el_err_recall": 0.9985507246376811,
1395
+ "eval_loss": 0.0016574990004301071,
1396
+ "eval_macro_avg_f1": 0.9870548052559327,
1397
+ "eval_macro_avg_number": 23096,
1398
+ "eval_macro_avg_precision": 0.9915974009252017,
1399
+ "eval_macro_avg_recall": 0.9830275235917065,
1400
+ "eval_micro_avg_f1": 0.9931834411720154,
1401
+ "eval_micro_avg_number": 23096,
1402
+ "eval_micro_avg_precision": 0.9927752541639628,
1403
+ "eval_micro_avg_recall": 0.9935919639764461,
1404
+ "eval_nd_err_f1": 0.9920134510298445,
1405
+ "eval_nd_err_number": 1188,
1406
+ "eval_nd_err_precision": 0.9907640638119227,
1407
+ "eval_nd_err_recall": 0.9932659932659933,
1408
+ "eval_ne_word_err_f1": 0.9957550030321406,
1409
+ "eval_ne_word_err_number": 8247,
1410
+ "eval_ne_word_err_precision": 0.9959966031784544,
1411
+ "eval_ne_word_err_recall": 0.9955135200679035,
1412
+ "eval_overall_accuracy": 0.9993720230337212,
1413
+ "eval_runtime": 11.5823,
1414
+ "eval_samples_per_second": 1587.59,
1415
+ "eval_steps_per_second": 99.289,
1416
+ "eval_unc_insert_err_f1": 0.9950138504155125,
1417
+ "eval_unc_insert_err_number": 902,
1418
+ "eval_unc_insert_err_precision": 0.9944629014396457,
1419
+ "eval_unc_insert_err_recall": 0.9955654101995566,
1420
+ "eval_weighted_avg_f1": 0.9931813133618028,
1421
+ "eval_weighted_avg_number": 23096,
1422
+ "eval_weighted_avg_precision": 0.9927791997405465,
1423
+ "eval_weighted_avg_recall": 0.9935919639764461,
1424
+ "step": 13800
1425
+ },
1426
+ {
1427
+ "epoch": 25.0,
1428
+ "learning_rate": 3.7037037037037037e-06,
1429
+ "loss": 0.0042,
1430
+ "step": 14375
1431
+ },
1432
+ {
1433
+ "epoch": 25.0,
1434
+ "eval_5_err_f1": 0.9538461538461539,
1435
+ "eval_5_err_number": 34,
1436
+ "eval_5_err_precision": 1.0,
1437
+ "eval_5_err_recall": 0.9117647058823529,
1438
+ "eval___f1": 0.9912404349577124,
1439
+ "eval___number": 9934,
1440
+ "eval___precision": 0.9914400805639476,
1441
+ "eval___recall": 0.9910408697402859,
1442
+ "eval__err_f1": 0.9792387543252596,
1443
+ "eval__err_number": 285,
1444
+ "eval__err_precision": 0.9658703071672355,
1445
+ "eval__err_recall": 0.9929824561403509,
1446
+ "eval_egin_err_f1": 0.9920141969831411,
1447
+ "eval_egin_err_number": 1126,
1448
+ "eval_egin_err_precision": 0.9911347517730497,
1449
+ "eval_egin_err_recall": 0.9928952042628775,
1450
+ "eval_el_err_f1": 0.9956521739130435,
1451
+ "eval_el_err_number": 1380,
1452
+ "eval_el_err_precision": 0.9956521739130435,
1453
+ "eval_el_err_recall": 0.9956521739130435,
1454
+ "eval_loss": 0.0016160767991095781,
1455
+ "eval_macro_avg_f1": 0.9869810337461777,
1456
+ "eval_macro_avg_number": 23096,
1457
+ "eval_macro_avg_precision": 0.9912198213891408,
1458
+ "eval_macro_avg_recall": 0.9832988188396197,
1459
+ "eval_micro_avg_f1": 0.9932217337635619,
1460
+ "eval_micro_avg_number": 23096,
1461
+ "eval_micro_avg_precision": 0.993544473809627,
1462
+ "eval_micro_avg_recall": 0.9928992033252512,
1463
+ "eval_nd_err_f1": 0.9924178601516429,
1464
+ "eval_nd_err_number": 1188,
1465
+ "eval_nd_err_precision": 0.9932546374367622,
1466
+ "eval_nd_err_recall": 0.9915824915824916,
1467
+ "eval_ne_word_err_f1": 0.9958732855929119,
1468
+ "eval_ne_word_err_number": 8247,
1469
+ "eval_ne_word_err_precision": 0.9968412100595311,
1470
+ "eval_ne_word_err_recall": 0.9949072389959985,
1471
+ "eval_overall_accuracy": 0.9993720230337212,
1472
+ "eval_runtime": 11.6443,
1473
+ "eval_samples_per_second": 1579.141,
1474
+ "eval_steps_per_second": 98.761,
1475
+ "eval_unc_insert_err_f1": 0.9955654101995566,
1476
+ "eval_unc_insert_err_number": 902,
1477
+ "eval_unc_insert_err_precision": 0.9955654101995566,
1478
+ "eval_unc_insert_err_recall": 0.9955654101995566,
1479
+ "eval_weighted_avg_f1": 0.9932223625316633,
1480
+ "eval_weighted_avg_number": 23096,
1481
+ "eval_weighted_avg_precision": 0.993557001082317,
1482
+ "eval_weighted_avg_recall": 0.9928992033252512,
1483
+ "step": 14375
1484
+ },
1485
+ {
1486
+ "epoch": 26.0,
1487
+ "learning_rate": 2.962962962962963e-06,
1488
+ "loss": 0.0037,
1489
+ "step": 14950
1490
+ },
1491
+ {
1492
+ "epoch": 26.0,
1493
+ "eval_5_err_f1": 0.9696969696969697,
1494
+ "eval_5_err_number": 34,
1495
+ "eval_5_err_precision": 1.0,
1496
+ "eval_5_err_recall": 0.9411764705882353,
1497
+ "eval___f1": 0.9912990997334405,
1498
+ "eval___number": 9934,
1499
+ "eval___precision": 0.9905518142526887,
1500
+ "eval___recall": 0.992047513589692,
1501
+ "eval__err_f1": 0.9808695652173912,
1502
+ "eval__err_number": 285,
1503
+ "eval__err_precision": 0.9724137931034482,
1504
+ "eval__err_recall": 0.9894736842105263,
1505
+ "eval_egin_err_f1": 0.9924678777137793,
1506
+ "eval_egin_err_number": 1126,
1507
+ "eval_egin_err_precision": 0.9902740937223696,
1508
+ "eval_egin_err_recall": 0.9946714031971581,
1509
+ "eval_el_err_f1": 0.9956616052060738,
1510
+ "eval_el_err_number": 1380,
1511
+ "eval_el_err_precision": 0.9935064935064936,
1512
+ "eval_el_err_recall": 0.9978260869565218,
1513
+ "eval_loss": 0.0014384619425982237,
1514
+ "eval_macro_avg_f1": 0.9891194437273718,
1515
+ "eval_macro_avg_number": 23096,
1516
+ "eval_macro_avg_precision": 0.9911404335392073,
1517
+ "eval_macro_avg_recall": 0.9873442677814935,
1518
+ "eval_micro_avg_f1": 0.9932499675479209,
1519
+ "eval_micro_avg_number": 23096,
1520
+ "eval_micro_avg_precision": 0.992605725157831,
1521
+ "eval_micro_avg_recall": 0.993895046761344,
1522
+ "eval_nd_err_f1": 0.9915682967959528,
1523
+ "eval_nd_err_number": 1188,
1524
+ "eval_nd_err_precision": 0.9932432432432432,
1525
+ "eval_nd_err_recall": 0.98989898989899,
1526
+ "eval_ne_word_err_f1": 0.9958169142164293,
1527
+ "eval_ne_word_err_number": 8247,
1528
+ "eval_ne_word_err_precision": 0.9957565470417071,
1529
+ "eval_ne_word_err_recall": 0.9958772887110464,
1530
+ "eval_overall_accuracy": 0.9993779473447238,
1531
+ "eval_runtime": 11.6017,
1532
+ "eval_samples_per_second": 1584.944,
1533
+ "eval_steps_per_second": 99.124,
1534
+ "eval_unc_insert_err_f1": 0.995575221238938,
1535
+ "eval_unc_insert_err_number": 902,
1536
+ "eval_unc_insert_err_precision": 0.9933774834437086,
1537
+ "eval_unc_insert_err_recall": 0.9977827050997783,
1538
+ "eval_weighted_avg_f1": 0.9932502902231016,
1539
+ "eval_weighted_avg_number": 23096,
1540
+ "eval_weighted_avg_precision": 0.9926121818013163,
1541
+ "eval_weighted_avg_recall": 0.993895046761344,
1542
+ "step": 14950
1543
+ },
1544
+ {
1545
+ "epoch": 27.0,
1546
+ "learning_rate": 2.222222222222222e-06,
1547
+ "loss": 0.0034,
1548
+ "step": 15525
1549
+ },
1550
+ {
1551
+ "epoch": 27.0,
1552
+ "eval_5_err_f1": 0.9696969696969697,
1553
+ "eval_5_err_number": 34,
1554
+ "eval_5_err_precision": 1.0,
1555
+ "eval_5_err_recall": 0.9411764705882353,
1556
+ "eval___f1": 0.9911379657603223,
1557
+ "eval___number": 9934,
1558
+ "eval___precision": 0.9915373765867419,
1559
+ "eval___recall": 0.9907388765854641,
1560
+ "eval__err_f1": 0.9808695652173912,
1561
+ "eval__err_number": 285,
1562
+ "eval__err_precision": 0.9724137931034482,
1563
+ "eval__err_recall": 0.9894736842105263,
1564
+ "eval_egin_err_f1": 0.9924611973392462,
1565
+ "eval_egin_err_number": 1126,
1566
+ "eval_egin_err_precision": 0.9911426040744021,
1567
+ "eval_egin_err_recall": 0.9937833037300178,
1568
+ "eval_el_err_f1": 0.9956521739130435,
1569
+ "eval_el_err_number": 1380,
1570
+ "eval_el_err_precision": 0.9956521739130435,
1571
+ "eval_el_err_recall": 0.9956521739130435,
1572
+ "eval_loss": 0.0014439761871472,
1573
+ "eval_macro_avg_f1": 0.9890904534081543,
1574
+ "eval_macro_avg_number": 23096,
1575
+ "eval_macro_avg_precision": 0.9916594889334467,
1576
+ "eval_macro_avg_recall": 0.9867636941837281,
1577
+ "eval_micro_avg_f1": 0.9931572109138155,
1578
+ "eval_micro_avg_number": 23096,
1579
+ "eval_micro_avg_precision": 0.993415352625195,
1580
+ "eval_micro_avg_recall": 0.9928992033252512,
1581
+ "eval_nd_err_f1": 0.9915824915824916,
1582
+ "eval_nd_err_number": 1188,
1583
+ "eval_nd_err_precision": 0.9915824915824916,
1584
+ "eval_nd_err_recall": 0.9915824915824916,
1585
+ "eval_ne_word_err_f1": 0.9957529426040529,
1586
+ "eval_ne_word_err_number": 8247,
1587
+ "eval_ne_word_err_precision": 0.9964784456587735,
1588
+ "eval_ne_word_err_recall": 0.9950284952103795,
1589
+ "eval_overall_accuracy": 0.9993720230337212,
1590
+ "eval_runtime": 11.6586,
1591
+ "eval_samples_per_second": 1577.202,
1592
+ "eval_steps_per_second": 98.639,
1593
+ "eval_unc_insert_err_f1": 0.9955703211517165,
1594
+ "eval_unc_insert_err_number": 902,
1595
+ "eval_unc_insert_err_precision": 0.9944690265486725,
1596
+ "eval_unc_insert_err_recall": 0.9966740576496674,
1597
+ "eval_weighted_avg_f1": 0.9931577905463351,
1598
+ "eval_weighted_avg_number": 23096,
1599
+ "eval_weighted_avg_precision": 0.9934216143717426,
1600
+ "eval_weighted_avg_recall": 0.9928992033252512,
1601
+ "step": 15525
1602
+ },
1603
+ {
1604
+ "epoch": 28.0,
1605
+ "learning_rate": 1.4814814814814815e-06,
1606
+ "loss": 0.0034,
1607
+ "step": 16100
1608
+ },
1609
+ {
1610
+ "epoch": 28.0,
1611
+ "eval_5_err_f1": 0.9696969696969697,
1612
+ "eval_5_err_number": 34,
1613
+ "eval_5_err_precision": 1.0,
1614
+ "eval_5_err_recall": 0.9411764705882353,
1615
+ "eval___f1": 0.9912947214814068,
1616
+ "eval___number": 9934,
1617
+ "eval___precision": 0.9910453767984707,
1618
+ "eval___recall": 0.991544191664989,
1619
+ "eval__err_f1": 0.9808695652173912,
1620
+ "eval__err_number": 285,
1621
+ "eval__err_precision": 0.9724137931034482,
1622
+ "eval__err_recall": 0.9894736842105263,
1623
+ "eval_egin_err_f1": 0.9924678777137793,
1624
+ "eval_egin_err_number": 1126,
1625
+ "eval_egin_err_precision": 0.9902740937223696,
1626
+ "eval_egin_err_recall": 0.9946714031971581,
1627
+ "eval_el_err_f1": 0.9956584659913169,
1628
+ "eval_el_err_number": 1380,
1629
+ "eval_el_err_precision": 0.9942196531791907,
1630
+ "eval_el_err_recall": 0.9971014492753624,
1631
+ "eval_loss": 0.0013684964505955577,
1632
+ "eval_macro_avg_f1": 0.9892169526969239,
1633
+ "eval_macro_avg_number": 23096,
1634
+ "eval_macro_avg_precision": 0.9914005103836372,
1635
+ "eval_macro_avg_recall": 0.9872769063043677,
1636
+ "eval_micro_avg_f1": 0.9932685439709097,
1637
+ "eval_micro_avg_number": 23096,
1638
+ "eval_micro_avg_precision": 0.9930750919714347,
1639
+ "eval_micro_avg_recall": 0.993462071354347,
1640
+ "eval_nd_err_f1": 0.9924242424242424,
1641
+ "eval_nd_err_number": 1188,
1642
+ "eval_nd_err_precision": 0.9924242424242424,
1643
+ "eval_nd_err_recall": 0.9924242424242424,
1644
+ "eval_ne_word_err_f1": 0.9957534578985683,
1645
+ "eval_ne_word_err_number": 8247,
1646
+ "eval_ne_word_err_precision": 0.9963578972927036,
1647
+ "eval_ne_word_err_recall": 0.9951497514247605,
1648
+ "eval_overall_accuracy": 0.9993838716557264,
1649
+ "eval_runtime": 11.7106,
1650
+ "eval_samples_per_second": 1570.205,
1651
+ "eval_steps_per_second": 98.202,
1652
+ "eval_unc_insert_err_f1": 0.9955703211517165,
1653
+ "eval_unc_insert_err_number": 902,
1654
+ "eval_unc_insert_err_precision": 0.9944690265486725,
1655
+ "eval_unc_insert_err_recall": 0.9966740576496674,
1656
+ "eval_weighted_avg_f1": 0.9932693971508063,
1657
+ "eval_weighted_avg_number": 23096,
1658
+ "eval_weighted_avg_precision": 0.9930823127809575,
1659
+ "eval_weighted_avg_recall": 0.993462071354347,
1660
+ "step": 16100
1661
+ },
1662
+ {
1663
+ "epoch": 29.0,
1664
+ "learning_rate": 7.407407407407407e-07,
1665
+ "loss": 0.0032,
1666
+ "step": 16675
1667
+ },
1668
+ {
1669
+ "epoch": 29.0,
1670
+ "eval_5_err_f1": 0.9850746268656716,
1671
+ "eval_5_err_number": 34,
1672
+ "eval_5_err_precision": 1.0,
1673
+ "eval_5_err_recall": 0.9705882352941176,
1674
+ "eval___f1": 0.9913936282651367,
1675
+ "eval___number": 9934,
1676
+ "eval___precision": 0.991343734272773,
1677
+ "eval___recall": 0.9914435272800484,
1678
+ "eval__err_f1": 0.9808027923211169,
1679
+ "eval__err_number": 285,
1680
+ "eval__err_precision": 0.9756944444444444,
1681
+ "eval__err_recall": 0.9859649122807017,
1682
+ "eval_egin_err_f1": 0.9933598937583,
1683
+ "eval_egin_err_number": 1126,
1684
+ "eval_egin_err_precision": 0.9902912621359223,
1685
+ "eval_egin_err_recall": 0.9964476021314387,
1686
+ "eval_el_err_f1": 0.9956584659913169,
1687
+ "eval_el_err_number": 1380,
1688
+ "eval_el_err_precision": 0.9942196531791907,
1689
+ "eval_el_err_recall": 0.9971014492753624,
1690
+ "eval_loss": 0.0013222108827903867,
1691
+ "eval_macro_avg_f1": 0.9913746293199734,
1692
+ "eval_macro_avg_number": 23096,
1693
+ "eval_macro_avg_precision": 0.9923187118435777,
1694
+ "eval_macro_avg_recall": 0.9904955794603574,
1695
+ "eval_micro_avg_f1": 0.9934190587522189,
1696
+ "eval_micro_avg_number": 23096,
1697
+ "eval_micro_avg_precision": 0.993376049874448,
1698
+ "eval_micro_avg_recall": 0.993462071354347,
1699
+ "eval_nd_err_f1": 0.9928360724820903,
1700
+ "eval_nd_err_number": 1188,
1701
+ "eval_nd_err_precision": 0.9940928270042194,
1702
+ "eval_nd_err_recall": 0.9915824915824916,
1703
+ "eval_ne_word_err_f1": 0.9957539730680578,
1704
+ "eval_ne_word_err_number": 8247,
1705
+ "eval_ne_word_err_precision": 0.9962374074523607,
1706
+ "eval_ne_word_err_recall": 0.9952710076391416,
1707
+ "eval_overall_accuracy": 0.9993957202777317,
1708
+ "eval_runtime": 11.6052,
1709
+ "eval_samples_per_second": 1584.462,
1710
+ "eval_steps_per_second": 99.094,
1711
+ "eval_unc_insert_err_f1": 0.9961175818080976,
1712
+ "eval_unc_insert_err_number": 902,
1713
+ "eval_unc_insert_err_precision": 0.9966703662597114,
1714
+ "eval_unc_insert_err_recall": 0.9955654101995566,
1715
+ "eval_weighted_avg_f1": 0.9934199813189548,
1716
+ "eval_weighted_avg_number": 23096,
1717
+ "eval_weighted_avg_precision": 0.9933807370796509,
1718
+ "eval_weighted_avg_recall": 0.993462071354347,
1719
+ "step": 16675
1720
+ },
1721
+ {
1722
+ "epoch": 30.0,
1723
+ "learning_rate": 0.0,
1724
+ "loss": 0.003,
1725
+ "step": 17250
1726
+ },
1727
+ {
1728
+ "epoch": 30.0,
1729
+ "eval_5_err_f1": 0.9850746268656716,
1730
+ "eval_5_err_number": 34,
1731
+ "eval_5_err_precision": 1.0,
1732
+ "eval_5_err_recall": 0.9705882352941176,
1733
+ "eval___f1": 0.9912903388209234,
1734
+ "eval___number": 9934,
1735
+ "eval___precision": 0.9915399335280491,
1736
+ "eval___recall": 0.9910408697402859,
1737
+ "eval__err_f1": 0.9808695652173912,
1738
+ "eval__err_number": 285,
1739
+ "eval__err_precision": 0.9724137931034482,
1740
+ "eval__err_recall": 0.9894736842105263,
1741
+ "eval_egin_err_f1": 0.9933598937583,
1742
+ "eval_egin_err_number": 1126,
1743
+ "eval_egin_err_precision": 0.9902912621359223,
1744
+ "eval_egin_err_recall": 0.9964476021314387,
1745
+ "eval_el_err_f1": 0.9956584659913169,
1746
+ "eval_el_err_number": 1380,
1747
+ "eval_el_err_precision": 0.9942196531791907,
1748
+ "eval_el_err_recall": 0.9971014492753624,
1749
+ "eval_loss": 0.0013192046899348497,
1750
+ "eval_macro_avg_f1": 0.9912800394235617,
1751
+ "eval_macro_avg_number": 23096,
1752
+ "eval_macro_avg_precision": 0.991795835558829,
1753
+ "eval_macro_avg_recall": 0.990841420701172,
1754
+ "eval_micro_avg_f1": 0.993373754872239,
1755
+ "eval_micro_avg_number": 23096,
1756
+ "eval_micro_avg_precision": 0.9936319528677872,
1757
+ "eval_micro_avg_recall": 0.9931156910287495,
1758
+ "eval_nd_err_f1": 0.9919932574799832,
1759
+ "eval_nd_err_number": 1188,
1760
+ "eval_nd_err_precision": 0.9932489451476794,
1761
+ "eval_nd_err_recall": 0.9907407407407407,
1762
+ "eval_ne_word_err_f1": 0.9958722835983974,
1763
+ "eval_ne_word_err_number": 8247,
1764
+ "eval_ne_word_err_precision": 0.9970827762246263,
1765
+ "eval_ne_word_err_recall": 0.9946647265672366,
1766
+ "eval_overall_accuracy": 0.9993957202777317,
1767
+ "eval_runtime": 11.623,
1768
+ "eval_samples_per_second": 1582.033,
1769
+ "eval_steps_per_second": 98.942,
1770
+ "eval_unc_insert_err_f1": 0.9961218836565098,
1771
+ "eval_unc_insert_err_number": 902,
1772
+ "eval_unc_insert_err_precision": 0.9955703211517165,
1773
+ "eval_unc_insert_err_recall": 0.9966740576496674,
1774
+ "eval_weighted_avg_f1": 0.993375440096453,
1775
+ "eval_weighted_avg_number": 23096,
1776
+ "eval_weighted_avg_precision": 0.9936401344515604,
1777
+ "eval_weighted_avg_recall": 0.9931156910287495,
1778
+ "step": 17250
1779
+ },
1780
+ {
1781
+ "epoch": 30.0,
1782
+ "step": 17250,
1783
+ "total_flos": 7911429330344064.0,
1784
+ "train_loss": 0.06519987745561462,
1785
+ "train_runtime": 1743.5904,
1786
+ "train_samples_per_second": 316.382,
1787
+ "train_steps_per_second": 9.893
1788
+ }
1789
+ ],
1790
+ "max_steps": 17250,
1791
+ "num_train_epochs": 30,
1792
+ "total_flos": 7911429330344064.0,
1793
+ "trial_name": null,
1794
+ "trial_params": null
1795
+ }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:12bde5271ad8217a9a362972db9ad2e96ed8d1769894d3a041c4e9d7e28af643
3
  size 3387
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4c6b5e11b5bd25aac69af9ca386e301fbfbec9996b7dd5cb1ba740476d0951a
3
  size 3387