nlpso commited on
Commit
5becf8f
·
1 Parent(s): 935a82a

Load model and tokenizer

Browse files
config.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "Jean-Baptiste/camembert-ner",
3
+ "architectures": [
4
+ "CamembertForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 5,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 6,
10
+ "gradient_checkpointing": false,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "O+O",
16
+ "1": "I-PER+O",
17
+ "2": "I-PER+i_TITREH",
18
+ "3": "I-ACT+O",
19
+ "4": "I-DESC+O",
20
+ "5": "I-DESC+i_ACT",
21
+ "6": "I-DESC+i_TITREP",
22
+ "7": "I-SPAT+O",
23
+ "8": "I-SPAT+i_LOC",
24
+ "9": "I-SPAT+i_CARDINAL",
25
+ "10": "I-SPAT+i_FT",
26
+ "11": "I-TITRE+O"
27
+ },
28
+ "initializer_range": 0.02,
29
+ "intermediate_size": 3072,
30
+ "label2id": {
31
+ "I-ACT+O": 3,
32
+ "I-DESC+O": 4,
33
+ "I-DESC+i_ACT": 5,
34
+ "I-DESC+i_TITREP": 6,
35
+ "I-PER+O": 1,
36
+ "I-PER+i_TITREH": 2,
37
+ "I-SPAT+O": 7,
38
+ "I-SPAT+i_CARDINAL": 9,
39
+ "I-SPAT+i_FT": 10,
40
+ "I-SPAT+i_LOC": 8,
41
+ "I-TITRE+O": 11,
42
+ "O+O": 0
43
+ },
44
+ "layer_norm_eps": 1e-05,
45
+ "max_position_embeddings": 514,
46
+ "model_type": "camembert",
47
+ "num_attention_heads": 12,
48
+ "num_hidden_layers": 12,
49
+ "output_past": true,
50
+ "pad_token_id": 1,
51
+ "position_embedding_type": "absolute",
52
+ "torch_dtype": "float32",
53
+ "transformers_version": "4.25.1",
54
+ "type_vocab_size": 1,
55
+ "use_cache": true,
56
+ "vocab_size": 32005
57
+ }
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f298156cd8d31bd294f7535180d3e43699856ac95c699fc5ddd32c726d468fd1
3
+ size 880440037
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37edfba93caf5f6eacbb069012788269835b79bc4f7ad5f5c3d0a30de474dc98
3
+ size 440233393
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd2f90d48802522604131ea1a7afaabd142d575f231aa3f928e53b2be73b84f0
3
+ size 14503
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51041b89734cb38f61e5930792b2813f44d4562e4b27ac1f3179a1197589a078
3
+ size 623
sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:988bc5a00281c6d210a5d34bd143d0363741a432fefe741bf71e61b1869d4314
3
+ size 810912
special_tokens_map.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "mask_token": "<mask>",
10
+ "pad_token": "<pad>",
11
+ "sep_token": "</s>",
12
+ "unk_token": "<unk>"
13
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "mask_token": {
10
+ "__type": "AddedToken",
11
+ "content": "<mask>",
12
+ "lstrip": true,
13
+ "normalized": true,
14
+ "rstrip": false,
15
+ "single_word": false
16
+ },
17
+ "model_max_length": 512,
18
+ "name_or_path": "Jean-Baptiste/camembert-ner",
19
+ "pad_token": "<pad>",
20
+ "sep_token": "</s>",
21
+ "sp_model_kwargs": {},
22
+ "special_tokens_map_file": "/lrde/home2/stual/.cache/huggingface/hub/models--Jean-Baptiste--camembert-ner/snapshots/9f8b2203b6a2daba1ad279ac2adb822518caa167/special_tokens_map.json",
23
+ "tokenizer_class": "CamembertTokenizer",
24
+ "unk_token": "<unk>"
25
+ }
trainer_state.json ADDED
@@ -0,0 +1,2040 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9663670629167874,
3
+ "best_model_checkpoint": "/work/stual/res_ICDAR/method_3/tmp/321-camembert-ner-hierarchical-loss-io/checkpoint-2000",
4
+ "epoch": 5.2493438320209975,
5
+ "global_step": 2000,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.26,
12
+ "eval_ACT": {
13
+ "f1": 0.8378378378378379,
14
+ "number": 519,
15
+ "precision": 0.7868020304568528,
16
+ "recall": 0.8959537572254336
17
+ },
18
+ "eval_ACT_L1": {
19
+ "f1": 0.850091407678245,
20
+ "number": 503,
21
+ "precision": 0.7868020304568528,
22
+ "recall": 0.9244532803180915
23
+ },
24
+ "eval_ACT_L2": {
25
+ "f1": 0.0,
26
+ "number": 16,
27
+ "precision": 0.0,
28
+ "recall": 0.0
29
+ },
30
+ "eval_CARDINAL": {
31
+ "f1": 0.9687726942628904,
32
+ "number": 678,
33
+ "precision": 0.9542203147353362,
34
+ "recall": 0.9837758112094396
35
+ },
36
+ "eval_DESC": {
37
+ "f1": 0.0,
38
+ "number": 30,
39
+ "precision": 0.0,
40
+ "recall": 0.0
41
+ },
42
+ "eval_FT": {
43
+ "f1": 0.0,
44
+ "number": 7,
45
+ "precision": 0.0,
46
+ "recall": 0.0
47
+ },
48
+ "eval_LOC": {
49
+ "f1": 0.908150064683053,
50
+ "number": 761,
51
+ "precision": 0.8942675159235669,
52
+ "recall": 0.9224704336399474
53
+ },
54
+ "eval_PER": {
55
+ "f1": 0.9078947368421053,
56
+ "number": 676,
57
+ "precision": 0.8973988439306358,
58
+ "recall": 0.9186390532544378
59
+ },
60
+ "eval_SPAT": {
61
+ "f1": 0.9194915254237289,
62
+ "number": 694,
63
+ "precision": 0.9016620498614959,
64
+ "recall": 0.9380403458213257
65
+ },
66
+ "eval_TITRE": {
67
+ "f1": 0.0,
68
+ "number": 2,
69
+ "precision": 0.0,
70
+ "recall": 0.0
71
+ },
72
+ "eval_TITREH": {
73
+ "f1": 0.0,
74
+ "number": 33,
75
+ "precision": 0.0,
76
+ "recall": 0.0
77
+ },
78
+ "eval_TITREP": {
79
+ "f1": 0.0,
80
+ "number": 6,
81
+ "precision": 0.0,
82
+ "recall": 0.0
83
+ },
84
+ "eval_accuracy": 0.926600860541635,
85
+ "eval_accuracy-all": 0.950582131106049,
86
+ "eval_accuracy-das": 0.9424196405973171,
87
+ "eval_accuracy-l1": 0.9369779802581625,
88
+ "eval_accuracy-l2": 0.9641862819539357,
89
+ "eval_f1": 0.9032535473699298,
90
+ "eval_f1-all": 0.9009427121102248,
91
+ "eval_f1-das": 0.8991195891415995,
92
+ "eval_f1-l1": 0.8884910485933504,
93
+ "eval_f1-l2": 0.917252931323283,
94
+ "eval_loss": 0.3965435028076172,
95
+ "eval_precision": 0.8908679672038451,
96
+ "eval_precision-all": 0.8902264259100029,
97
+ "eval_precision-das": 0.8857968919407301,
98
+ "eval_precision-l1": 0.8663341645885286,
99
+ "eval_precision-l2": 0.9225067385444744,
100
+ "eval_recall": 0.9159883720930233,
101
+ "eval_recall-all": 0.9119201409277745,
102
+ "eval_recall-das": 0.9128491620111732,
103
+ "eval_recall-l1": 0.9118110236220472,
104
+ "eval_recall-l2": 0.9120586275816123,
105
+ "eval_runtime": 5.6993,
106
+ "eval_samples_per_second": 118.611,
107
+ "eval_steps_per_second": 7.545,
108
+ "step": 100
109
+ },
110
+ {
111
+ "epoch": 0.52,
112
+ "eval_ACT": {
113
+ "f1": 0.888888888888889,
114
+ "number": 519,
115
+ "precision": 0.8556149732620321,
116
+ "recall": 0.9248554913294798
117
+ },
118
+ "eval_ACT_L1": {
119
+ "f1": 0.9022556390977442,
120
+ "number": 503,
121
+ "precision": 0.8556149732620321,
122
+ "recall": 0.9542743538767395
123
+ },
124
+ "eval_ACT_L2": {
125
+ "f1": 0.0,
126
+ "number": 16,
127
+ "precision": 0.0,
128
+ "recall": 0.0
129
+ },
130
+ "eval_CARDINAL": {
131
+ "f1": 0.9744338933528124,
132
+ "number": 678,
133
+ "precision": 0.9652677279305355,
134
+ "recall": 0.9837758112094396
135
+ },
136
+ "eval_DESC": {
137
+ "f1": 0.0,
138
+ "number": 30,
139
+ "precision": 0.0,
140
+ "recall": 0.0
141
+ },
142
+ "eval_FT": {
143
+ "f1": 0.0,
144
+ "number": 7,
145
+ "precision": 0.0,
146
+ "recall": 0.0
147
+ },
148
+ "eval_LOC": {
149
+ "f1": 0.9430255402750493,
150
+ "number": 761,
151
+ "precision": 0.9399477806788512,
152
+ "recall": 0.9461235216819974
153
+ },
154
+ "eval_PER": {
155
+ "f1": 0.943952802359882,
156
+ "number": 676,
157
+ "precision": 0.9411764705882353,
158
+ "recall": 0.9467455621301775
159
+ },
160
+ "eval_SPAT": {
161
+ "f1": 0.9349535382416011,
162
+ "number": 694,
163
+ "precision": 0.9276595744680851,
164
+ "recall": 0.9423631123919308
165
+ },
166
+ "eval_TITRE": {
167
+ "f1": 0.0,
168
+ "number": 2,
169
+ "precision": 0.0,
170
+ "recall": 0.0
171
+ },
172
+ "eval_TITREH": {
173
+ "f1": 0.0,
174
+ "number": 33,
175
+ "precision": 0.0,
176
+ "recall": 0.0
177
+ },
178
+ "eval_TITREP": {
179
+ "f1": 0.0,
180
+ "number": 6,
181
+ "precision": 0.0,
182
+ "recall": 0.0
183
+ },
184
+ "eval_accuracy": 0.9360921285750443,
185
+ "eval_accuracy-all": 0.955960516324981,
186
+ "eval_accuracy-das": 0.9502657555049354,
187
+ "eval_accuracy-l1": 0.9448240951657808,
188
+ "eval_accuracy-l2": 0.9670969374841812,
189
+ "eval_f1": 0.931761967117707,
190
+ "eval_f1-all": 0.927931894906796,
191
+ "eval_f1-das": 0.9288500835965074,
192
+ "eval_f1-l1": 0.9203631647211413,
193
+ "eval_f1-l2": 0.9377958079783638,
194
+ "eval_loss": 0.279910147190094,
195
+ "eval_precision": 0.9327119137780367,
196
+ "eval_precision-all": 0.9277957147050191,
197
+ "eval_precision-das": 0.9266123054114158,
198
+ "eval_precision-l1": 0.9097435897435897,
199
+ "eval_precision-l2": 0.9519560741249142,
200
+ "eval_recall": 0.9308139534883721,
201
+ "eval_recall-all": 0.9280681150910158,
202
+ "eval_recall-das": 0.931098696461825,
203
+ "eval_recall-l1": 0.9312335958005249,
204
+ "eval_recall-l2": 0.9240506329113924,
205
+ "eval_runtime": 5.3228,
206
+ "eval_samples_per_second": 127.0,
207
+ "eval_steps_per_second": 8.078,
208
+ "step": 200
209
+ },
210
+ {
211
+ "epoch": 0.79,
212
+ "eval_ACT": {
213
+ "f1": 0.9224880382775119,
214
+ "number": 519,
215
+ "precision": 0.9163498098859315,
216
+ "recall": 0.928709055876686
217
+ },
218
+ "eval_ACT_L1": {
219
+ "f1": 0.9368318756073858,
220
+ "number": 503,
221
+ "precision": 0.9163498098859315,
222
+ "recall": 0.9582504970178927
223
+ },
224
+ "eval_ACT_L2": {
225
+ "f1": 0.0,
226
+ "number": 16,
227
+ "precision": 0.0,
228
+ "recall": 0.0
229
+ },
230
+ "eval_CARDINAL": {
231
+ "f1": 0.9773226042428675,
232
+ "number": 678,
233
+ "precision": 0.969521044992743,
234
+ "recall": 0.9852507374631269
235
+ },
236
+ "eval_DESC": {
237
+ "f1": 0.07692307692307691,
238
+ "number": 30,
239
+ "precision": 0.09090909090909091,
240
+ "recall": 0.06666666666666667
241
+ },
242
+ "eval_FT": {
243
+ "f1": 0.0,
244
+ "number": 7,
245
+ "precision": 0.0,
246
+ "recall": 0.0
247
+ },
248
+ "eval_LOC": {
249
+ "f1": 0.9381107491856677,
250
+ "number": 761,
251
+ "precision": 0.9302325581395349,
252
+ "recall": 0.9461235216819974
253
+ },
254
+ "eval_PER": {
255
+ "f1": 0.9358879882092852,
256
+ "number": 676,
257
+ "precision": 0.9324522760646109,
258
+ "recall": 0.9393491124260355
259
+ },
260
+ "eval_SPAT": {
261
+ "f1": 0.9390070921985816,
262
+ "number": 694,
263
+ "precision": 0.9245810055865922,
264
+ "recall": 0.9538904899135446
265
+ },
266
+ "eval_TITRE": {
267
+ "f1": 0.0,
268
+ "number": 2,
269
+ "precision": 0.0,
270
+ "recall": 0.0
271
+ },
272
+ "eval_TITREH": {
273
+ "f1": 0.3921568627450981,
274
+ "number": 33,
275
+ "precision": 0.5555555555555556,
276
+ "recall": 0.30303030303030304
277
+ },
278
+ "eval_TITREP": {
279
+ "f1": 0.0,
280
+ "number": 6,
281
+ "precision": 0.0,
282
+ "recall": 0.0
283
+ },
284
+ "eval_accuracy": 0.9426727410782081,
285
+ "eval_accuracy-all": 0.9577322196912175,
286
+ "eval_accuracy-das": 0.960389774740572,
287
+ "eval_accuracy-l1": 0.9483675018982536,
288
+ "eval_accuracy-l2": 0.9670969374841812,
289
+ "eval_f1": 0.939160737621606,
290
+ "eval_f1-all": 0.9306206088992975,
291
+ "eval_f1-das": 0.9402568397543273,
292
+ "eval_f1-l1": 0.925194805194805,
293
+ "eval_f1-l2": 0.937625754527163,
294
+ "eval_loss": 0.23822064697742462,
295
+ "eval_precision": 0.938207136640557,
296
+ "eval_precision-all": 0.9279042615294805,
297
+ "eval_precision-das": 0.9397321428571429,
298
+ "eval_precision-l1": 0.9156812339331619,
299
+ "eval_precision-l2": 0.9439567859554355,
300
+ "eval_recall": 0.9401162790697675,
301
+ "eval_recall-all": 0.9333529066353494,
302
+ "eval_recall-das": 0.9407821229050279,
303
+ "eval_recall-l1": 0.9349081364829396,
304
+ "eval_recall-l2": 0.9313790806129247,
305
+ "eval_runtime": 5.4317,
306
+ "eval_samples_per_second": 124.456,
307
+ "eval_steps_per_second": 7.917,
308
+ "step": 300
309
+ },
310
+ {
311
+ "epoch": 1.05,
312
+ "eval_ACT": {
313
+ "f1": 0.9135802469135802,
314
+ "number": 519,
315
+ "precision": 0.900749063670412,
316
+ "recall": 0.9267822736030829
317
+ },
318
+ "eval_ACT_L1": {
319
+ "f1": 0.9276759884281581,
320
+ "number": 503,
321
+ "precision": 0.900749063670412,
322
+ "recall": 0.9562624254473161
323
+ },
324
+ "eval_ACT_L2": {
325
+ "f1": 0.0,
326
+ "number": 16,
327
+ "precision": 0.0,
328
+ "recall": 0.0
329
+ },
330
+ "eval_CARDINAL": {
331
+ "f1": 0.9852941176470589,
332
+ "number": 678,
333
+ "precision": 0.9824046920821115,
334
+ "recall": 0.9882005899705014
335
+ },
336
+ "eval_DESC": {
337
+ "f1": 0.16129032258064516,
338
+ "number": 30,
339
+ "precision": 0.15625,
340
+ "recall": 0.16666666666666666
341
+ },
342
+ "eval_FT": {
343
+ "f1": 0.0,
344
+ "number": 7,
345
+ "precision": 0.0,
346
+ "recall": 0.0
347
+ },
348
+ "eval_LOC": {
349
+ "f1": 0.9414858645627877,
350
+ "number": 761,
351
+ "precision": 0.9421052631578948,
352
+ "recall": 0.9408672798948752
353
+ },
354
+ "eval_PER": {
355
+ "f1": 0.9646539027982327,
356
+ "number": 676,
357
+ "precision": 0.9604105571847508,
358
+ "recall": 0.9689349112426036
359
+ },
360
+ "eval_SPAT": {
361
+ "f1": 0.9440459110473458,
362
+ "number": 694,
363
+ "precision": 0.94,
364
+ "recall": 0.9481268011527377
365
+ },
366
+ "eval_TITRE": {
367
+ "f1": 0.0,
368
+ "number": 2,
369
+ "precision": 0.0,
370
+ "recall": 0.0
371
+ },
372
+ "eval_TITREH": {
373
+ "f1": 0.7118644067796609,
374
+ "number": 33,
375
+ "precision": 0.8076923076923077,
376
+ "recall": 0.6363636363636364
377
+ },
378
+ "eval_TITREP": {
379
+ "f1": 0.0,
380
+ "number": 6,
381
+ "precision": 0.0,
382
+ "recall": 0.0
383
+ },
384
+ "eval_accuracy": 0.9511516071880537,
385
+ "eval_accuracy-all": 0.9660212604403948,
386
+ "eval_accuracy-das": 0.9677296886864085,
387
+ "eval_accuracy-l1": 0.9574791192103265,
388
+ "eval_accuracy-l2": 0.9745634016704632,
389
+ "eval_f1": 0.9458987783595114,
390
+ "eval_f1-all": 0.9399003224860745,
391
+ "eval_f1-das": 0.9493293591654248,
392
+ "eval_f1-l1": 0.9338178043083311,
393
+ "eval_f1-l2": 0.9477938699898956,
394
+ "eval_loss": 0.18405073881149292,
395
+ "eval_precision": 0.9464493597206054,
396
+ "eval_precision-all": 0.9385245901639344,
397
+ "eval_precision-das": 0.9496831904584421,
398
+ "eval_precision-l1": 0.9235112936344969,
399
+ "eval_precision-l2": 0.9584468664850136,
400
+ "eval_recall": 0.9453488372093023,
401
+ "eval_recall-all": 0.9412800939518496,
402
+ "eval_recall-das": 0.948975791433892,
403
+ "eval_recall-l1": 0.9443569553805774,
404
+ "eval_recall-l2": 0.9373750832778148,
405
+ "eval_runtime": 5.2971,
406
+ "eval_samples_per_second": 127.616,
407
+ "eval_steps_per_second": 8.118,
408
+ "step": 400
409
+ },
410
+ {
411
+ "epoch": 1.31,
412
+ "learning_rate": 9e-05,
413
+ "loss": 0.3703,
414
+ "step": 500
415
+ },
416
+ {
417
+ "epoch": 1.31,
418
+ "eval_ACT": {
419
+ "f1": 0.9379178605539636,
420
+ "number": 519,
421
+ "precision": 0.9299242424242424,
422
+ "recall": 0.9460500963391136
423
+ },
424
+ "eval_ACT_L1": {
425
+ "f1": 0.9524733268671194,
426
+ "number": 503,
427
+ "precision": 0.9299242424242424,
428
+ "recall": 0.9761431411530815
429
+ },
430
+ "eval_ACT_L2": {
431
+ "f1": 0.0,
432
+ "number": 16,
433
+ "precision": 0.0,
434
+ "recall": 0.0
435
+ },
436
+ "eval_CARDINAL": {
437
+ "f1": 0.9816041206769685,
438
+ "number": 678,
439
+ "precision": 0.9794419970631424,
440
+ "recall": 0.9837758112094396
441
+ },
442
+ "eval_DESC": {
443
+ "f1": 0.22727272727272724,
444
+ "number": 30,
445
+ "precision": 0.35714285714285715,
446
+ "recall": 0.16666666666666666
447
+ },
448
+ "eval_FT": {
449
+ "f1": 0.0,
450
+ "number": 7,
451
+ "precision": 0.0,
452
+ "recall": 0.0
453
+ },
454
+ "eval_LOC": {
455
+ "f1": 0.9286640726329443,
456
+ "number": 761,
457
+ "precision": 0.9167733674775929,
458
+ "recall": 0.9408672798948752
459
+ },
460
+ "eval_PER": {
461
+ "f1": 0.960294117647059,
462
+ "number": 676,
463
+ "precision": 0.9546783625730995,
464
+ "recall": 0.9659763313609467
465
+ },
466
+ "eval_SPAT": {
467
+ "f1": 0.9291784702549575,
468
+ "number": 694,
469
+ "precision": 0.9136490250696379,
470
+ "recall": 0.9452449567723343
471
+ },
472
+ "eval_TITRE": {
473
+ "f1": 0.0,
474
+ "number": 2,
475
+ "precision": 0.0,
476
+ "recall": 0.0
477
+ },
478
+ "eval_TITREH": {
479
+ "f1": 0.7419354838709677,
480
+ "number": 33,
481
+ "precision": 0.7931034482758621,
482
+ "recall": 0.696969696969697
483
+ },
484
+ "eval_TITREP": {
485
+ "f1": 0.0,
486
+ "number": 6,
487
+ "precision": 0.0,
488
+ "recall": 0.0
489
+ },
490
+ "eval_accuracy": 0.951784358390281,
491
+ "eval_accuracy-all": 0.964123006833713,
492
+ "eval_accuracy-das": 0.9651986838774994,
493
+ "eval_accuracy-l1": 0.9583649708934447,
494
+ "eval_accuracy-l2": 0.9698810427739812,
495
+ "eval_f1": 0.9481932956029604,
496
+ "eval_f1-all": 0.9384772760485167,
497
+ "eval_f1-das": 0.9487940630797775,
498
+ "eval_f1-l1": 0.9379059495972979,
499
+ "eval_f1-l2": 0.9392117568470274,
500
+ "eval_loss": 0.20227569341659546,
501
+ "eval_precision": 0.9466821211243118,
502
+ "eval_precision-all": 0.9342449810881582,
503
+ "eval_precision-das": 0.945286506469501,
504
+ "eval_precision-l1": 0.9284979423868313,
505
+ "eval_precision-l2": 0.941728064300067,
506
+ "eval_recall": 0.9497093023255814,
507
+ "eval_recall-all": 0.9427480916030534,
508
+ "eval_recall-das": 0.9523277467411546,
509
+ "eval_recall-l1": 0.94750656167979,
510
+ "eval_recall-l2": 0.9367088607594937,
511
+ "eval_runtime": 5.4983,
512
+ "eval_samples_per_second": 122.948,
513
+ "eval_steps_per_second": 7.821,
514
+ "step": 500
515
+ },
516
+ {
517
+ "epoch": 1.57,
518
+ "eval_ACT": {
519
+ "f1": 0.9351145038167938,
520
+ "number": 519,
521
+ "precision": 0.9262759924385633,
522
+ "recall": 0.9441233140655106
523
+ },
524
+ "eval_ACT_L1": {
525
+ "f1": 0.9496124031007751,
526
+ "number": 503,
527
+ "precision": 0.9262759924385633,
528
+ "recall": 0.974155069582505
529
+ },
530
+ "eval_ACT_L2": {
531
+ "f1": 0.0,
532
+ "number": 16,
533
+ "precision": 0.0,
534
+ "recall": 0.0
535
+ },
536
+ "eval_CARDINAL": {
537
+ "f1": 0.9808823529411764,
538
+ "number": 678,
539
+ "precision": 0.9780058651026393,
540
+ "recall": 0.9837758112094396
541
+ },
542
+ "eval_DESC": {
543
+ "f1": 0.2711864406779661,
544
+ "number": 30,
545
+ "precision": 0.27586206896551724,
546
+ "recall": 0.26666666666666666
547
+ },
548
+ "eval_FT": {
549
+ "f1": 0.0,
550
+ "number": 7,
551
+ "precision": 0.0,
552
+ "recall": 0.0
553
+ },
554
+ "eval_LOC": {
555
+ "f1": 0.9541284403669723,
556
+ "number": 761,
557
+ "precision": 0.9516339869281045,
558
+ "recall": 0.9566360052562418
559
+ },
560
+ "eval_PER": {
561
+ "f1": 0.9720176730486009,
562
+ "number": 676,
563
+ "precision": 0.967741935483871,
564
+ "recall": 0.9763313609467456
565
+ },
566
+ "eval_SPAT": {
567
+ "f1": 0.9633883704235463,
568
+ "number": 694,
569
+ "precision": 0.9599427753934192,
570
+ "recall": 0.9668587896253602
571
+ },
572
+ "eval_TITRE": {
573
+ "f1": 0.0,
574
+ "number": 2,
575
+ "precision": 0.0,
576
+ "recall": 0.0
577
+ },
578
+ "eval_TITREH": {
579
+ "f1": 0.676470588235294,
580
+ "number": 33,
581
+ "precision": 0.6571428571428571,
582
+ "recall": 0.696969696969697
583
+ },
584
+ "eval_TITREP": {
585
+ "f1": 0.0,
586
+ "number": 6,
587
+ "precision": 0.0,
588
+ "recall": 0.0
589
+ },
590
+ "eval_accuracy": 0.9583649708934447,
591
+ "eval_accuracy-all": 0.9695646671728676,
592
+ "eval_accuracy-das": 0.9716527461402177,
593
+ "eval_accuracy-l1": 0.9644393824348266,
594
+ "eval_accuracy-l2": 0.9746899519109087,
595
+ "eval_f1": 0.9551458847437944,
596
+ "eval_f1-all": 0.9510837727006444,
597
+ "eval_f1-das": 0.9576050576422462,
598
+ "eval_f1-l1": 0.9516129032258065,
599
+ "eval_f1-l2": 0.9504021447721179,
600
+ "eval_loss": 0.16219548881053925,
601
+ "eval_precision": 0.953899681066976,
602
+ "eval_precision-all": 0.9488603156049094,
603
+ "eval_precision-das": 0.9561826958782027,
604
+ "eval_precision-l1": 0.9432697266632285,
605
+ "eval_precision-l2": 0.9561699258260283,
606
+ "eval_recall": 0.9563953488372093,
607
+ "eval_recall-all": 0.9533176746917205,
608
+ "eval_recall-das": 0.9590316573556797,
609
+ "eval_recall-l1": 0.9601049868766404,
610
+ "eval_recall-l2": 0.9447035309793471,
611
+ "eval_runtime": 5.458,
612
+ "eval_samples_per_second": 123.855,
613
+ "eval_steps_per_second": 7.878,
614
+ "step": 600
615
+ },
616
+ {
617
+ "epoch": 1.84,
618
+ "eval_ACT": {
619
+ "f1": 0.9361296472831266,
620
+ "number": 519,
621
+ "precision": 0.9264150943396227,
622
+ "recall": 0.9460500963391136
623
+ },
624
+ "eval_ACT_L1": {
625
+ "f1": 0.9483933787731256,
626
+ "number": 503,
627
+ "precision": 0.9293893129770993,
628
+ "recall": 0.9681908548707754
629
+ },
630
+ "eval_ACT_L2": {
631
+ "f1": 0.36363636363636365,
632
+ "number": 16,
633
+ "precision": 0.6666666666666666,
634
+ "recall": 0.25
635
+ },
636
+ "eval_CARDINAL": {
637
+ "f1": 0.9889298892988929,
638
+ "number": 678,
639
+ "precision": 0.9896602658788775,
640
+ "recall": 0.9882005899705014
641
+ },
642
+ "eval_DESC": {
643
+ "f1": 0.4528301886792453,
644
+ "number": 30,
645
+ "precision": 0.5217391304347826,
646
+ "recall": 0.4
647
+ },
648
+ "eval_FT": {
649
+ "f1": 0.0,
650
+ "number": 7,
651
+ "precision": 0.0,
652
+ "recall": 0.0
653
+ },
654
+ "eval_LOC": {
655
+ "f1": 0.9514435695538058,
656
+ "number": 761,
657
+ "precision": 0.9501965923984272,
658
+ "recall": 0.9526938239159002
659
+ },
660
+ "eval_PER": {
661
+ "f1": 0.9666913397483345,
662
+ "number": 676,
663
+ "precision": 0.9674074074074074,
664
+ "recall": 0.9659763313609467
665
+ },
666
+ "eval_SPAT": {
667
+ "f1": 0.9519713261648747,
668
+ "number": 694,
669
+ "precision": 0.9472182596291013,
670
+ "recall": 0.9567723342939481
671
+ },
672
+ "eval_TITRE": {
673
+ "f1": 0.0,
674
+ "number": 2,
675
+ "precision": 0.0,
676
+ "recall": 0.0
677
+ },
678
+ "eval_TITREH": {
679
+ "f1": 0.6216216216216217,
680
+ "number": 33,
681
+ "precision": 0.5609756097560976,
682
+ "recall": 0.696969696969697
683
+ },
684
+ "eval_TITREP": {
685
+ "f1": 0.2222222222222222,
686
+ "number": 6,
687
+ "precision": 0.3333333333333333,
688
+ "recall": 0.16666666666666666
689
+ },
690
+ "eval_accuracy": 0.9605163249810175,
691
+ "eval_accuracy-all": 0.9719691217413313,
692
+ "eval_accuracy-das": 0.9713996456593268,
693
+ "eval_accuracy-l1": 0.9669703872437357,
694
+ "eval_accuracy-l2": 0.9769678562389269,
695
+ "eval_f1": 0.9528096413532743,
696
+ "eval_f1-all": 0.9499926675465612,
697
+ "eval_f1-das": 0.9529827169671065,
698
+ "eval_f1-l1": 0.9487983281086729,
699
+ "eval_f1-l2": 0.9515212303577398,
700
+ "eval_loss": 0.1616193950176239,
701
+ "eval_precision": 0.9518421816071947,
702
+ "eval_precision-all": 0.9490184588338705,
703
+ "eval_precision-das": 0.9510385756676558,
704
+ "eval_precision-l1": 0.9443577743109725,
705
+ "eval_precision-l2": 0.9550335570469799,
706
+ "eval_recall": 0.9537790697674419,
707
+ "eval_recall-all": 0.9509688784497945,
708
+ "eval_recall-das": 0.9549348230912477,
709
+ "eval_recall-l1": 0.9532808398950131,
710
+ "eval_recall-l2": 0.9480346435709527,
711
+ "eval_runtime": 5.3537,
712
+ "eval_samples_per_second": 126.267,
713
+ "eval_steps_per_second": 8.032,
714
+ "step": 700
715
+ },
716
+ {
717
+ "epoch": 2.1,
718
+ "eval_ACT": {
719
+ "f1": 0.9180018850141377,
720
+ "number": 519,
721
+ "precision": 0.8985239852398524,
722
+ "recall": 0.9383429672447013
723
+ },
724
+ "eval_ACT_L1": {
725
+ "f1": 0.942439024390244,
726
+ "number": 503,
727
+ "precision": 0.9252873563218391,
728
+ "recall": 0.9602385685884692
729
+ },
730
+ "eval_ACT_L2": {
731
+ "f1": 0.22222222222222224,
732
+ "number": 16,
733
+ "precision": 0.2,
734
+ "recall": 0.25
735
+ },
736
+ "eval_CARDINAL": {
737
+ "f1": 0.986019131714496,
738
+ "number": 678,
739
+ "precision": 0.9838472834067548,
740
+ "recall": 0.9882005899705014
741
+ },
742
+ "eval_DESC": {
743
+ "f1": 0.4210526315789474,
744
+ "number": 30,
745
+ "precision": 0.34782608695652173,
746
+ "recall": 0.5333333333333333
747
+ },
748
+ "eval_FT": {
749
+ "f1": 0.0,
750
+ "number": 7,
751
+ "precision": 0.0,
752
+ "recall": 0.0
753
+ },
754
+ "eval_LOC": {
755
+ "f1": 0.9256844850065189,
756
+ "number": 761,
757
+ "precision": 0.9184993531694696,
758
+ "recall": 0.9329829172141918
759
+ },
760
+ "eval_PER": {
761
+ "f1": 0.9558173784977908,
762
+ "number": 676,
763
+ "precision": 0.9516129032258065,
764
+ "recall": 0.9600591715976331
765
+ },
766
+ "eval_SPAT": {
767
+ "f1": 0.9461593682699211,
768
+ "number": 694,
769
+ "precision": 0.9427753934191703,
770
+ "recall": 0.9495677233429395
771
+ },
772
+ "eval_TITRE": {
773
+ "f1": 0.0,
774
+ "number": 2,
775
+ "precision": 0.0,
776
+ "recall": 0.0
777
+ },
778
+ "eval_TITREH": {
779
+ "f1": 0.7605633802816901,
780
+ "number": 33,
781
+ "precision": 0.7105263157894737,
782
+ "recall": 0.8181818181818182
783
+ },
784
+ "eval_TITREP": {
785
+ "f1": 0.3333333333333333,
786
+ "number": 6,
787
+ "precision": 0.3333333333333333,
788
+ "recall": 0.3333333333333333
789
+ },
790
+ "eval_accuracy": 0.9474816502151354,
791
+ "eval_accuracy-all": 0.9607694254619084,
792
+ "eval_accuracy-das": 0.967603138445963,
793
+ "eval_accuracy-l1": 0.9552012148823082,
794
+ "eval_accuracy-l2": 0.9663376360415085,
795
+ "eval_f1": 0.9397035544682689,
796
+ "eval_f1-all": 0.9369998545031283,
797
+ "eval_f1-das": 0.9450305385896723,
798
+ "eval_f1-l1": 0.9377270368448366,
799
+ "eval_f1-l2": 0.9360715468698245,
800
+ "eval_loss": 0.17993101477622986,
801
+ "eval_precision": 0.9304645198062126,
802
+ "eval_precision-all": 0.9287568503028555,
803
+ "eval_precision-das": 0.9392935982339956,
804
+ "eval_precision-l1": 0.9271421241662391,
805
+ "eval_precision-l2": 0.9308300395256917,
806
+ "eval_recall": 0.9491279069767442,
807
+ "eval_recall-all": 0.9453904873752202,
808
+ "eval_recall-das": 0.9508379888268157,
809
+ "eval_recall-l1": 0.9485564304461942,
810
+ "eval_recall-l2": 0.9413724183877415,
811
+ "eval_runtime": 5.7248,
812
+ "eval_samples_per_second": 118.084,
813
+ "eval_steps_per_second": 7.511,
814
+ "step": 800
815
+ },
816
+ {
817
+ "epoch": 2.36,
818
+ "eval_ACT": {
819
+ "f1": 0.9387370405278038,
820
+ "number": 519,
821
+ "precision": 0.9188191881918819,
822
+ "recall": 0.9595375722543352
823
+ },
824
+ "eval_ACT_L1": {
825
+ "f1": 0.9555125725338492,
826
+ "number": 503,
827
+ "precision": 0.9303201506591338,
828
+ "recall": 0.9821073558648111
829
+ },
830
+ "eval_ACT_L2": {
831
+ "f1": 0.2962962962962963,
832
+ "number": 16,
833
+ "precision": 0.36363636363636365,
834
+ "recall": 0.25
835
+ },
836
+ "eval_CARDINAL": {
837
+ "f1": 0.9845474613686535,
838
+ "number": 678,
839
+ "precision": 0.9823788546255506,
840
+ "recall": 0.9867256637168141
841
+ },
842
+ "eval_DESC": {
843
+ "f1": 0.3384615384615384,
844
+ "number": 30,
845
+ "precision": 0.3142857142857143,
846
+ "recall": 0.36666666666666664
847
+ },
848
+ "eval_FT": {
849
+ "f1": 0.0,
850
+ "number": 7,
851
+ "precision": 0.0,
852
+ "recall": 0.0
853
+ },
854
+ "eval_LOC": {
855
+ "f1": 0.9481967213114754,
856
+ "number": 761,
857
+ "precision": 0.9463350785340314,
858
+ "recall": 0.9500657030223391
859
+ },
860
+ "eval_PER": {
861
+ "f1": 0.969786293294031,
862
+ "number": 676,
863
+ "precision": 0.9662261380323054,
864
+ "recall": 0.9733727810650887
865
+ },
866
+ "eval_SPAT": {
867
+ "f1": 0.9511494252873564,
868
+ "number": 694,
869
+ "precision": 0.9484240687679083,
870
+ "recall": 0.9538904899135446
871
+ },
872
+ "eval_TITRE": {
873
+ "f1": 0.0,
874
+ "number": 2,
875
+ "precision": 0.0,
876
+ "recall": 0.0
877
+ },
878
+ "eval_TITREH": {
879
+ "f1": 0.7936507936507938,
880
+ "number": 33,
881
+ "precision": 0.8333333333333334,
882
+ "recall": 0.7575757575757576
883
+ },
884
+ "eval_TITREP": {
885
+ "f1": 0.3333333333333333,
886
+ "number": 6,
887
+ "precision": 0.3333333333333333,
888
+ "recall": 0.3333333333333333
889
+ },
890
+ "eval_accuracy": 0.9600101240192357,
891
+ "eval_accuracy-all": 0.9705770690964313,
892
+ "eval_accuracy-das": 0.9731713490255631,
893
+ "eval_accuracy-l1": 0.9653252341179448,
894
+ "eval_accuracy-l2": 0.9758289040749177,
895
+ "eval_f1": 0.9563578367406117,
896
+ "eval_f1-all": 0.9492912465293001,
897
+ "eval_f1-das": 0.959539717891611,
898
+ "eval_f1-l1": 0.9480519480519479,
899
+ "eval_f1-l2": 0.9508853992649516,
900
+ "eval_loss": 0.16017325222492218,
901
+ "eval_precision": 0.9540063638993347,
902
+ "eval_precision-all": 0.945010183299389,
903
+ "eval_precision-das": 0.9563448020717721,
904
+ "eval_precision-l1": 0.9383033419023136,
905
+ "eval_precision-l2": 0.9537533512064343,
906
+ "eval_recall": 0.9587209302325581,
907
+ "eval_recall-all": 0.9536112742219612,
908
+ "eval_recall-das": 0.962756052141527,
909
+ "eval_recall-l1": 0.958005249343832,
910
+ "eval_recall-l2": 0.9480346435709527,
911
+ "eval_runtime": 5.5031,
912
+ "eval_samples_per_second": 122.84,
913
+ "eval_steps_per_second": 7.814,
914
+ "step": 900
915
+ },
916
+ {
917
+ "epoch": 2.62,
918
+ "learning_rate": 8e-05,
919
+ "loss": 0.1449,
920
+ "step": 1000
921
+ },
922
+ {
923
+ "epoch": 2.62,
924
+ "eval_ACT": {
925
+ "f1": 0.9233716475095786,
926
+ "number": 519,
927
+ "precision": 0.9180952380952381,
928
+ "recall": 0.928709055876686
929
+ },
930
+ "eval_ACT_L1": {
931
+ "f1": 0.9397828232971372,
932
+ "number": 503,
933
+ "precision": 0.9333333333333333,
934
+ "recall": 0.9463220675944334
935
+ },
936
+ "eval_ACT_L2": {
937
+ "f1": 0.38709677419354843,
938
+ "number": 16,
939
+ "precision": 0.4,
940
+ "recall": 0.375
941
+ },
942
+ "eval_CARDINAL": {
943
+ "f1": 0.9823788546255506,
944
+ "number": 678,
945
+ "precision": 0.9780701754385965,
946
+ "recall": 0.9867256637168141
947
+ },
948
+ "eval_DESC": {
949
+ "f1": 0.47058823529411764,
950
+ "number": 30,
951
+ "precision": 0.42105263157894735,
952
+ "recall": 0.5333333333333333
953
+ },
954
+ "eval_FT": {
955
+ "f1": 0.0,
956
+ "number": 7,
957
+ "precision": 0.0,
958
+ "recall": 0.0
959
+ },
960
+ "eval_LOC": {
961
+ "f1": 0.9440104166666667,
962
+ "number": 761,
963
+ "precision": 0.9354838709677419,
964
+ "recall": 0.9526938239159002
965
+ },
966
+ "eval_PER": {
967
+ "f1": 0.9690265486725664,
968
+ "number": 676,
969
+ "precision": 0.9661764705882353,
970
+ "recall": 0.9718934911242604
971
+ },
972
+ "eval_SPAT": {
973
+ "f1": 0.946236559139785,
974
+ "number": 694,
975
+ "precision": 0.9415121255349501,
976
+ "recall": 0.9510086455331412
977
+ },
978
+ "eval_TITRE": {
979
+ "f1": 0.0,
980
+ "number": 2,
981
+ "precision": 0.0,
982
+ "recall": 0.0
983
+ },
984
+ "eval_TITREH": {
985
+ "f1": 0.8307692307692308,
986
+ "number": 33,
987
+ "precision": 0.84375,
988
+ "recall": 0.8181818181818182
989
+ },
990
+ "eval_TITREP": {
991
+ "f1": 0.3636363636363636,
992
+ "number": 6,
993
+ "precision": 0.4,
994
+ "recall": 0.3333333333333333
995
+ },
996
+ "eval_accuracy": 0.957605669450772,
997
+ "eval_accuracy-all": 0.9693748418121995,
998
+ "eval_accuracy-das": 0.9710199949379904,
999
+ "eval_accuracy-l1": 0.9641862819539357,
1000
+ "eval_accuracy-l2": 0.9745634016704632,
1001
+ "eval_f1": 0.9503177354130561,
1002
+ "eval_f1-all": 0.9459538416593631,
1003
+ "eval_f1-das": 0.953583364277757,
1004
+ "eval_f1-l1": 0.9436619718309859,
1005
+ "eval_f1-l2": 0.948871181938911,
1006
+ "eval_loss": 0.17344143986701965,
1007
+ "eval_precision": 0.9443168771526981,
1008
+ "eval_precision-all": 0.9412790697674419,
1009
+ "eval_precision-das": 0.9507589781562384,
1010
+ "eval_precision-l1": 0.937791601866252,
1011
+ "eval_precision-l2": 0.9457313037723362,
1012
+ "eval_recall": 0.9563953488372093,
1013
+ "eval_recall-all": 0.9506752789195537,
1014
+ "eval_recall-das": 0.9564245810055866,
1015
+ "eval_recall-l1": 0.9496062992125984,
1016
+ "eval_recall-l2": 0.9520319786808794,
1017
+ "eval_runtime": 5.2868,
1018
+ "eval_samples_per_second": 127.865,
1019
+ "eval_steps_per_second": 8.133,
1020
+ "step": 1000
1021
+ },
1022
+ {
1023
+ "epoch": 2.89,
1024
+ "eval_ACT": {
1025
+ "f1": 0.9411764705882353,
1026
+ "number": 519,
1027
+ "precision": 0.9271028037383178,
1028
+ "recall": 0.9556840077071291
1029
+ },
1030
+ "eval_ACT_L1": {
1031
+ "f1": 0.966403162055336,
1032
+ "number": 503,
1033
+ "precision": 0.9607072691552063,
1034
+ "recall": 0.9721669980119284
1035
+ },
1036
+ "eval_ACT_L2": {
1037
+ "f1": 0.33333333333333337,
1038
+ "number": 16,
1039
+ "precision": 0.2692307692307692,
1040
+ "recall": 0.4375
1041
+ },
1042
+ "eval_CARDINAL": {
1043
+ "f1": 0.9852724594992636,
1044
+ "number": 678,
1045
+ "precision": 0.9838235294117647,
1046
+ "recall": 0.9867256637168141
1047
+ },
1048
+ "eval_DESC": {
1049
+ "f1": 0.4864864864864865,
1050
+ "number": 30,
1051
+ "precision": 0.4090909090909091,
1052
+ "recall": 0.6
1053
+ },
1054
+ "eval_FT": {
1055
+ "f1": 0.18181818181818182,
1056
+ "number": 7,
1057
+ "precision": 0.25,
1058
+ "recall": 0.14285714285714285
1059
+ },
1060
+ "eval_LOC": {
1061
+ "f1": 0.9514435695538058,
1062
+ "number": 761,
1063
+ "precision": 0.9501965923984272,
1064
+ "recall": 0.9526938239159002
1065
+ },
1066
+ "eval_PER": {
1067
+ "f1": 0.9807976366322009,
1068
+ "number": 676,
1069
+ "precision": 0.9793510324483776,
1070
+ "recall": 0.9822485207100592
1071
+ },
1072
+ "eval_SPAT": {
1073
+ "f1": 0.9503239740820734,
1074
+ "number": 694,
1075
+ "precision": 0.9496402877697842,
1076
+ "recall": 0.9510086455331412
1077
+ },
1078
+ "eval_TITRE": {
1079
+ "f1": 0.0,
1080
+ "number": 2,
1081
+ "precision": 0.0,
1082
+ "recall": 0.0
1083
+ },
1084
+ "eval_TITREH": {
1085
+ "f1": 0.819672131147541,
1086
+ "number": 33,
1087
+ "precision": 0.8928571428571429,
1088
+ "recall": 0.7575757575757576
1089
+ },
1090
+ "eval_TITREP": {
1091
+ "f1": 0.26666666666666666,
1092
+ "number": 6,
1093
+ "precision": 0.2222222222222222,
1094
+ "recall": 0.3333333333333333
1095
+ },
1096
+ "eval_accuracy": 0.9530498607947355,
1097
+ "eval_accuracy-all": 0.964819033156163,
1098
+ "eval_accuracy-das": 0.9724120475828905,
1099
+ "eval_accuracy-l1": 0.960389774740572,
1100
+ "eval_accuracy-l2": 0.969248291571754,
1101
+ "eval_f1": 0.9578566256335989,
1102
+ "eval_f1-all": 0.952937737503654,
1103
+ "eval_f1-das": 0.9619029920089203,
1104
+ "eval_f1-l1": 0.9558861915948839,
1105
+ "eval_f1-l2": 0.9491863168382597,
1106
+ "eval_loss": 0.16722118854522705,
1107
+ "eval_precision": 0.9544011544011544,
1108
+ "eval_precision-all": 0.9487776484284052,
1109
+ "eval_precision-das": 0.9599406528189911,
1110
+ "eval_precision-l1": 0.95067497403946,
1111
+ "eval_precision-l2": 0.9463576158940398,
1112
+ "eval_recall": 0.9613372093023256,
1113
+ "eval_recall-all": 0.9571344685848503,
1114
+ "eval_recall-das": 0.9638733705772812,
1115
+ "eval_recall-l1": 0.9611548556430446,
1116
+ "eval_recall-l2": 0.9520319786808794,
1117
+ "eval_runtime": 5.3735,
1118
+ "eval_samples_per_second": 125.803,
1119
+ "eval_steps_per_second": 8.002,
1120
+ "step": 1100
1121
+ },
1122
+ {
1123
+ "epoch": 3.15,
1124
+ "eval_ACT": {
1125
+ "f1": 0.9268755935422602,
1126
+ "number": 519,
1127
+ "precision": 0.9138576779026217,
1128
+ "recall": 0.9402697495183044
1129
+ },
1130
+ "eval_ACT_L1": {
1131
+ "f1": 0.95069033530572,
1132
+ "number": 503,
1133
+ "precision": 0.9432485322896281,
1134
+ "recall": 0.9582504970178927
1135
+ },
1136
+ "eval_ACT_L2": {
1137
+ "f1": 0.30769230769230765,
1138
+ "number": 16,
1139
+ "precision": 0.2608695652173913,
1140
+ "recall": 0.375
1141
+ },
1142
+ "eval_CARDINAL": {
1143
+ "f1": 0.9867647058823529,
1144
+ "number": 678,
1145
+ "precision": 0.9838709677419355,
1146
+ "recall": 0.9896755162241888
1147
+ },
1148
+ "eval_DESC": {
1149
+ "f1": 0.43243243243243246,
1150
+ "number": 30,
1151
+ "precision": 0.36363636363636365,
1152
+ "recall": 0.5333333333333333
1153
+ },
1154
+ "eval_FT": {
1155
+ "f1": 0.2,
1156
+ "number": 7,
1157
+ "precision": 0.3333333333333333,
1158
+ "recall": 0.14285714285714285
1159
+ },
1160
+ "eval_LOC": {
1161
+ "f1": 0.9523809523809524,
1162
+ "number": 761,
1163
+ "precision": 0.9455958549222798,
1164
+ "recall": 0.9592641261498029
1165
+ },
1166
+ "eval_PER": {
1167
+ "f1": 0.9742078113485629,
1168
+ "number": 676,
1169
+ "precision": 0.9706314243759178,
1170
+ "recall": 0.977810650887574
1171
+ },
1172
+ "eval_SPAT": {
1173
+ "f1": 0.9633883704235463,
1174
+ "number": 694,
1175
+ "precision": 0.9599427753934192,
1176
+ "recall": 0.9668587896253602
1177
+ },
1178
+ "eval_TITRE": {
1179
+ "f1": 0.0,
1180
+ "number": 2,
1181
+ "precision": 0.0,
1182
+ "recall": 0.0
1183
+ },
1184
+ "eval_TITREH": {
1185
+ "f1": 0.8059701492537314,
1186
+ "number": 33,
1187
+ "precision": 0.7941176470588235,
1188
+ "recall": 0.8181818181818182
1189
+ },
1190
+ "eval_TITREP": {
1191
+ "f1": 0.5,
1192
+ "number": 6,
1193
+ "precision": 0.5,
1194
+ "recall": 0.5
1195
+ },
1196
+ "eval_accuracy": 0.9558339660845355,
1197
+ "eval_accuracy-all": 0.9667172867628449,
1198
+ "eval_accuracy-das": 0.9746899519109087,
1199
+ "eval_accuracy-l1": 0.9619083776259175,
1200
+ "eval_accuracy-l2": 0.9715261958997722,
1201
+ "eval_f1": 0.9552411204158244,
1202
+ "eval_f1-all": 0.9526308118350095,
1203
+ "eval_f1-das": 0.9595697329376855,
1204
+ "eval_f1-l1": 0.9531249999999999,
1205
+ "eval_f1-l2": 0.9520026481297584,
1206
+ "eval_loss": 0.15443478524684906,
1207
+ "eval_precision": 0.948938611589214,
1208
+ "eval_precision-all": 0.9458755426917511,
1209
+ "eval_precision-das": 0.9556704839305504,
1210
+ "eval_precision-l1": 0.9457364341085271,
1211
+ "eval_precision-l2": 0.9460526315789474,
1212
+ "eval_recall": 0.9616279069767442,
1213
+ "eval_recall-all": 0.9594832648267763,
1214
+ "eval_recall-das": 0.9635009310986965,
1215
+ "eval_recall-l1": 0.9606299212598425,
1216
+ "eval_recall-l2": 0.9580279813457695,
1217
+ "eval_runtime": 5.4706,
1218
+ "eval_samples_per_second": 123.569,
1219
+ "eval_steps_per_second": 7.86,
1220
+ "step": 1200
1221
+ },
1222
+ {
1223
+ "epoch": 3.41,
1224
+ "eval_ACT": {
1225
+ "f1": 0.9435406698564592,
1226
+ "number": 519,
1227
+ "precision": 0.9372623574144486,
1228
+ "recall": 0.9499036608863198
1229
+ },
1230
+ "eval_ACT_L1": {
1231
+ "f1": 0.9560975609756097,
1232
+ "number": 503,
1233
+ "precision": 0.9386973180076629,
1234
+ "recall": 0.974155069582505
1235
+ },
1236
+ "eval_ACT_L2": {
1237
+ "f1": 0.3,
1238
+ "number": 16,
1239
+ "precision": 0.75,
1240
+ "recall": 0.1875
1241
+ },
1242
+ "eval_CARDINAL": {
1243
+ "f1": 0.9882179675994109,
1244
+ "number": 678,
1245
+ "precision": 0.986764705882353,
1246
+ "recall": 0.9896755162241888
1247
+ },
1248
+ "eval_DESC": {
1249
+ "f1": 0.48,
1250
+ "number": 30,
1251
+ "precision": 0.6,
1252
+ "recall": 0.4
1253
+ },
1254
+ "eval_FT": {
1255
+ "f1": 0.2,
1256
+ "number": 7,
1257
+ "precision": 0.3333333333333333,
1258
+ "recall": 0.14285714285714285
1259
+ },
1260
+ "eval_LOC": {
1261
+ "f1": 0.9551656920077972,
1262
+ "number": 761,
1263
+ "precision": 0.9447300771208226,
1264
+ "recall": 0.9658344283837057
1265
+ },
1266
+ "eval_PER": {
1267
+ "f1": 0.9756457564575647,
1268
+ "number": 676,
1269
+ "precision": 0.9734904270986745,
1270
+ "recall": 0.977810650887574
1271
+ },
1272
+ "eval_SPAT": {
1273
+ "f1": 0.9558404558404557,
1274
+ "number": 694,
1275
+ "precision": 0.9450704225352112,
1276
+ "recall": 0.9668587896253602
1277
+ },
1278
+ "eval_TITRE": {
1279
+ "f1": 0.0,
1280
+ "number": 2,
1281
+ "precision": 0.0,
1282
+ "recall": 0.0
1283
+ },
1284
+ "eval_TITREH": {
1285
+ "f1": 0.8307692307692308,
1286
+ "number": 33,
1287
+ "precision": 0.84375,
1288
+ "recall": 0.8181818181818182
1289
+ },
1290
+ "eval_TITREP": {
1291
+ "f1": 0.3333333333333333,
1292
+ "number": 6,
1293
+ "precision": 0.3333333333333333,
1294
+ "recall": 0.3333333333333333
1295
+ },
1296
+ "eval_accuracy": 0.9607694254619084,
1297
+ "eval_accuracy-all": 0.9705770690964313,
1298
+ "eval_accuracy-das": 0.9731713490255631,
1299
+ "eval_accuracy-l1": 0.9668438370032904,
1300
+ "eval_accuracy-l2": 0.9743103011895723,
1301
+ "eval_f1": 0.9611481588866339,
1302
+ "eval_f1-all": 0.9570175438596491,
1303
+ "eval_f1-das": 0.9630866258579114,
1304
+ "eval_f1-l1": 0.9562043795620437,
1305
+ "eval_f1-l2": 0.9580559254327563,
1306
+ "eval_loss": 0.17625676095485687,
1307
+ "eval_precision": 0.9586466165413534,
1308
+ "eval_precision-all": 0.9531158998252767,
1309
+ "eval_precision-das": 0.959349593495935,
1310
+ "eval_precision-l1": 0.949766960124288,
1311
+ "eval_precision-l2": 0.957418496340652,
1312
+ "eval_recall": 0.9636627906976745,
1313
+ "eval_recall-all": 0.96095126247798,
1314
+ "eval_recall-das": 0.966852886405959,
1315
+ "eval_recall-l1": 0.9627296587926509,
1316
+ "eval_recall-l2": 0.9586942038640907,
1317
+ "eval_runtime": 5.5364,
1318
+ "eval_samples_per_second": 122.101,
1319
+ "eval_steps_per_second": 7.767,
1320
+ "step": 1300
1321
+ },
1322
+ {
1323
+ "epoch": 3.67,
1324
+ "eval_ACT": {
1325
+ "f1": 0.9299242424242424,
1326
+ "number": 519,
1327
+ "precision": 0.9143389199255121,
1328
+ "recall": 0.9460500963391136
1329
+ },
1330
+ "eval_ACT_L1": {
1331
+ "f1": 0.9517241379310345,
1332
+ "number": 503,
1333
+ "precision": 0.943359375,
1334
+ "recall": 0.9602385685884692
1335
+ },
1336
+ "eval_ACT_L2": {
1337
+ "f1": 0.39024390243902435,
1338
+ "number": 16,
1339
+ "precision": 0.32,
1340
+ "recall": 0.5
1341
+ },
1342
+ "eval_CARDINAL": {
1343
+ "f1": 0.9830757910228108,
1344
+ "number": 678,
1345
+ "precision": 0.9809104258443465,
1346
+ "recall": 0.9852507374631269
1347
+ },
1348
+ "eval_DESC": {
1349
+ "f1": 0.49315068493150693,
1350
+ "number": 30,
1351
+ "precision": 0.4186046511627907,
1352
+ "recall": 0.6
1353
+ },
1354
+ "eval_FT": {
1355
+ "f1": 0.22222222222222224,
1356
+ "number": 7,
1357
+ "precision": 0.5,
1358
+ "recall": 0.14285714285714285
1359
+ },
1360
+ "eval_LOC": {
1361
+ "f1": 0.9440832249674903,
1362
+ "number": 761,
1363
+ "precision": 0.9343629343629344,
1364
+ "recall": 0.9540078843626807
1365
+ },
1366
+ "eval_PER": {
1367
+ "f1": 0.9756457564575647,
1368
+ "number": 676,
1369
+ "precision": 0.9734904270986745,
1370
+ "recall": 0.977810650887574
1371
+ },
1372
+ "eval_SPAT": {
1373
+ "f1": 0.9613180515759313,
1374
+ "number": 694,
1375
+ "precision": 0.9558404558404558,
1376
+ "recall": 0.9668587896253602
1377
+ },
1378
+ "eval_TITRE": {
1379
+ "f1": 0.0,
1380
+ "number": 2,
1381
+ "precision": 0.0,
1382
+ "recall": 0.0
1383
+ },
1384
+ "eval_TITREH": {
1385
+ "f1": 0.8484848484848486,
1386
+ "number": 33,
1387
+ "precision": 0.8484848484848485,
1388
+ "recall": 0.8484848484848485
1389
+ },
1390
+ "eval_TITREP": {
1391
+ "f1": 0.4,
1392
+ "number": 6,
1393
+ "precision": 0.3333333333333333,
1394
+ "recall": 0.5
1395
+ },
1396
+ "eval_accuracy": 0.9524171095925082,
1397
+ "eval_accuracy-all": 0.9641862819539357,
1398
+ "eval_accuracy-das": 0.9696279422930904,
1399
+ "eval_accuracy-l1": 0.9610225259427992,
1400
+ "eval_accuracy-l2": 0.9673500379650721,
1401
+ "eval_f1": 0.9534112216933507,
1402
+ "eval_f1-all": 0.9512301645072062,
1403
+ "eval_f1-das": 0.9583101723179546,
1404
+ "eval_f1-l1": 0.9544389481905754,
1405
+ "eval_f1-l2": 0.9471598414795244,
1406
+ "eval_loss": 0.17374566197395325,
1407
+ "eval_precision": 0.9461780704265674,
1408
+ "eval_precision-all": 0.9434016748483973,
1409
+ "eval_precision-das": 0.9535398230088495,
1410
+ "eval_precision-l1": 0.9467975206611571,
1411
+ "eval_precision-l2": 0.9390962671905697,
1412
+ "eval_recall": 0.9607558139534884,
1413
+ "eval_recall-all": 0.9591896652965355,
1414
+ "eval_recall-das": 0.9631284916201117,
1415
+ "eval_recall-l1": 0.9622047244094488,
1416
+ "eval_recall-l2": 0.955363091272485,
1417
+ "eval_runtime": 5.5496,
1418
+ "eval_samples_per_second": 121.811,
1419
+ "eval_steps_per_second": 7.748,
1420
+ "step": 1400
1421
+ },
1422
+ {
1423
+ "epoch": 3.94,
1424
+ "learning_rate": 7e-05,
1425
+ "loss": 0.0874,
1426
+ "step": 1500
1427
+ },
1428
+ {
1429
+ "epoch": 3.94,
1430
+ "eval_ACT": {
1431
+ "f1": 0.9458689458689458,
1432
+ "number": 519,
1433
+ "precision": 0.9325842696629213,
1434
+ "recall": 0.9595375722543352
1435
+ },
1436
+ "eval_ACT_L1": {
1437
+ "f1": 0.9647749510763209,
1438
+ "number": 503,
1439
+ "precision": 0.9499036608863198,
1440
+ "recall": 0.9801192842942346
1441
+ },
1442
+ "eval_ACT_L2": {
1443
+ "f1": 0.3225806451612903,
1444
+ "number": 16,
1445
+ "precision": 0.3333333333333333,
1446
+ "recall": 0.3125
1447
+ },
1448
+ "eval_CARDINAL": {
1449
+ "f1": 0.9823788546255506,
1450
+ "number": 678,
1451
+ "precision": 0.9780701754385965,
1452
+ "recall": 0.9867256637168141
1453
+ },
1454
+ "eval_DESC": {
1455
+ "f1": 0.3225806451612903,
1456
+ "number": 30,
1457
+ "precision": 0.3125,
1458
+ "recall": 0.3333333333333333
1459
+ },
1460
+ "eval_FT": {
1461
+ "f1": 0.25,
1462
+ "number": 7,
1463
+ "precision": 0.2222222222222222,
1464
+ "recall": 0.2857142857142857
1465
+ },
1466
+ "eval_LOC": {
1467
+ "f1": 0.954367666232073,
1468
+ "number": 761,
1469
+ "precision": 0.9469598965071151,
1470
+ "recall": 0.961892247043364
1471
+ },
1472
+ "eval_PER": {
1473
+ "f1": 0.9764011799410028,
1474
+ "number": 676,
1475
+ "precision": 0.9735294117647059,
1476
+ "recall": 0.9792899408284024
1477
+ },
1478
+ "eval_SPAT": {
1479
+ "f1": 0.9601706970128022,
1480
+ "number": 694,
1481
+ "precision": 0.9480337078651685,
1482
+ "recall": 0.9726224783861671
1483
+ },
1484
+ "eval_TITRE": {
1485
+ "f1": 0.0,
1486
+ "number": 2,
1487
+ "precision": 0.0,
1488
+ "recall": 0.0
1489
+ },
1490
+ "eval_TITREH": {
1491
+ "f1": 0.8358208955223881,
1492
+ "number": 33,
1493
+ "precision": 0.8235294117647058,
1494
+ "recall": 0.8484848484848485
1495
+ },
1496
+ "eval_TITREP": {
1497
+ "f1": 0.28571428571428575,
1498
+ "number": 6,
1499
+ "precision": 0.25,
1500
+ "recall": 0.3333333333333333
1501
+ },
1502
+ "eval_accuracy": 0.9526702100733991,
1503
+ "eval_accuracy-all": 0.9644393824348266,
1504
+ "eval_accuracy-das": 0.9700075930144267,
1505
+ "eval_accuracy-l1": 0.9602632245001266,
1506
+ "eval_accuracy-l2": 0.9686155403695267,
1507
+ "eval_f1": 0.9585320040456581,
1508
+ "eval_f1-all": 0.9540162980209547,
1509
+ "eval_f1-das": 0.9615384615384616,
1510
+ "eval_f1-l1": 0.9563409563409563,
1511
+ "eval_f1-l2": 0.9510582010582012,
1512
+ "eval_loss": 0.1944604068994522,
1513
+ "eval_precision": 0.9528871014076414,
1514
+ "eval_precision-all": 0.9457587997691864,
1515
+ "eval_precision-das": 0.9548292324641939,
1516
+ "eval_precision-l1": 0.9469891919711786,
1517
+ "eval_precision-l2": 0.9441891004596191,
1518
+ "eval_recall": 0.9642441860465116,
1519
+ "eval_recall-all": 0.9624192601291838,
1520
+ "eval_recall-das": 0.9683426443202979,
1521
+ "eval_recall-l1": 0.9658792650918635,
1522
+ "eval_recall-l2": 0.9580279813457695,
1523
+ "eval_runtime": 5.5418,
1524
+ "eval_samples_per_second": 121.983,
1525
+ "eval_steps_per_second": 7.759,
1526
+ "step": 1500
1527
+ },
1528
+ {
1529
+ "epoch": 4.2,
1530
+ "eval_ACT": {
1531
+ "f1": 0.9579349904397705,
1532
+ "number": 519,
1533
+ "precision": 0.9506641366223909,
1534
+ "recall": 0.9653179190751445
1535
+ },
1536
+ "eval_ACT_L1": {
1537
+ "f1": 0.973293768545994,
1538
+ "number": 503,
1539
+ "precision": 0.968503937007874,
1540
+ "recall": 0.9781312127236581
1541
+ },
1542
+ "eval_ACT_L2": {
1543
+ "f1": 0.5142857142857142,
1544
+ "number": 16,
1545
+ "precision": 0.47368421052631576,
1546
+ "recall": 0.5625
1547
+ },
1548
+ "eval_CARDINAL": {
1549
+ "f1": 0.9801031687546058,
1550
+ "number": 678,
1551
+ "precision": 0.979381443298969,
1552
+ "recall": 0.9808259587020649
1553
+ },
1554
+ "eval_DESC": {
1555
+ "f1": 0.5901639344262295,
1556
+ "number": 30,
1557
+ "precision": 0.5806451612903226,
1558
+ "recall": 0.6
1559
+ },
1560
+ "eval_FT": {
1561
+ "f1": 0.30769230769230765,
1562
+ "number": 7,
1563
+ "precision": 0.3333333333333333,
1564
+ "recall": 0.2857142857142857
1565
+ },
1566
+ "eval_LOC": {
1567
+ "f1": 0.9542483660130721,
1568
+ "number": 761,
1569
+ "precision": 0.9492847854356307,
1570
+ "recall": 0.9592641261498029
1571
+ },
1572
+ "eval_PER": {
1573
+ "f1": 0.9793510324483775,
1574
+ "number": 676,
1575
+ "precision": 0.9764705882352941,
1576
+ "recall": 0.9822485207100592
1577
+ },
1578
+ "eval_SPAT": {
1579
+ "f1": 0.9649749821300929,
1580
+ "number": 694,
1581
+ "precision": 0.9574468085106383,
1582
+ "recall": 0.9726224783861671
1583
+ },
1584
+ "eval_TITRE": {
1585
+ "f1": 0.0,
1586
+ "number": 2,
1587
+ "precision": 0.0,
1588
+ "recall": 0.0
1589
+ },
1590
+ "eval_TITREH": {
1591
+ "f1": 0.8064516129032258,
1592
+ "number": 33,
1593
+ "precision": 0.8620689655172413,
1594
+ "recall": 0.7575757575757576
1595
+ },
1596
+ "eval_TITREP": {
1597
+ "f1": 0.3333333333333333,
1598
+ "number": 6,
1599
+ "precision": 0.3333333333333333,
1600
+ "recall": 0.3333333333333333
1601
+ },
1602
+ "eval_accuracy": 0.9616552771450265,
1603
+ "eval_accuracy-all": 0.9713996456593268,
1604
+ "eval_accuracy-das": 0.9751961528726905,
1605
+ "eval_accuracy-l1": 0.9691217413313086,
1606
+ "eval_accuracy-l2": 0.973677549987345,
1607
+ "eval_f1": 0.9617391304347827,
1608
+ "eval_f1-all": 0.9599298040362678,
1609
+ "eval_f1-das": 0.9646971386101821,
1610
+ "eval_f1-l1": 0.9657874118568817,
1611
+ "eval_f1-l2": 0.9524759056164839,
1612
+ "eval_loss": 0.18698786199092865,
1613
+ "eval_precision": 0.9589595375722544,
1614
+ "eval_precision-all": 0.9562937062937062,
1615
+ "eval_precision-das": 0.9625509825732295,
1616
+ "eval_precision-l1": 0.9610187110187111,
1617
+ "eval_precision-l2": 0.9502652519893899,
1618
+ "eval_recall": 0.9645348837209302,
1619
+ "eval_recall-all": 0.9635936582501468,
1620
+ "eval_recall-das": 0.966852886405959,
1621
+ "eval_recall-l1": 0.9706036745406824,
1622
+ "eval_recall-l2": 0.9546968687541639,
1623
+ "eval_runtime": 5.912,
1624
+ "eval_samples_per_second": 114.344,
1625
+ "eval_steps_per_second": 7.273,
1626
+ "step": 1600
1627
+ },
1628
+ {
1629
+ "epoch": 4.46,
1630
+ "eval_ACT": {
1631
+ "f1": 0.9420702754036088,
1632
+ "number": 519,
1633
+ "precision": 0.9288389513108615,
1634
+ "recall": 0.9556840077071291
1635
+ },
1636
+ "eval_ACT_L1": {
1637
+ "f1": 0.9663366336633663,
1638
+ "number": 503,
1639
+ "precision": 0.9625246548323472,
1640
+ "recall": 0.9701789264413518
1641
+ },
1642
+ "eval_ACT_L2": {
1643
+ "f1": 0.37209302325581395,
1644
+ "number": 16,
1645
+ "precision": 0.2962962962962963,
1646
+ "recall": 0.5
1647
+ },
1648
+ "eval_CARDINAL": {
1649
+ "f1": 0.9823269513991163,
1650
+ "number": 678,
1651
+ "precision": 0.9808823529411764,
1652
+ "recall": 0.9837758112094396
1653
+ },
1654
+ "eval_DESC": {
1655
+ "f1": 0.4927536231884058,
1656
+ "number": 30,
1657
+ "precision": 0.4358974358974359,
1658
+ "recall": 0.5666666666666667
1659
+ },
1660
+ "eval_FT": {
1661
+ "f1": 0.4,
1662
+ "number": 7,
1663
+ "precision": 0.6666666666666666,
1664
+ "recall": 0.2857142857142857
1665
+ },
1666
+ "eval_LOC": {
1667
+ "f1": 0.9489528795811519,
1668
+ "number": 761,
1669
+ "precision": 0.9452411994784876,
1670
+ "recall": 0.9526938239159002
1671
+ },
1672
+ "eval_PER": {
1673
+ "f1": 0.9778434268833086,
1674
+ "number": 676,
1675
+ "precision": 0.976401179941003,
1676
+ "recall": 0.9792899408284024
1677
+ },
1678
+ "eval_SPAT": {
1679
+ "f1": 0.9577060931899642,
1680
+ "number": 694,
1681
+ "precision": 0.9529243937232525,
1682
+ "recall": 0.962536023054755
1683
+ },
1684
+ "eval_TITRE": {
1685
+ "f1": 0.0,
1686
+ "number": 2,
1687
+ "precision": 0.0,
1688
+ "recall": 0.0
1689
+ },
1690
+ "eval_TITREH": {
1691
+ "f1": 0.8405797101449276,
1692
+ "number": 33,
1693
+ "precision": 0.8055555555555556,
1694
+ "recall": 0.8787878787878788
1695
+ },
1696
+ "eval_TITREP": {
1697
+ "f1": 0.3333333333333333,
1698
+ "number": 6,
1699
+ "precision": 0.3333333333333333,
1700
+ "recall": 0.3333333333333333
1701
+ },
1702
+ "eval_accuracy": 0.9578587699316629,
1703
+ "eval_accuracy-all": 0.9679827891672994,
1704
+ "eval_accuracy-das": 0.9738041002277904,
1705
+ "eval_accuracy-l1": 0.9646924829157175,
1706
+ "eval_accuracy-l2": 0.9712730954188813,
1707
+ "eval_f1": 0.9567731675581899,
1708
+ "eval_f1-all": 0.9541605839416059,
1709
+ "eval_f1-das": 0.962109955423477,
1710
+ "eval_f1-l1": 0.9582245430809399,
1711
+ "eval_f1-l2": 0.9490066225165563,
1712
+ "eval_loss": 0.1859915405511856,
1713
+ "eval_precision": 0.9516824849007766,
1714
+ "eval_precision-all": 0.9488966318234611,
1715
+ "eval_precision-das": 0.9596146721007781,
1716
+ "eval_precision-l1": 0.9532467532467532,
1717
+ "eval_precision-l2": 0.9433838051349572,
1718
+ "eval_recall": 0.9619186046511627,
1719
+ "eval_recall-all": 0.9594832648267763,
1720
+ "eval_recall-das": 0.9646182495344506,
1721
+ "eval_recall-l1": 0.963254593175853,
1722
+ "eval_recall-l2": 0.9546968687541639,
1723
+ "eval_runtime": 5.5062,
1724
+ "eval_samples_per_second": 122.771,
1725
+ "eval_steps_per_second": 7.809,
1726
+ "step": 1700
1727
+ },
1728
+ {
1729
+ "epoch": 4.72,
1730
+ "eval_ACT": {
1731
+ "f1": 0.9666348903717827,
1732
+ "number": 519,
1733
+ "precision": 0.9566037735849057,
1734
+ "recall": 0.976878612716763
1735
+ },
1736
+ "eval_ACT_L1": {
1737
+ "f1": 0.9764705882352941,
1738
+ "number": 503,
1739
+ "precision": 0.9632495164410058,
1740
+ "recall": 0.9900596421471173
1741
+ },
1742
+ "eval_ACT_L2": {
1743
+ "f1": 0.6206896551724138,
1744
+ "number": 16,
1745
+ "precision": 0.6923076923076923,
1746
+ "recall": 0.5625
1747
+ },
1748
+ "eval_CARDINAL": {
1749
+ "f1": 0.9852941176470589,
1750
+ "number": 678,
1751
+ "precision": 0.9824046920821115,
1752
+ "recall": 0.9882005899705014
1753
+ },
1754
+ "eval_DESC": {
1755
+ "f1": 0.5666666666666667,
1756
+ "number": 30,
1757
+ "precision": 0.5666666666666667,
1758
+ "recall": 0.5666666666666667
1759
+ },
1760
+ "eval_FT": {
1761
+ "f1": 0.2,
1762
+ "number": 7,
1763
+ "precision": 0.3333333333333333,
1764
+ "recall": 0.14285714285714285
1765
+ },
1766
+ "eval_LOC": {
1767
+ "f1": 0.9542483660130721,
1768
+ "number": 761,
1769
+ "precision": 0.9492847854356307,
1770
+ "recall": 0.9592641261498029
1771
+ },
1772
+ "eval_PER": {
1773
+ "f1": 0.9793205317577548,
1774
+ "number": 676,
1775
+ "precision": 0.9778761061946902,
1776
+ "recall": 0.9807692307692307
1777
+ },
1778
+ "eval_SPAT": {
1779
+ "f1": 0.9547738693467337,
1780
+ "number": 694,
1781
+ "precision": 0.9513590844062947,
1782
+ "recall": 0.9582132564841499
1783
+ },
1784
+ "eval_TITRE": {
1785
+ "f1": 0.0,
1786
+ "number": 2,
1787
+ "precision": 0.0,
1788
+ "recall": 0.0
1789
+ },
1790
+ "eval_TITREH": {
1791
+ "f1": 0.8823529411764706,
1792
+ "number": 33,
1793
+ "precision": 0.8571428571428571,
1794
+ "recall": 0.9090909090909091
1795
+ },
1796
+ "eval_TITREP": {
1797
+ "f1": 0.4615384615384615,
1798
+ "number": 6,
1799
+ "precision": 0.42857142857142855,
1800
+ "recall": 0.5
1801
+ },
1802
+ "eval_accuracy": 0.9643128321943811,
1803
+ "eval_accuracy-all": 0.974120475828904,
1804
+ "eval_accuracy-das": 0.9757023538344722,
1805
+ "eval_accuracy-l1": 0.9711465451784358,
1806
+ "eval_accuracy-l2": 0.9770944064793723,
1807
+ "eval_f1": 0.9649580075296842,
1808
+ "eval_f1-all": 0.9609592045620704,
1809
+ "eval_f1-das": 0.968651456130588,
1810
+ "eval_f1-l1": 0.9626534343170541,
1811
+ "eval_f1-l2": 0.9588039867109635,
1812
+ "eval_loss": 0.16283993422985077,
1813
+ "eval_precision": 0.96133871898442,
1814
+ "eval_precision-all": 0.9571803087678415,
1815
+ "eval_precision-das": 0.9648928307464892,
1816
+ "eval_precision-l1": 0.9579002079002079,
1817
+ "eval_precision-l2": 0.9562624254473161,
1818
+ "eval_recall": 0.9686046511627907,
1819
+ "eval_recall-all": 0.9647680563711099,
1820
+ "eval_recall-das": 0.97243947858473,
1821
+ "eval_recall-l1": 0.9674540682414698,
1822
+ "eval_recall-l2": 0.9613590939373751,
1823
+ "eval_runtime": 5.4991,
1824
+ "eval_samples_per_second": 122.928,
1825
+ "eval_steps_per_second": 7.819,
1826
+ "step": 1800
1827
+ },
1828
+ {
1829
+ "epoch": 4.99,
1830
+ "eval_ACT": {
1831
+ "f1": 0.941398865784499,
1832
+ "number": 519,
1833
+ "precision": 0.9239332096474954,
1834
+ "recall": 0.9595375722543352
1835
+ },
1836
+ "eval_ACT_L1": {
1837
+ "f1": 0.9655172413793103,
1838
+ "number": 503,
1839
+ "precision": 0.95703125,
1840
+ "recall": 0.974155069582505
1841
+ },
1842
+ "eval_ACT_L2": {
1843
+ "f1": 0.37209302325581395,
1844
+ "number": 16,
1845
+ "precision": 0.2962962962962963,
1846
+ "recall": 0.5
1847
+ },
1848
+ "eval_CARDINAL": {
1849
+ "f1": 0.9852507374631269,
1850
+ "number": 678,
1851
+ "precision": 0.9852507374631269,
1852
+ "recall": 0.9852507374631269
1853
+ },
1854
+ "eval_DESC": {
1855
+ "f1": 0.49315068493150693,
1856
+ "number": 30,
1857
+ "precision": 0.4186046511627907,
1858
+ "recall": 0.6
1859
+ },
1860
+ "eval_FT": {
1861
+ "f1": 0.3333333333333333,
1862
+ "number": 7,
1863
+ "precision": 0.4,
1864
+ "recall": 0.2857142857142857
1865
+ },
1866
+ "eval_LOC": {
1867
+ "f1": 0.9614126880313931,
1868
+ "number": 761,
1869
+ "precision": 0.95703125,
1870
+ "recall": 0.9658344283837057
1871
+ },
1872
+ "eval_PER": {
1873
+ "f1": 0.9815225424981524,
1874
+ "number": 676,
1875
+ "precision": 0.9807976366322009,
1876
+ "recall": 0.9822485207100592
1877
+ },
1878
+ "eval_SPAT": {
1879
+ "f1": 0.9555236728837877,
1880
+ "number": 694,
1881
+ "precision": 0.9514285714285714,
1882
+ "recall": 0.9596541786743515
1883
+ },
1884
+ "eval_TITRE": {
1885
+ "f1": 0.0,
1886
+ "number": 2,
1887
+ "precision": 0.0,
1888
+ "recall": 0.0
1889
+ },
1890
+ "eval_TITREH": {
1891
+ "f1": 0.923076923076923,
1892
+ "number": 33,
1893
+ "precision": 0.9375,
1894
+ "recall": 0.9090909090909091
1895
+ },
1896
+ "eval_TITREP": {
1897
+ "f1": 0.28571428571428575,
1898
+ "number": 6,
1899
+ "precision": 0.25,
1900
+ "recall": 0.3333333333333333
1901
+ },
1902
+ "eval_accuracy": 0.960389774740572,
1903
+ "eval_accuracy-all": 0.9701341432548722,
1904
+ "eval_accuracy-das": 0.9759554543153632,
1905
+ "eval_accuracy-l1": 0.9659579853201721,
1906
+ "eval_accuracy-l2": 0.9743103011895723,
1907
+ "eval_f1": 0.9632523148148149,
1908
+ "eval_f1-all": 0.9577012835472578,
1909
+ "eval_f1-das": 0.9673226884515411,
1910
+ "eval_f1-l1": 0.9580401355225436,
1911
+ "eval_f1-l2": 0.9572706194104007,
1912
+ "eval_loss": 0.16160346567630768,
1913
+ "eval_precision": 0.9588133640552995,
1914
+ "eval_precision-all": 0.9515942028985507,
1915
+ "eval_precision-das": 0.9644576082932247,
1916
+ "eval_precision-l1": 0.9513457556935818,
1917
+ "eval_precision-l2": 0.9519104084321476,
1918
+ "eval_recall": 0.9677325581395348,
1919
+ "eval_recall-all": 0.9638872577803875,
1920
+ "eval_recall-das": 0.9702048417132216,
1921
+ "eval_recall-l1": 0.9648293963254593,
1922
+ "eval_recall-l2": 0.9626915389740173,
1923
+ "eval_runtime": 5.4066,
1924
+ "eval_samples_per_second": 125.032,
1925
+ "eval_steps_per_second": 7.953,
1926
+ "step": 1900
1927
+ },
1928
+ {
1929
+ "epoch": 5.25,
1930
+ "learning_rate": 6e-05,
1931
+ "loss": 0.0496,
1932
+ "step": 2000
1933
+ },
1934
+ {
1935
+ "epoch": 5.25,
1936
+ "eval_ACT": {
1937
+ "f1": 0.9627507163323782,
1938
+ "number": 519,
1939
+ "precision": 0.9545454545454546,
1940
+ "recall": 0.9710982658959537
1941
+ },
1942
+ "eval_ACT_L1": {
1943
+ "f1": 0.9735034347399412,
1944
+ "number": 503,
1945
+ "precision": 0.9612403100775194,
1946
+ "recall": 0.9860834990059643
1947
+ },
1948
+ "eval_ACT_L2": {
1949
+ "f1": 0.5714285714285715,
1950
+ "number": 16,
1951
+ "precision": 0.6666666666666666,
1952
+ "recall": 0.5
1953
+ },
1954
+ "eval_CARDINAL": {
1955
+ "f1": 0.9852507374631269,
1956
+ "number": 678,
1957
+ "precision": 0.9852507374631269,
1958
+ "recall": 0.9852507374631269
1959
+ },
1960
+ "eval_DESC": {
1961
+ "f1": 0.5901639344262295,
1962
+ "number": 30,
1963
+ "precision": 0.5806451612903226,
1964
+ "recall": 0.6
1965
+ },
1966
+ "eval_FT": {
1967
+ "f1": 0.4615384615384615,
1968
+ "number": 7,
1969
+ "precision": 0.5,
1970
+ "recall": 0.42857142857142855
1971
+ },
1972
+ "eval_LOC": {
1973
+ "f1": 0.9574328749181402,
1974
+ "number": 761,
1975
+ "precision": 0.9543080939947781,
1976
+ "recall": 0.9605781865965834
1977
+ },
1978
+ "eval_PER": {
1979
+ "f1": 0.9785344189489268,
1980
+ "number": 676,
1981
+ "precision": 0.9792592592592593,
1982
+ "recall": 0.977810650887574
1983
+ },
1984
+ "eval_SPAT": {
1985
+ "f1": 0.9619526202440775,
1986
+ "number": 694,
1987
+ "precision": 0.9585121602288984,
1988
+ "recall": 0.9654178674351584
1989
+ },
1990
+ "eval_TITRE": {
1991
+ "f1": 0.0,
1992
+ "number": 2,
1993
+ "precision": 0.0,
1994
+ "recall": 0.0
1995
+ },
1996
+ "eval_TITREH": {
1997
+ "f1": 0.9206349206349207,
1998
+ "number": 33,
1999
+ "precision": 0.9666666666666667,
2000
+ "recall": 0.8787878787878788
2001
+ },
2002
+ "eval_TITREP": {
2003
+ "f1": 0.4615384615384615,
2004
+ "number": 6,
2005
+ "precision": 0.42857142857142855,
2006
+ "recall": 0.5
2007
+ },
2008
+ "eval_accuracy": 0.9693748418121995,
2009
+ "eval_accuracy-all": 0.9779169830422678,
2010
+ "eval_accuracy-das": 0.9788661098456087,
2011
+ "eval_accuracy-l1": 0.9744368514300177,
2012
+ "eval_accuracy-l2": 0.9813971146545178,
2013
+ "eval_f1": 0.9663670629167874,
2014
+ "eval_f1-all": 0.9630823322590096,
2015
+ "eval_f1-das": 0.9693137437232657,
2016
+ "eval_f1-l1": 0.964453737584945,
2017
+ "eval_f1-l2": 0.9613333333333334,
2018
+ "eval_loss": 0.1529596447944641,
2019
+ "eval_precision": 0.9638519375361481,
2020
+ "eval_precision-all": 0.9611111111111111,
2021
+ "eval_precision-das": 0.9680534918276374,
2022
+ "eval_precision-l1": 0.9604372722540343,
2023
+ "eval_precision-l2": 0.961974649766511,
2024
+ "eval_recall": 0.9688953488372093,
2025
+ "eval_recall-all": 0.9650616559013505,
2026
+ "eval_recall-das": 0.9705772811918063,
2027
+ "eval_recall-l1": 0.968503937007874,
2028
+ "eval_recall-l2": 0.960692871419054,
2029
+ "eval_runtime": 5.5475,
2030
+ "eval_samples_per_second": 121.856,
2031
+ "eval_steps_per_second": 7.751,
2032
+ "step": 2000
2033
+ }
2034
+ ],
2035
+ "max_steps": 5000,
2036
+ "num_train_epochs": 14,
2037
+ "total_flos": 813927239246016.0,
2038
+ "trial_name": null,
2039
+ "trial_params": null
2040
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e42ebb395a22e62137cbb6f3cbb589d95f46a8d0305621db1cd56d54757ac655
3
+ size 3503