nlpso committed on
Commit
ee35760
·
1 Parent(s): 0d57904

Load model and tokenizer

Browse files
config.json ADDED
@@ -0,0 +1,91 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "Jean-Baptiste/camembert-ner",
3
+ "architectures": [
4
+ "CamembertForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 5,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 6,
10
+ "gradient_checkpointing": false,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "O+O",
16
+ "1": "I-b_PER+O",
17
+ "2": "I-i_PER+O",
18
+ "3": "I-b_PER+b_TITREH",
19
+ "4": "I-i_PER+b_TITREH",
20
+ "5": "I-i_PER+i_TITREH",
21
+ "6": "I-b_ACT+O",
22
+ "7": "I-i_ACT+O",
23
+ "8": "I-b_DESC+O",
24
+ "9": "I-i_DESC+O",
25
+ "10": "I-b_DESC+b_ACT",
26
+ "11": "I-i_DESC+b_ACT",
27
+ "12": "I-i_DESC+i_ACT",
28
+ "13": "I-b_DESC+b_TITREP",
29
+ "14": "I-i_DESC+b_TITREP",
30
+ "15": "I-i_DESC+i_TITREP",
31
+ "16": "I-b_SPAT+O",
32
+ "17": "I-i_SPAT+O",
33
+ "18": "I-b_SPAT+b_LOC",
34
+ "19": "I-i_SPAT+b_LOC",
35
+ "20": "I-i_SPAT+i_LOC",
36
+ "21": "I-b_SPAT+b_CARDINAL",
37
+ "22": "I-i_SPAT+b_CARDINAL",
38
+ "23": "I-i_SPAT+i_CARDINAL",
39
+ "24": "I-b_SPAT+b_FT",
40
+ "25": "I-i_SPAT+b_FT",
41
+ "26": "I-i_SPAT+i_FT",
42
+ "27": "I-b_TITRE+O",
43
+ "28": "I-i_TITRE+O"
44
+ },
45
+ "initializer_range": 0.02,
46
+ "intermediate_size": 3072,
47
+ "label2id": {
48
+ "I-b_ACT+O": 6,
49
+ "I-b_DESC+O": 8,
50
+ "I-b_DESC+b_ACT": 10,
51
+ "I-b_DESC+b_TITREP": 13,
52
+ "I-b_PER+O": 1,
53
+ "I-b_PER+b_TITREH": 3,
54
+ "I-b_SPAT+O": 16,
55
+ "I-b_SPAT+b_CARDINAL": 21,
56
+ "I-b_SPAT+b_FT": 24,
57
+ "I-b_SPAT+b_LOC": 18,
58
+ "I-b_TITRE+O": 27,
59
+ "I-i_ACT+O": 7,
60
+ "I-i_DESC+O": 9,
61
+ "I-i_DESC+b_ACT": 11,
62
+ "I-i_DESC+b_TITREP": 14,
63
+ "I-i_DESC+i_ACT": 12,
64
+ "I-i_DESC+i_TITREP": 15,
65
+ "I-i_PER+O": 2,
66
+ "I-i_PER+b_TITREH": 4,
67
+ "I-i_PER+i_TITREH": 5,
68
+ "I-i_SPAT+O": 17,
69
+ "I-i_SPAT+b_CARDINAL": 22,
70
+ "I-i_SPAT+b_FT": 25,
71
+ "I-i_SPAT+b_LOC": 19,
72
+ "I-i_SPAT+i_CARDINAL": 23,
73
+ "I-i_SPAT+i_FT": 26,
74
+ "I-i_SPAT+i_LOC": 20,
75
+ "I-i_TITRE+O": 28,
76
+ "O+O": 0
77
+ },
78
+ "layer_norm_eps": 1e-05,
79
+ "max_position_embeddings": 514,
80
+ "model_type": "camembert",
81
+ "num_attention_heads": 12,
82
+ "num_hidden_layers": 12,
83
+ "output_past": true,
84
+ "pad_token_id": 1,
85
+ "position_embedding_type": "absolute",
86
+ "torch_dtype": "float32",
87
+ "transformers_version": "4.25.1",
88
+ "type_vocab_size": 1,
89
+ "use_cache": true,
90
+ "vocab_size": 32005
91
+ }
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f8fb1deeb84dc50b36070f9f373acd22dde3493f6a8fe6ab21569a2cc73c896
3
+ size 880544613
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13434bc0ac6e292a14c84897b392d5ac8b9fe987d426f8546adb86ed6c53339b
3
+ size 440285681
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c091f2db044c97f5da711a730d9a1fe52743711d448258b57b8e857082016b9b
3
+ size 14503
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e026fb7cb5555507d8791aa654af1e3922b1146f7bb21228d191cc76d86c51e1
3
+ size 623
sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:988bc5a00281c6d210a5d34bd143d0363741a432fefe741bf71e61b1869d4314
3
+ size 810912
special_tokens_map.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "mask_token": "<mask>",
10
+ "pad_token": "<pad>",
11
+ "sep_token": "</s>",
12
+ "unk_token": "<unk>"
13
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "mask_token": {
10
+ "__type": "AddedToken",
11
+ "content": "<mask>",
12
+ "lstrip": true,
13
+ "normalized": true,
14
+ "rstrip": false,
15
+ "single_word": false
16
+ },
17
+ "model_max_length": 512,
18
+ "name_or_path": "Jean-Baptiste/camembert-ner",
19
+ "pad_token": "<pad>",
20
+ "sep_token": "</s>",
21
+ "sp_model_kwargs": {},
22
+ "special_tokens_map_file": "/lrde/home2/stual/.cache/huggingface/hub/models--Jean-Baptiste--camembert-ner/snapshots/9f8b2203b6a2daba1ad279ac2adb822518caa167/special_tokens_map.json",
23
+ "tokenizer_class": "CamembertTokenizer",
24
+ "unk_token": "<unk>"
25
+ }
trainer_state.json ADDED
@@ -0,0 +1,1594 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9703461495095276,
3
+ "best_model_checkpoint": "/work/stual/res_ICDAR/method_3/tmp/312-camembert-ner-hierarchical-loss-iob2/checkpoint-1500",
4
+ "epoch": 3.937007874015748,
5
+ "global_step": 1500,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.26,
12
+ "eval_ACT": {
13
+ "f1": 0.8519855595667871,
14
+ "number": 519,
15
+ "precision": 0.801358234295416,
16
+ "recall": 0.9094412331406551
17
+ },
18
+ "eval_ACT_L1": {
19
+ "f1": 0.8644688644688645,
20
+ "number": 503,
21
+ "precision": 0.801358234295416,
22
+ "recall": 0.9383697813121272
23
+ },
24
+ "eval_ACT_L2": {
25
+ "f1": 0.0,
26
+ "number": 16,
27
+ "precision": 0.0,
28
+ "recall": 0.0
29
+ },
30
+ "eval_CARDINAL": {
31
+ "f1": 0.9751461988304094,
32
+ "number": 678,
33
+ "precision": 0.9666666666666667,
34
+ "recall": 0.9837758112094396
35
+ },
36
+ "eval_DESC": {
37
+ "f1": 0.0,
38
+ "number": 30,
39
+ "precision": 0.0,
40
+ "recall": 0.0
41
+ },
42
+ "eval_FT": {
43
+ "f1": 0.0,
44
+ "number": 7,
45
+ "precision": 0.0,
46
+ "recall": 0.0
47
+ },
48
+ "eval_LOC": {
49
+ "f1": 0.9278215223097113,
50
+ "number": 762,
51
+ "precision": 0.9278215223097113,
52
+ "recall": 0.9278215223097113
53
+ },
54
+ "eval_PER": {
55
+ "f1": 0.9360764144011756,
56
+ "number": 676,
57
+ "precision": 0.92992700729927,
58
+ "recall": 0.9423076923076923
59
+ },
60
+ "eval_SPAT": {
61
+ "f1": 0.89484827099506,
62
+ "number": 694,
63
+ "precision": 0.8769017980636238,
64
+ "recall": 0.9135446685878963
65
+ },
66
+ "eval_TITRE": {
67
+ "f1": 0.0,
68
+ "number": 2,
69
+ "precision": 0.0,
70
+ "recall": 0.0
71
+ },
72
+ "eval_TITREH": {
73
+ "f1": 0.0,
74
+ "number": 33,
75
+ "precision": 0.0,
76
+ "recall": 0.0
77
+ },
78
+ "eval_TITREP": {
79
+ "f1": 0.0,
80
+ "number": 6,
81
+ "precision": 0.0,
82
+ "recall": 0.0
83
+ },
84
+ "eval_accuracy": 0.9289970208540218,
85
+ "eval_accuracy-all": 0.9515888778550149,
86
+ "eval_accuracy-das": 0.9478649453823237,
87
+ "eval_accuracy-l1": 0.9366931479642503,
88
+ "eval_accuracy-l1l2": 0.9298659384309831,
89
+ "eval_accuracy-l2": 0.9664846077457795,
90
+ "eval_f1": 0.9287086204948594,
91
+ "eval_f1-all": 0.9092765460910152,
92
+ "eval_f1-das": 0.9235337787676319,
93
+ "eval_f1-l1": 0.8933880061506919,
94
+ "eval_f1-l1l2": 0.9203233256351039,
95
+ "eval_f1-l2": 0.930264048747461,
96
+ "eval_loss": 0.5439923405647278,
97
+ "eval_precision": 0.9307065217391305,
98
+ "eval_precision-all": 0.9037402145549435,
99
+ "eval_precision-das": 0.9201183431952663,
100
+ "eval_precision-l1": 0.8728092138207311,
101
+ "eval_precision-l1l2": 0.9179383818024762,
102
+ "eval_precision-l2": 0.9462809917355371,
103
+ "eval_recall": 0.9267192784667418,
104
+ "eval_recall-all": 0.9148811270912827,
105
+ "eval_recall-das": 0.9269746646795827,
106
+ "eval_recall-l1": 0.9149606299212598,
107
+ "eval_recall-l1l2": 0.9227206946454414,
108
+ "eval_recall-l2": 0.914780292942743,
109
+ "eval_runtime": 6.6142,
110
+ "eval_samples_per_second": 102.205,
111
+ "eval_steps_per_second": 6.501,
112
+ "step": 100
113
+ },
114
+ {
115
+ "epoch": 0.52,
116
+ "eval_ACT": {
117
+ "f1": 0.9038817005545287,
118
+ "number": 519,
119
+ "precision": 0.8685612788632326,
120
+ "recall": 0.9421965317919075
121
+ },
122
+ "eval_ACT_L1": {
123
+ "f1": 0.9174484052532833,
124
+ "number": 503,
125
+ "precision": 0.8685612788632326,
126
+ "recall": 0.9721669980119284
127
+ },
128
+ "eval_ACT_L2": {
129
+ "f1": 0.0,
130
+ "number": 16,
131
+ "precision": 0.0,
132
+ "recall": 0.0
133
+ },
134
+ "eval_CARDINAL": {
135
+ "f1": 0.9772893772893773,
136
+ "number": 678,
137
+ "precision": 0.9708879184861717,
138
+ "recall": 0.9837758112094396
139
+ },
140
+ "eval_DESC": {
141
+ "f1": 0.0,
142
+ "number": 30,
143
+ "precision": 0.0,
144
+ "recall": 0.0
145
+ },
146
+ "eval_FT": {
147
+ "f1": 0.0,
148
+ "number": 7,
149
+ "precision": 0.0,
150
+ "recall": 0.0
151
+ },
152
+ "eval_LOC": {
153
+ "f1": 0.946959896507115,
154
+ "number": 762,
155
+ "precision": 0.9336734693877551,
156
+ "recall": 0.9606299212598425
157
+ },
158
+ "eval_PER": {
159
+ "f1": 0.9405722670579605,
160
+ "number": 676,
161
+ "precision": 0.9330422125181951,
162
+ "recall": 0.9482248520710059
163
+ },
164
+ "eval_SPAT": {
165
+ "f1": 0.9542857142857143,
166
+ "number": 694,
167
+ "precision": 0.9461756373937678,
168
+ "recall": 0.962536023054755
169
+ },
170
+ "eval_TITRE": {
171
+ "f1": 0.0,
172
+ "number": 2,
173
+ "precision": 0.0,
174
+ "recall": 0.0
175
+ },
176
+ "eval_TITREH": {
177
+ "f1": 0.0,
178
+ "number": 33,
179
+ "precision": 0.0,
180
+ "recall": 0.0
181
+ },
182
+ "eval_TITREP": {
183
+ "f1": 0.0,
184
+ "number": 6,
185
+ "precision": 0.0,
186
+ "recall": 0.0
187
+ },
188
+ "eval_accuracy": 0.9369414101290964,
189
+ "eval_accuracy-all": 0.9571747765640516,
190
+ "eval_accuracy-das": 0.9559334657398213,
191
+ "eval_accuracy-l1": 0.9469960278053625,
192
+ "eval_accuracy-l1l2": 0.9374379344587885,
193
+ "eval_accuracy-l2": 0.9673535253227408,
194
+ "eval_f1": 0.9402732302133906,
195
+ "eval_f1-all": 0.9352054994880795,
196
+ "eval_f1-das": 0.9358070500927643,
197
+ "eval_f1-l1": 0.9306418219461698,
198
+ "eval_f1-l1l2": 0.9345255263916931,
199
+ "eval_f1-l2": 0.9411368987554658,
200
+ "eval_loss": 0.35665348172187805,
201
+ "eval_precision": 0.9416553595658074,
202
+ "eval_precision-all": 0.932069970845481,
203
+ "eval_precision-das": 0.9320029563932003,
204
+ "eval_precision-l1": 0.9178152118427769,
205
+ "eval_precision-l1l2": 0.9313020983041104,
206
+ "eval_precision-l2": 0.9510537049626104,
207
+ "eval_recall": 0.9388951521984217,
208
+ "eval_recall-all": 0.9383621954798943,
209
+ "eval_recall-das": 0.9396423248882265,
210
+ "eval_recall-l1": 0.9438320209973753,
211
+ "eval_recall-l1l2": 0.9377713458755427,
212
+ "eval_recall-l2": 0.9314247669773635,
213
+ "eval_runtime": 6.2574,
214
+ "eval_samples_per_second": 108.032,
215
+ "eval_steps_per_second": 6.872,
216
+ "step": 200
217
+ },
218
+ {
219
+ "epoch": 0.79,
220
+ "eval_ACT": {
221
+ "f1": 0.9258555133079848,
222
+ "number": 519,
223
+ "precision": 0.9136960600375235,
224
+ "recall": 0.9383429672447013
225
+ },
226
+ "eval_ACT_L1": {
227
+ "f1": 0.9401544401544402,
228
+ "number": 503,
229
+ "precision": 0.9136960600375235,
230
+ "recall": 0.9681908548707754
231
+ },
232
+ "eval_ACT_L2": {
233
+ "f1": 0.0,
234
+ "number": 16,
235
+ "precision": 0.0,
236
+ "recall": 0.0
237
+ },
238
+ "eval_CARDINAL": {
239
+ "f1": 0.9919058130978661,
240
+ "number": 678,
241
+ "precision": 0.9897209985315712,
242
+ "recall": 0.9941002949852508
243
+ },
244
+ "eval_DESC": {
245
+ "f1": 0.0,
246
+ "number": 30,
247
+ "precision": 0.0,
248
+ "recall": 0.0
249
+ },
250
+ "eval_FT": {
251
+ "f1": 0.0,
252
+ "number": 7,
253
+ "precision": 0.0,
254
+ "recall": 0.0
255
+ },
256
+ "eval_LOC": {
257
+ "f1": 0.9362244897959184,
258
+ "number": 762,
259
+ "precision": 0.9106699751861043,
260
+ "recall": 0.963254593175853
261
+ },
262
+ "eval_PER": {
263
+ "f1": 0.9646539027982327,
264
+ "number": 676,
265
+ "precision": 0.9604105571847508,
266
+ "recall": 0.9689349112426036
267
+ },
268
+ "eval_SPAT": {
269
+ "f1": 0.9371024734982332,
270
+ "number": 694,
271
+ "precision": 0.9195561719833565,
272
+ "recall": 0.9553314121037464
273
+ },
274
+ "eval_TITRE": {
275
+ "f1": 0.0,
276
+ "number": 2,
277
+ "precision": 0.0,
278
+ "recall": 0.0
279
+ },
280
+ "eval_TITREH": {
281
+ "f1": 0.5142857142857143,
282
+ "number": 33,
283
+ "precision": 0.4864864864864865,
284
+ "recall": 0.5454545454545454
285
+ },
286
+ "eval_TITREP": {
287
+ "f1": 0.0,
288
+ "number": 6,
289
+ "precision": 0.0,
290
+ "recall": 0.0
291
+ },
292
+ "eval_accuracy": 0.9464995034756704,
293
+ "eval_accuracy-all": 0.9610228401191658,
294
+ "eval_accuracy-das": 0.9671052631578947,
295
+ "eval_accuracy-l1": 0.9535749751737835,
296
+ "eval_accuracy-l1l2": 0.9472442899702085,
297
+ "eval_accuracy-l2": 0.9684707050645481,
298
+ "eval_f1": 0.9517287831162999,
299
+ "eval_f1-all": 0.9391076878360703,
300
+ "eval_f1-das": 0.9543353669809577,
301
+ "eval_f1-l1": 0.9364461738002593,
302
+ "eval_f1-l1l2": 0.9466437177280551,
303
+ "eval_f1-l2": 0.9424983476536681,
304
+ "eval_loss": 0.27040067315101624,
305
+ "eval_precision": 0.9476861167002012,
306
+ "eval_precision-all": 0.9300518134715026,
307
+ "eval_precision-das": 0.9471559633027523,
308
+ "eval_precision-l1": 0.9256410256410257,
309
+ "eval_precision-l1l2": 0.9382996872334376,
310
+ "eval_precision-l2": 0.9356955380577427,
311
+ "eval_recall": 0.9558060879368658,
312
+ "eval_recall-all": 0.9483416495450543,
313
+ "eval_recall-das": 0.9616244411326379,
314
+ "eval_recall-l1": 0.94750656167979,
315
+ "eval_recall-l1l2": 0.9551374819102749,
316
+ "eval_recall-l2": 0.9494007989347537,
317
+ "eval_runtime": 6.3964,
318
+ "eval_samples_per_second": 105.684,
319
+ "eval_steps_per_second": 6.723,
320
+ "step": 300
321
+ },
322
+ {
323
+ "epoch": 1.05,
324
+ "eval_ACT": {
325
+ "f1": 0.9171374764595104,
326
+ "number": 519,
327
+ "precision": 0.8968692449355433,
328
+ "recall": 0.9383429672447013
329
+ },
330
+ "eval_ACT_L1": {
331
+ "f1": 0.9311663479923519,
332
+ "number": 503,
333
+ "precision": 0.8968692449355433,
334
+ "recall": 0.9681908548707754
335
+ },
336
+ "eval_ACT_L2": {
337
+ "f1": 0.0,
338
+ "number": 16,
339
+ "precision": 0.0,
340
+ "recall": 0.0
341
+ },
342
+ "eval_CARDINAL": {
343
+ "f1": 0.9926362297496317,
344
+ "number": 678,
345
+ "precision": 0.9911764705882353,
346
+ "recall": 0.9941002949852508
347
+ },
348
+ "eval_DESC": {
349
+ "f1": 0.07894736842105264,
350
+ "number": 30,
351
+ "precision": 0.06521739130434782,
352
+ "recall": 0.1
353
+ },
354
+ "eval_FT": {
355
+ "f1": 0.0,
356
+ "number": 7,
357
+ "precision": 0.0,
358
+ "recall": 0.0
359
+ },
360
+ "eval_LOC": {
361
+ "f1": 0.955671447196871,
362
+ "number": 762,
363
+ "precision": 0.9494818652849741,
364
+ "recall": 0.9619422572178478
365
+ },
366
+ "eval_PER": {
367
+ "f1": 0.9734121122599705,
368
+ "number": 676,
369
+ "precision": 0.971976401179941,
370
+ "recall": 0.9748520710059172
371
+ },
372
+ "eval_SPAT": {
373
+ "f1": 0.9585121602288984,
374
+ "number": 694,
375
+ "precision": 0.9517045454545454,
376
+ "recall": 0.9654178674351584
377
+ },
378
+ "eval_TITRE": {
379
+ "f1": 0.0,
380
+ "number": 2,
381
+ "precision": 0.0,
382
+ "recall": 0.0
383
+ },
384
+ "eval_TITREH": {
385
+ "f1": 0.47368421052631576,
386
+ "number": 33,
387
+ "precision": 0.4186046511627907,
388
+ "recall": 0.5454545454545454
389
+ },
390
+ "eval_TITREP": {
391
+ "f1": 0.0,
392
+ "number": 6,
393
+ "precision": 0.0,
394
+ "recall": 0.0
395
+ },
396
+ "eval_accuracy": 0.9510923535253227,
397
+ "eval_accuracy-all": 0.9681603773584906,
398
+ "eval_accuracy-das": 0.9700844091360477,
399
+ "eval_accuracy-l1": 0.9595332671300894,
400
+ "eval_accuracy-l1l2": 0.9517130089374379,
401
+ "eval_accuracy-l2": 0.9767874875868917,
402
+ "eval_f1": 0.9562669071235347,
403
+ "eval_f1-all": 0.9439837043503564,
404
+ "eval_f1-das": 0.9601335063971815,
405
+ "eval_f1-l1": 0.9385964912280701,
406
+ "eval_f1-l1l2": 0.9483796960137655,
407
+ "eval_f1-l2": 0.950950950950951,
408
+ "eval_loss": 0.22973346710205078,
409
+ "eval_precision": 0.9560513860716701,
410
+ "eval_precision-all": 0.9359492210040392,
411
+ "eval_precision-das": 0.955703211517165,
412
+ "eval_precision-l1": 0.9228817858954845,
413
+ "eval_precision-l1l2": 0.9397556123898835,
414
+ "eval_precision-l2": 0.9531772575250836,
415
+ "eval_recall": 0.9564825253664037,
416
+ "eval_recall-all": 0.9521573231582037,
417
+ "eval_recall-das": 0.9646050670640834,
418
+ "eval_recall-l1": 0.9548556430446195,
419
+ "eval_recall-l1l2": 0.9571635311143271,
420
+ "eval_recall-l2": 0.9487350199733688,
421
+ "eval_runtime": 6.2877,
422
+ "eval_samples_per_second": 107.512,
423
+ "eval_steps_per_second": 6.839,
424
+ "step": 400
425
+ },
426
+ {
427
+ "epoch": 1.31,
428
+ "learning_rate": 9e-05,
429
+ "loss": 0.5207,
430
+ "step": 500
431
+ },
432
+ {
433
+ "epoch": 1.31,
434
+ "eval_ACT": {
435
+ "f1": 0.9319271332694151,
436
+ "number": 519,
437
+ "precision": 0.9274809160305344,
438
+ "recall": 0.9364161849710982
439
+ },
440
+ "eval_ACT_L1": {
441
+ "f1": 0.946445959104187,
442
+ "number": 503,
443
+ "precision": 0.9274809160305344,
444
+ "recall": 0.9662027833001988
445
+ },
446
+ "eval_ACT_L2": {
447
+ "f1": 0.0,
448
+ "number": 16,
449
+ "precision": 0.0,
450
+ "recall": 0.0
451
+ },
452
+ "eval_CARDINAL": {
453
+ "f1": 0.9918938835666913,
454
+ "number": 678,
455
+ "precision": 0.9911634756995582,
456
+ "recall": 0.9926253687315634
457
+ },
458
+ "eval_DESC": {
459
+ "f1": 0.0,
460
+ "number": 30,
461
+ "precision": 0.0,
462
+ "recall": 0.0
463
+ },
464
+ "eval_FT": {
465
+ "f1": 0.0,
466
+ "number": 7,
467
+ "precision": 0.0,
468
+ "recall": 0.0
469
+ },
470
+ "eval_LOC": {
471
+ "f1": 0.9528118939883646,
472
+ "number": 762,
473
+ "precision": 0.9388535031847134,
474
+ "recall": 0.9671916010498688
475
+ },
476
+ "eval_PER": {
477
+ "f1": 0.9712601326455416,
478
+ "number": 676,
479
+ "precision": 0.9676945668135095,
480
+ "recall": 0.9748520710059172
481
+ },
482
+ "eval_SPAT": {
483
+ "f1": 0.9601706970128022,
484
+ "number": 694,
485
+ "precision": 0.9480337078651685,
486
+ "recall": 0.9726224783861671
487
+ },
488
+ "eval_TITRE": {
489
+ "f1": 0.0,
490
+ "number": 2,
491
+ "precision": 0.0,
492
+ "recall": 0.0
493
+ },
494
+ "eval_TITREH": {
495
+ "f1": 0.4186046511627907,
496
+ "number": 33,
497
+ "precision": 0.33962264150943394,
498
+ "recall": 0.5454545454545454
499
+ },
500
+ "eval_TITREP": {
501
+ "f1": 0.0,
502
+ "number": 6,
503
+ "precision": 0.0,
504
+ "recall": 0.0
505
+ },
506
+ "eval_accuracy": 0.9503475670307845,
507
+ "eval_accuracy-all": 0.964622641509434,
508
+ "eval_accuracy-das": 0.9658639523336644,
509
+ "eval_accuracy-l1": 0.9575471698113207,
510
+ "eval_accuracy-l1l2": 0.9507199602780536,
511
+ "eval_accuracy-l2": 0.9716981132075472,
512
+ "eval_f1": 0.9562860047441545,
513
+ "eval_f1-all": 0.9488752556237219,
514
+ "eval_f1-das": 0.9608752086037455,
515
+ "eval_f1-l1": 0.9511366605696369,
516
+ "eval_f1-l1l2": 0.9518315546582059,
517
+ "eval_f1-l2": 0.9460086121232195,
518
+ "eval_loss": 0.23373912274837494,
519
+ "eval_precision": 0.9581258488003621,
520
+ "eval_precision-all": 0.9444605990113405,
521
+ "eval_precision-das": 0.9564414913252123,
522
+ "eval_precision-l1": 0.9469302809573361,
523
+ "eval_precision-l1l2": 0.9485484334578902,
524
+ "eval_precision-l2": 0.9413315754779169,
525
+ "eval_recall": 0.9544532130777903,
526
+ "eval_recall-all": 0.9533313765776343,
527
+ "eval_recall-das": 0.9653502235469449,
528
+ "eval_recall-l1": 0.9553805774278216,
529
+ "eval_recall-l1l2": 0.9551374819102749,
530
+ "eval_recall-l2": 0.9507323568575233,
531
+ "eval_runtime": 6.7397,
532
+ "eval_samples_per_second": 100.3,
533
+ "eval_steps_per_second": 6.38,
534
+ "step": 500
535
+ },
536
+ {
537
+ "epoch": 1.57,
538
+ "eval_ACT": {
539
+ "f1": 0.9277566539923954,
540
+ "number": 519,
541
+ "precision": 0.9155722326454033,
542
+ "recall": 0.9402697495183044
543
+ },
544
+ "eval_ACT_L1": {
545
+ "f1": 0.942084942084942,
546
+ "number": 503,
547
+ "precision": 0.9155722326454033,
548
+ "recall": 0.9701789264413518
549
+ },
550
+ "eval_ACT_L2": {
551
+ "f1": 0.0,
552
+ "number": 16,
553
+ "precision": 0.0,
554
+ "recall": 0.0
555
+ },
556
+ "eval_CARDINAL": {
557
+ "f1": 0.9926253687315634,
558
+ "number": 678,
559
+ "precision": 0.9926253687315634,
560
+ "recall": 0.9926253687315634
561
+ },
562
+ "eval_DESC": {
563
+ "f1": 0.28070175438596495,
564
+ "number": 30,
565
+ "precision": 0.2962962962962963,
566
+ "recall": 0.26666666666666666
567
+ },
568
+ "eval_FT": {
569
+ "f1": 0.0,
570
+ "number": 7,
571
+ "precision": 0.0,
572
+ "recall": 0.0
573
+ },
574
+ "eval_LOC": {
575
+ "f1": 0.9475753604193973,
576
+ "number": 762,
577
+ "precision": 0.9463350785340314,
578
+ "recall": 0.9488188976377953
579
+ },
580
+ "eval_PER": {
581
+ "f1": 0.981549815498155,
582
+ "number": 676,
583
+ "precision": 0.979381443298969,
584
+ "recall": 0.9837278106508875
585
+ },
586
+ "eval_SPAT": {
587
+ "f1": 0.9598278335724534,
588
+ "number": 694,
589
+ "precision": 0.9557142857142857,
590
+ "recall": 0.9639769452449568
591
+ },
592
+ "eval_TITRE": {
593
+ "f1": 0.0,
594
+ "number": 2,
595
+ "precision": 0.0,
596
+ "recall": 0.0
597
+ },
598
+ "eval_TITREH": {
599
+ "f1": 0.6153846153846153,
600
+ "number": 33,
601
+ "precision": 0.5333333333333333,
602
+ "recall": 0.7272727272727273
603
+ },
604
+ "eval_TITREP": {
605
+ "f1": 0.0,
606
+ "number": 6,
607
+ "precision": 0.0,
608
+ "recall": 0.0
609
+ },
610
+ "eval_accuracy": 0.9574230387288977,
611
+ "eval_accuracy-all": 0.9694637537239325,
612
+ "eval_accuracy-das": 0.9736842105263158,
613
+ "eval_accuracy-l1": 0.9637537239324727,
614
+ "eval_accuracy-l1l2": 0.9577954319761668,
615
+ "eval_accuracy-l2": 0.9751737835153923,
616
+ "eval_f1": 0.9586253673976939,
617
+ "eval_f1-all": 0.9512659154105078,
618
+ "eval_f1-das": 0.9626185605356147,
619
+ "eval_f1-l1": 0.9521331945889697,
620
+ "eval_f1-l1l2": 0.9551764025448236,
621
+ "eval_f1-l2": 0.9501505520240883,
622
+ "eval_loss": 0.18777723610401154,
623
+ "eval_precision": 0.9612332804352755,
624
+ "eval_precision-all": 0.9486281377699942,
625
+ "eval_precision-das": 0.961010025993316,
626
+ "eval_precision-l1": 0.9437854564208354,
627
+ "eval_precision-l1l2": 0.9543484542039873,
628
+ "eval_precision-l2": 0.9549428379287155,
629
+ "eval_recall": 0.9560315670800451,
630
+ "eval_recall-all": 0.9539184032873496,
631
+ "eval_recall-das": 0.9642324888226528,
632
+ "eval_recall-l1": 0.9606299212598425,
633
+ "eval_recall-l1l2": 0.9560057887120116,
634
+ "eval_recall-l2": 0.9454061251664447,
635
+ "eval_runtime": 6.8662,
636
+ "eval_samples_per_second": 98.453,
637
+ "eval_steps_per_second": 6.263,
638
+ "step": 600
639
+ },
640
+ {
641
+ "epoch": 1.84,
642
+ "eval_ACT": {
643
+ "f1": 0.92090395480226,
644
+ "number": 519,
645
+ "precision": 0.9005524861878453,
646
+ "recall": 0.9421965317919075
647
+ },
648
+ "eval_ACT_L1": {
649
+ "f1": 0.9358851674641149,
650
+ "number": 503,
651
+ "precision": 0.9022140221402214,
652
+ "recall": 0.9721669980119284
653
+ },
654
+ "eval_ACT_L2": {
655
+ "f1": 0.0,
656
+ "number": 16,
657
+ "precision": 0.0,
658
+ "recall": 0.0
659
+ },
660
+ "eval_CARDINAL": {
661
+ "f1": 0.9926362297496317,
662
+ "number": 678,
663
+ "precision": 0.9911764705882353,
664
+ "recall": 0.9941002949852508
665
+ },
666
+ "eval_DESC": {
667
+ "f1": 0.32786885245901637,
668
+ "number": 30,
669
+ "precision": 0.3225806451612903,
670
+ "recall": 0.3333333333333333
671
+ },
672
+ "eval_FT": {
673
+ "f1": 0.0,
674
+ "number": 7,
675
+ "precision": 0.0,
676
+ "recall": 0.0
677
+ },
678
+ "eval_LOC": {
679
+ "f1": 0.9195849546044099,
680
+ "number": 762,
681
+ "precision": 0.908974358974359,
682
+ "recall": 0.9304461942257218
683
+ },
684
+ "eval_PER": {
685
+ "f1": 0.9859778597785979,
686
+ "number": 676,
687
+ "precision": 0.9837997054491899,
688
+ "recall": 0.9881656804733728
689
+ },
690
+ "eval_SPAT": {
691
+ "f1": 0.9300998573466476,
692
+ "number": 694,
693
+ "precision": 0.9209039548022598,
694
+ "recall": 0.9394812680115274
695
+ },
696
+ "eval_TITRE": {
697
+ "f1": 0.0,
698
+ "number": 2,
699
+ "precision": 0.0,
700
+ "recall": 0.0
701
+ },
702
+ "eval_TITREH": {
703
+ "f1": 0.7733333333333333,
704
+ "number": 33,
705
+ "precision": 0.6904761904761905,
706
+ "recall": 0.8787878787878788
707
+ },
708
+ "eval_TITREP": {
709
+ "f1": 0.0,
710
+ "number": 6,
711
+ "precision": 0.0,
712
+ "recall": 0.0
713
+ },
714
+ "eval_accuracy": 0.9540714995034757,
715
+ "eval_accuracy-all": 0.9665466732869911,
716
+ "eval_accuracy-das": 0.9702085402184707,
717
+ "eval_accuracy-l1": 0.961519364448858,
718
+ "eval_accuracy-l1l2": 0.9543197616683218,
719
+ "eval_accuracy-l2": 0.9715739821251241,
720
+ "eval_f1": 0.9554011653966832,
721
+ "eval_f1-all": 0.9406113537117904,
722
+ "eval_f1-das": 0.9578927842700797,
723
+ "eval_f1-l1": 0.9412677878395861,
724
+ "eval_f1-l1l2": 0.9506031016657095,
725
+ "eval_f1-l2": 0.9397670549084858,
726
+ "eval_loss": 0.18267092108726501,
727
+ "eval_precision": 0.9496547115170416,
728
+ "eval_precision-all": 0.9330060641062663,
729
+ "eval_precision-das": 0.95382342076099,
730
+ "eval_precision-l1": 0.9280612244897959,
731
+ "eval_precision-l1l2": 0.9432886862353947,
732
+ "eval_precision-l2": 0.9394544244843646,
733
+ "eval_recall": 0.961217587373168,
734
+ "eval_recall-all": 0.9483416495450543,
735
+ "eval_recall-das": 0.9619970193740686,
736
+ "eval_recall-l1": 0.9548556430446195,
737
+ "eval_recall-l1l2": 0.9580318379160637,
738
+ "eval_recall-l2": 0.9400798934753661,
739
+ "eval_runtime": 6.2904,
740
+ "eval_samples_per_second": 107.465,
741
+ "eval_steps_per_second": 6.836,
742
+ "step": 700
743
+ },
744
+ {
745
+ "epoch": 2.1,
746
+ "eval_ACT": {
747
+ "f1": 0.9372623574144486,
748
+ "number": 519,
749
+ "precision": 0.924953095684803,
750
+ "recall": 0.9499036608863198
751
+ },
752
+ "eval_ACT_L1": {
753
+ "f1": 0.9683168316831683,
754
+ "number": 503,
755
+ "precision": 0.9644970414201184,
756
+ "recall": 0.9721669980119284
757
+ },
758
+ "eval_ACT_L2": {
759
+ "f1": 0.1904761904761905,
760
+ "number": 16,
761
+ "precision": 0.15384615384615385,
762
+ "recall": 0.25
763
+ },
764
+ "eval_CARDINAL": {
765
+ "f1": 0.9941089837997055,
766
+ "number": 678,
767
+ "precision": 0.9926470588235294,
768
+ "recall": 0.995575221238938
769
+ },
770
+ "eval_DESC": {
771
+ "f1": 0.30379746835443044,
772
+ "number": 30,
773
+ "precision": 0.24489795918367346,
774
+ "recall": 0.4
775
+ },
776
+ "eval_FT": {
777
+ "f1": 0.0,
778
+ "number": 7,
779
+ "precision": 0.0,
780
+ "recall": 0.0
781
+ },
782
+ "eval_LOC": {
783
+ "f1": 0.9516971279373369,
784
+ "number": 762,
785
+ "precision": 0.9467532467532468,
786
+ "recall": 0.9566929133858267
787
+ },
788
+ "eval_PER": {
789
+ "f1": 0.9764011799410028,
790
+ "number": 676,
791
+ "precision": 0.9735294117647059,
792
+ "recall": 0.9792899408284024
793
+ },
794
+ "eval_SPAT": {
795
+ "f1": 0.9690869877785765,
796
+ "number": 694,
797
+ "precision": 0.9670014347202296,
798
+ "recall": 0.9711815561959655
799
+ },
800
+ "eval_TITRE": {
801
+ "f1": 0.0,
802
+ "number": 2,
803
+ "precision": 0.0,
804
+ "recall": 0.0
805
+ },
806
+ "eval_TITREH": {
807
+ "f1": 0.7894736842105263,
808
+ "number": 33,
809
+ "precision": 0.6976744186046512,
810
+ "recall": 0.9090909090909091
811
+ },
812
+ "eval_TITREP": {
813
+ "f1": 0.16666666666666666,
814
+ "number": 6,
815
+ "precision": 0.16666666666666666,
816
+ "recall": 0.16666666666666666
817
+ },
818
+ "eval_accuracy": 0.9464995034756704,
819
+ "eval_accuracy-all": 0.9582298907646475,
820
+ "eval_accuracy-das": 0.9748013902681232,
821
+ "eval_accuracy-l1": 0.95506454816286,
822
+ "eval_accuracy-l1l2": 0.9472442899702085,
823
+ "eval_accuracy-l2": 0.961395233366435,
824
+ "eval_f1": 0.958225425064745,
825
+ "eval_f1-all": 0.9544064093226512,
826
+ "eval_f1-das": 0.966747167007245,
827
+ "eval_f1-l1": 0.9572694111516414,
828
+ "eval_f1-l1l2": 0.9569598387793291,
829
+ "eval_f1-l2": 0.9507763462173769,
830
+ "eval_loss": 0.17230063676834106,
831
+ "eval_precision": 0.9570400359874044,
832
+ "eval_precision-all": 0.9473684210526315,
833
+ "eval_precision-das": 0.9640607632456465,
834
+ "eval_precision-l1": 0.950336264873254,
835
+ "eval_precision-l1l2": 0.9518900343642611,
836
+ "eval_precision-l2": 0.9436065573770491,
837
+ "eval_recall": 0.9594137542277339,
838
+ "eval_recall-all": 0.9615497505136483,
839
+ "eval_recall-das": 0.9694485842026825,
840
+ "eval_recall-l1": 0.9643044619422572,
841
+ "eval_recall-l1l2": 0.9620839363241679,
842
+ "eval_recall-l2": 0.9580559254327563,
843
+ "eval_runtime": 6.5238,
844
+ "eval_samples_per_second": 103.62,
845
+ "eval_steps_per_second": 6.591,
846
+ "step": 800
847
+ },
848
+ {
849
+ "epoch": 2.36,
850
+ "eval_ACT": {
851
+ "f1": 0.935361216730038,
852
+ "number": 519,
853
+ "precision": 0.9230769230769231,
854
+ "recall": 0.9479768786127167
855
+ },
856
+ "eval_ACT_L1": {
857
+ "f1": 0.9521951219512196,
858
+ "number": 503,
859
+ "precision": 0.9348659003831418,
860
+ "recall": 0.9701789264413518
861
+ },
862
+ "eval_ACT_L2": {
863
+ "f1": 0.2962962962962963,
864
+ "number": 16,
865
+ "precision": 0.36363636363636365,
866
+ "recall": 0.25
867
+ },
868
+ "eval_CARDINAL": {
869
+ "f1": 0.9926253687315634,
870
+ "number": 678,
871
+ "precision": 0.9926253687315634,
872
+ "recall": 0.9926253687315634
873
+ },
874
+ "eval_DESC": {
875
+ "f1": 0.4615384615384615,
876
+ "number": 30,
877
+ "precision": 0.42857142857142855,
878
+ "recall": 0.5
879
+ },
880
+ "eval_FT": {
881
+ "f1": 0.0,
882
+ "number": 7,
883
+ "precision": 0.0,
884
+ "recall": 0.0
885
+ },
886
+ "eval_LOC": {
887
+ "f1": 0.9436163318211277,
888
+ "number": 762,
889
+ "precision": 0.9321382842509603,
890
+ "recall": 0.9553805774278216
891
+ },
892
+ "eval_PER": {
893
+ "f1": 0.9881831610044313,
894
+ "number": 676,
895
+ "precision": 0.9867256637168141,
896
+ "recall": 0.9896449704142012
897
+ },
898
+ "eval_SPAT": {
899
+ "f1": 0.9562096195262024,
900
+ "number": 694,
901
+ "precision": 0.9527896995708155,
902
+ "recall": 0.9596541786743515
903
+ },
904
+ "eval_TITRE": {
905
+ "f1": 0.0,
906
+ "number": 2,
907
+ "precision": 0.0,
908
+ "recall": 0.0
909
+ },
910
+ "eval_TITREH": {
911
+ "f1": 0.9142857142857143,
912
+ "number": 33,
913
+ "precision": 0.8648648648648649,
914
+ "recall": 0.9696969696969697
915
+ },
916
+ "eval_TITREP": {
917
+ "f1": 0.0,
918
+ "number": 6,
919
+ "precision": 0.0,
920
+ "recall": 0.0
921
+ },
922
+ "eval_accuracy": 0.9574230387288977,
923
+ "eval_accuracy-all": 0.968098311817279,
924
+ "eval_accuracy-das": 0.9729394240317776,
925
+ "eval_accuracy-l1": 0.9642502482621649,
926
+ "eval_accuracy-l1l2": 0.9579195630585898,
927
+ "eval_accuracy-l2": 0.9719463753723933,
928
+ "eval_f1": 0.96378767431399,
929
+ "eval_f1-all": 0.9563439918236238,
930
+ "eval_f1-das": 0.9658246656760773,
931
+ "eval_f1-l1": 0.9575410263089347,
932
+ "eval_f1-l1l2": 0.9604145674391824,
933
+ "eval_f1-l2": 0.9548172757475082,
934
+ "eval_loss": 0.1622493714094162,
935
+ "eval_precision": 0.9614090195198564,
936
+ "eval_precision-all": 0.9514816966879721,
937
+ "eval_precision-das": 0.9629629629629629,
938
+ "eval_precision-l1": 0.9503619441571872,
939
+ "eval_precision-l1l2": 0.9553264604810997,
940
+ "eval_precision-l2": 0.9529177718832891,
941
+ "eval_recall": 0.9661781285231116,
942
+ "eval_recall-all": 0.9612562371587907,
943
+ "eval_recall-das": 0.9687034277198212,
944
+ "eval_recall-l1": 0.9648293963254593,
945
+ "eval_recall-l1l2": 0.9655571635311143,
946
+ "eval_recall-l2": 0.9567243675099867,
947
+ "eval_runtime": 6.4324,
948
+ "eval_samples_per_second": 105.093,
949
+ "eval_steps_per_second": 6.685,
950
+ "step": 900
951
+ },
952
+ {
953
+ "epoch": 2.62,
954
+ "learning_rate": 8e-05,
955
+ "loss": 0.1717,
956
+ "step": 1000
957
+ },
958
+ {
959
+ "epoch": 2.62,
960
+ "eval_ACT": {
961
+ "f1": 0.9169811320754717,
962
+ "number": 519,
963
+ "precision": 0.8983364140480592,
964
+ "recall": 0.9364161849710982
965
+ },
966
+ "eval_ACT_L1": {
967
+ "f1": 0.9388560157790926,
968
+ "number": 503,
969
+ "precision": 0.9315068493150684,
970
+ "recall": 0.9463220675944334
971
+ },
972
+ "eval_ACT_L2": {
973
+ "f1": 0.43478260869565216,
974
+ "number": 16,
975
+ "precision": 0.3333333333333333,
976
+ "recall": 0.625
977
+ },
978
+ "eval_CARDINAL": {
979
+ "f1": 0.9933677229182019,
980
+ "number": 678,
981
+ "precision": 0.9926362297496318,
982
+ "recall": 0.9941002949852508
983
+ },
984
+ "eval_DESC": {
985
+ "f1": 0.4470588235294118,
986
+ "number": 30,
987
+ "precision": 0.34545454545454546,
988
+ "recall": 0.6333333333333333
989
+ },
990
+ "eval_FT": {
991
+ "f1": 0.0,
992
+ "number": 7,
993
+ "precision": 0.0,
994
+ "recall": 0.0
995
+ },
996
+ "eval_LOC": {
997
+ "f1": 0.9557291666666666,
998
+ "number": 762,
999
+ "precision": 0.9483204134366925,
1000
+ "recall": 0.963254593175853
1001
+ },
1002
+ "eval_PER": {
1003
+ "f1": 0.9793510324483775,
1004
+ "number": 676,
1005
+ "precision": 0.9764705882352941,
1006
+ "recall": 0.9822485207100592
1007
+ },
1008
+ "eval_SPAT": {
1009
+ "f1": 0.9648745519713262,
1010
+ "number": 694,
1011
+ "precision": 0.9600570613409415,
1012
+ "recall": 0.9697406340057637
1013
+ },
1014
+ "eval_TITRE": {
1015
+ "f1": 0.0,
1016
+ "number": 2,
1017
+ "precision": 0.0,
1018
+ "recall": 0.0
1019
+ },
1020
+ "eval_TITREH": {
1021
+ "f1": 0.8421052631578948,
1022
+ "number": 33,
1023
+ "precision": 0.7441860465116279,
1024
+ "recall": 0.9696969696969697
1025
+ },
1026
+ "eval_TITREP": {
1027
+ "f1": 0.4,
1028
+ "number": 6,
1029
+ "precision": 0.5,
1030
+ "recall": 0.3333333333333333
1031
+ },
1032
+ "eval_accuracy": 0.9484856007944389,
1033
+ "eval_accuracy-all": 0.9622020854021847,
1034
+ "eval_accuracy-das": 0.971077457795432,
1035
+ "eval_accuracy-l1": 0.9541956305858987,
1036
+ "eval_accuracy-l1l2": 0.948857994041708,
1037
+ "eval_accuracy-l2": 0.9702085402184707,
1038
+ "eval_f1": 0.9612490171852185,
1039
+ "eval_f1-all": 0.9540964555490993,
1040
+ "eval_f1-das": 0.9636498516320475,
1041
+ "eval_f1-l1": 0.9511941848390446,
1042
+ "eval_f1-l1l2": 0.9569707401032701,
1043
+ "eval_f1-l2": 0.9577836411609498,
1044
+ "eval_loss": 0.16451582312583923,
1045
+ "eval_precision": 0.9576991942703671,
1046
+ "eval_precision-all": 0.9444923784872016,
1047
+ "eval_precision-das": 0.9593796159527327,
1048
+ "eval_precision-l1": 0.940934771443246,
1049
+ "eval_precision-l1l2": 0.9485356838214387,
1050
+ "eval_precision-l2": 0.9490196078431372,
1051
+ "eval_recall": 0.964825253664036,
1052
+ "eval_recall-all": 0.9638978573525095,
1053
+ "eval_recall-das": 0.9679582712369598,
1054
+ "eval_recall-l1": 0.9616797900262467,
1055
+ "eval_recall-l1l2": 0.9655571635311143,
1056
+ "eval_recall-l2": 0.966711051930759,
1057
+ "eval_runtime": 6.4739,
1058
+ "eval_samples_per_second": 104.42,
1059
+ "eval_steps_per_second": 6.642,
1060
+ "step": 1000
1061
+ },
1062
+ {
1063
+ "epoch": 2.89,
1064
+ "eval_ACT": {
1065
+ "f1": 0.9351145038167938,
1066
+ "number": 519,
1067
+ "precision": 0.9262759924385633,
1068
+ "recall": 0.9441233140655106
1069
+ },
1070
+ "eval_ACT_L1": {
1071
+ "f1": 0.9614243323442137,
1072
+ "number": 503,
1073
+ "precision": 0.9566929133858267,
1074
+ "recall": 0.9662027833001988
1075
+ },
1076
+ "eval_ACT_L2": {
1077
+ "f1": 0.2162162162162162,
1078
+ "number": 16,
1079
+ "precision": 0.19047619047619047,
1080
+ "recall": 0.25
1081
+ },
1082
+ "eval_CARDINAL": {
1083
+ "f1": 0.9926144756277695,
1084
+ "number": 678,
1085
+ "precision": 0.9940828402366864,
1086
+ "recall": 0.9911504424778761
1087
+ },
1088
+ "eval_DESC": {
1089
+ "f1": 0.4571428571428572,
1090
+ "number": 30,
1091
+ "precision": 0.4,
1092
+ "recall": 0.5333333333333333
1093
+ },
1094
+ "eval_FT": {
1095
+ "f1": 0.22222222222222224,
1096
+ "number": 7,
1097
+ "precision": 0.5,
1098
+ "recall": 0.14285714285714285
1099
+ },
1100
+ "eval_LOC": {
1101
+ "f1": 0.9628180039138944,
1102
+ "number": 762,
1103
+ "precision": 0.9571984435797666,
1104
+ "recall": 0.968503937007874
1105
+ },
1106
+ "eval_PER": {
1107
+ "f1": 0.9882005899705014,
1108
+ "number": 676,
1109
+ "precision": 0.9852941176470589,
1110
+ "recall": 0.9911242603550295
1111
+ },
1112
+ "eval_SPAT": {
1113
+ "f1": 0.9646719538572459,
1114
+ "number": 694,
1115
+ "precision": 0.9653679653679653,
1116
+ "recall": 0.9639769452449568
1117
+ },
1118
+ "eval_TITRE": {
1119
+ "f1": 0.0,
1120
+ "number": 2,
1121
+ "precision": 0.0,
1122
+ "recall": 0.0
1123
+ },
1124
+ "eval_TITREH": {
1125
+ "f1": 0.9014084507042254,
1126
+ "number": 33,
1127
+ "precision": 0.8421052631578947,
1128
+ "recall": 0.9696969696969697
1129
+ },
1130
+ "eval_TITREP": {
1131
+ "f1": 0.3333333333333333,
1132
+ "number": 6,
1133
+ "precision": 0.3333333333333333,
1134
+ "recall": 0.3333333333333333
1135
+ },
1136
+ "eval_accuracy": 0.9565541211519365,
1137
+ "eval_accuracy-all": 0.9669190665342602,
1138
+ "eval_accuracy-das": 0.9790218470705064,
1139
+ "eval_accuracy-l1": 0.9622641509433962,
1140
+ "eval_accuracy-l1l2": 0.9572989076464746,
1141
+ "eval_accuracy-l2": 0.9715739821251241,
1142
+ "eval_f1": 0.9650979509119567,
1143
+ "eval_f1-all": 0.9617071031862029,
1144
+ "eval_f1-das": 0.9724804760133879,
1145
+ "eval_f1-l1": 0.9623627809722948,
1146
+ "eval_f1-l1l2": 0.9654078985298358,
1147
+ "eval_f1-l2": 0.9608753315649867,
1148
+ "eval_loss": 0.1514899879693985,
1149
+ "eval_precision": 0.9637958174049921,
1150
+ "eval_precision-all": 0.9577874818049491,
1151
+ "eval_precision-das": 0.9706755753526355,
1152
+ "eval_precision-l1": 0.9583550234252993,
1153
+ "eval_precision-l1l2": 0.96152741889176,
1154
+ "eval_precision-l2": 0.9570673712021136,
1155
+ "eval_recall": 0.9664036076662909,
1156
+ "eval_recall-all": 0.9656589374816554,
1157
+ "eval_recall-das": 0.9742921013412816,
1158
+ "eval_recall-l1": 0.9664041994750656,
1159
+ "eval_recall-l1l2": 0.9693198263386397,
1160
+ "eval_recall-l2": 0.9647137150466045,
1161
+ "eval_runtime": 6.4358,
1162
+ "eval_samples_per_second": 105.038,
1163
+ "eval_steps_per_second": 6.681,
1164
+ "step": 1100
1165
+ },
1166
+ {
1167
+ "epoch": 3.15,
1168
+ "eval_ACT": {
1169
+ "f1": 0.9293119698397738,
1170
+ "number": 519,
1171
+ "precision": 0.9095940959409594,
1172
+ "recall": 0.9499036608863198
1173
+ },
1174
+ "eval_ACT_L1": {
1175
+ "f1": 0.9532163742690059,
1176
+ "number": 503,
1177
+ "precision": 0.9349904397705545,
1178
+ "recall": 0.9721669980119284
1179
+ },
1180
+ "eval_ACT_L2": {
1181
+ "f1": 0.22857142857142856,
1182
+ "number": 16,
1183
+ "precision": 0.21052631578947367,
1184
+ "recall": 0.25
1185
+ },
1186
+ "eval_CARDINAL": {
1187
+ "f1": 0.9941089837997055,
1188
+ "number": 678,
1189
+ "precision": 0.9926470588235294,
1190
+ "recall": 0.995575221238938
1191
+ },
1192
+ "eval_DESC": {
1193
+ "f1": 0.3783783783783784,
1194
+ "number": 30,
1195
+ "precision": 0.3181818181818182,
1196
+ "recall": 0.4666666666666667
1197
+ },
1198
+ "eval_FT": {
1199
+ "f1": 0.25,
1200
+ "number": 7,
1201
+ "precision": 1.0,
1202
+ "recall": 0.14285714285714285
1203
+ },
1204
+ "eval_LOC": {
1205
+ "f1": 0.9654723127035831,
1206
+ "number": 762,
1207
+ "precision": 0.9586028460543338,
1208
+ "recall": 0.9724409448818898
1209
+ },
1210
+ "eval_PER": {
1211
+ "f1": 0.9852507374631269,
1212
+ "number": 676,
1213
+ "precision": 0.9823529411764705,
1214
+ "recall": 0.9881656804733728
1215
+ },
1216
+ "eval_SPAT": {
1217
+ "f1": 0.9698708751793401,
1218
+ "number": 694,
1219
+ "precision": 0.9657142857142857,
1220
+ "recall": 0.9740634005763689
1221
+ },
1222
+ "eval_TITRE": {
1223
+ "f1": 0.0,
1224
+ "number": 2,
1225
+ "precision": 0.0,
1226
+ "recall": 0.0
1227
+ },
1228
+ "eval_TITREH": {
1229
+ "f1": 0.8888888888888888,
1230
+ "number": 33,
1231
+ "precision": 0.8205128205128205,
1232
+ "recall": 0.9696969696969697
1233
+ },
1234
+ "eval_TITREP": {
1235
+ "f1": 0.4444444444444444,
1236
+ "number": 6,
1237
+ "precision": 0.6666666666666666,
1238
+ "recall": 0.3333333333333333
1239
+ },
1240
+ "eval_accuracy": 0.9594091360476663,
1241
+ "eval_accuracy-all": 0.9701464746772592,
1242
+ "eval_accuracy-das": 0.9760427010923535,
1243
+ "eval_accuracy-l1": 0.964498510427011,
1244
+ "eval_accuracy-l1l2": 0.9599056603773585,
1245
+ "eval_accuracy-l2": 0.9757944389275075,
1246
+ "eval_f1": 0.9689957312963379,
1247
+ "eval_f1-all": 0.9614208764012229,
1248
+ "eval_f1-das": 0.9714073523950985,
1249
+ "eval_f1-l1": 0.9589823468328141,
1250
+ "eval_f1-l1l2": 0.9653387027182512,
1251
+ "eval_f1-l2": 0.9645343056015909,
1252
+ "eval_loss": 0.15517939627170563,
1253
+ "eval_precision": 0.9655249608238191,
1254
+ "eval_precision-all": 0.9537839399191219,
1255
+ "eval_precision-das": 0.9681717246484086,
1256
+ "eval_precision-l1": 0.9486389316897792,
1257
+ "eval_precision-l1l2": 0.9594053744997141,
1258
+ "eval_precision-l2": 0.9603960396039604,
1259
+ "eval_recall": 0.9724915445321308,
1260
+ "eval_recall-all": 0.9691810977399472,
1261
+ "eval_recall-das": 0.9746646795827124,
1262
+ "eval_recall-l1": 0.9695538057742782,
1263
+ "eval_recall-l1l2": 0.9713458755426918,
1264
+ "eval_recall-l2": 0.9687083888149135,
1265
+ "eval_runtime": 6.6788,
1266
+ "eval_samples_per_second": 101.216,
1267
+ "eval_steps_per_second": 6.438,
1268
+ "step": 1200
1269
+ },
1270
+ {
1271
+ "epoch": 3.41,
1272
+ "eval_ACT": {
1273
+ "f1": 0.9432892249527409,
1274
+ "number": 519,
1275
+ "precision": 0.9257884972170687,
1276
+ "recall": 0.9614643545279383
1277
+ },
1278
+ "eval_ACT_L1": {
1279
+ "f1": 0.9649122807017545,
1280
+ "number": 503,
1281
+ "precision": 0.9464627151051626,
1282
+ "recall": 0.9840954274353877
1283
+ },
1284
+ "eval_ACT_L2": {
1285
+ "f1": 0.25,
1286
+ "number": 16,
1287
+ "precision": 0.25,
1288
+ "recall": 0.25
1289
+ },
1290
+ "eval_CARDINAL": {
1291
+ "f1": 0.9933677229182019,
1292
+ "number": 678,
1293
+ "precision": 0.9926362297496318,
1294
+ "recall": 0.9941002949852508
1295
+ },
1296
+ "eval_DESC": {
1297
+ "f1": 0.46875,
1298
+ "number": 30,
1299
+ "precision": 0.4411764705882353,
1300
+ "recall": 0.5
1301
+ },
1302
+ "eval_FT": {
1303
+ "f1": 0.22222222222222224,
1304
+ "number": 7,
1305
+ "precision": 0.5,
1306
+ "recall": 0.14285714285714285
1307
+ },
1308
+ "eval_LOC": {
1309
+ "f1": 0.9628664495114005,
1310
+ "number": 762,
1311
+ "precision": 0.9560155239327296,
1312
+ "recall": 0.9698162729658792
1313
+ },
1314
+ "eval_PER": {
1315
+ "f1": 0.9852507374631269,
1316
+ "number": 676,
1317
+ "precision": 0.9823529411764705,
1318
+ "recall": 0.9881656804733728
1319
+ },
1320
+ "eval_SPAT": {
1321
+ "f1": 0.9713055954088954,
1322
+ "number": 694,
1323
+ "precision": 0.9671428571428572,
1324
+ "recall": 0.9755043227665706
1325
+ },
1326
+ "eval_TITRE": {
1327
+ "f1": 0.0,
1328
+ "number": 2,
1329
+ "precision": 0.0,
1330
+ "recall": 0.0
1331
+ },
1332
+ "eval_TITREH": {
1333
+ "f1": 0.927536231884058,
1334
+ "number": 33,
1335
+ "precision": 0.8888888888888888,
1336
+ "recall": 0.9696969696969697
1337
+ },
1338
+ "eval_TITREP": {
1339
+ "f1": 0.26666666666666666,
1340
+ "number": 6,
1341
+ "precision": 0.2222222222222222,
1342
+ "recall": 0.3333333333333333
1343
+ },
1344
+ "eval_accuracy": 0.9586643495531281,
1345
+ "eval_accuracy-all": 0.969401688182721,
1346
+ "eval_accuracy-das": 0.9760427010923535,
1347
+ "eval_accuracy-l1": 0.9656156901688183,
1348
+ "eval_accuracy-l1l2": 0.9590367428003972,
1349
+ "eval_accuracy-l2": 0.9731876861966237,
1350
+ "eval_f1": 0.9669365721997301,
1351
+ "eval_f1-all": 0.9642805073625893,
1352
+ "eval_f1-das": 0.9712590394956426,
1353
+ "eval_f1-l1": 0.9656428943258718,
1354
+ "eval_f1-l1l2": 0.9661627069834413,
1355
+ "eval_f1-l2": 0.9625455750745775,
1356
+ "eval_loss": 0.15928798913955688,
1357
+ "eval_precision": 0.9645501458380076,
1358
+ "eval_precision-all": 0.9579953650057937,
1359
+ "eval_precision-das": 0.9667774086378738,
1360
+ "eval_precision-l1": 0.9576664945792462,
1361
+ "eval_precision-l1l2": 0.9613180515759312,
1362
+ "eval_precision-l2": 0.9584158415841584,
1363
+ "eval_recall": 0.9693348365276212,
1364
+ "eval_recall-all": 0.9706486645142354,
1365
+ "eval_recall-das": 0.9757824143070045,
1366
+ "eval_recall-l1": 0.973753280839895,
1367
+ "eval_recall-l1l2": 0.9710564399421129,
1368
+ "eval_recall-l2": 0.966711051930759,
1369
+ "eval_runtime": 6.3391,
1370
+ "eval_samples_per_second": 106.64,
1371
+ "eval_steps_per_second": 6.783,
1372
+ "step": 1300
1373
+ },
1374
+ {
1375
+ "epoch": 3.67,
1376
+ "eval_ACT": {
1377
+ "f1": 0.9256820319849483,
1378
+ "number": 519,
1379
+ "precision": 0.9044117647058824,
1380
+ "recall": 0.9479768786127167
1381
+ },
1382
+ "eval_ACT_L1": {
1383
+ "f1": 0.9459459459459459,
1384
+ "number": 503,
1385
+ "precision": 0.9193245778611632,
1386
+ "recall": 0.974155069582505
1387
+ },
1388
+ "eval_ACT_L2": {
1389
+ "f1": 0.14814814814814814,
1390
+ "number": 16,
1391
+ "precision": 0.18181818181818182,
1392
+ "recall": 0.125
1393
+ },
1394
+ "eval_CARDINAL": {
1395
+ "f1": 0.9941089837997055,
1396
+ "number": 678,
1397
+ "precision": 0.9926470588235294,
1398
+ "recall": 0.995575221238938
1399
+ },
1400
+ "eval_DESC": {
1401
+ "f1": 0.4482758620689655,
1402
+ "number": 30,
1403
+ "precision": 0.4642857142857143,
1404
+ "recall": 0.43333333333333335
1405
+ },
1406
+ "eval_FT": {
1407
+ "f1": 0.22222222222222224,
1408
+ "number": 7,
1409
+ "precision": 0.5,
1410
+ "recall": 0.14285714285714285
1411
+ },
1412
+ "eval_LOC": {
1413
+ "f1": 0.963777490297542,
1414
+ "number": 762,
1415
+ "precision": 0.9502551020408163,
1416
+ "recall": 0.9776902887139107
1417
+ },
1418
+ "eval_PER": {
1419
+ "f1": 0.9726937269372694,
1420
+ "number": 676,
1421
+ "precision": 0.9705449189985272,
1422
+ "recall": 0.9748520710059172
1423
+ },
1424
+ "eval_SPAT": {
1425
+ "f1": 0.9622238061297219,
1426
+ "number": 694,
1427
+ "precision": 0.9520451339915373,
1428
+ "recall": 0.9726224783861671
1429
+ },
1430
+ "eval_TITRE": {
1431
+ "f1": 0.0,
1432
+ "number": 2,
1433
+ "precision": 0.0,
1434
+ "recall": 0.0
1435
+ },
1436
+ "eval_TITREH": {
1437
+ "f1": 0.8823529411764706,
1438
+ "number": 33,
1439
+ "precision": 0.8571428571428571,
1440
+ "recall": 0.9090909090909091
1441
+ },
1442
+ "eval_TITREP": {
1443
+ "f1": 0.5,
1444
+ "number": 6,
1445
+ "precision": 0.5,
1446
+ "recall": 0.5
1447
+ },
1448
+ "eval_accuracy": 0.9572989076464746,
1449
+ "eval_accuracy-all": 0.9682845084409136,
1450
+ "eval_accuracy-das": 0.9735600794438928,
1451
+ "eval_accuracy-l1": 0.9623882820258193,
1452
+ "eval_accuracy-l1l2": 0.958291956305859,
1453
+ "eval_accuracy-l2": 0.974180734856008,
1454
+ "eval_f1": 0.9632790567097137,
1455
+ "eval_f1-all": 0.9581029967995344,
1456
+ "eval_f1-das": 0.9666543164134863,
1457
+ "eval_f1-l1": 0.9532952776336274,
1458
+ "eval_f1-l1l2": 0.9618759890663215,
1459
+ "eval_f1-l2": 0.9642384105960266,
1460
+ "eval_loss": 0.18276441097259521,
1461
+ "eval_precision": 0.9595078299776286,
1462
+ "eval_precision-all": 0.9498125180271128,
1463
+ "eval_precision-das": 0.9613117170228445,
1464
+ "eval_precision-l1": 0.9425346331452027,
1465
+ "eval_precision-l1l2": 0.9562356979405034,
1466
+ "eval_precision-l2": 0.9591567852437418,
1467
+ "eval_recall": 0.9670800450958287,
1468
+ "eval_recall-all": 0.9665394775462284,
1469
+ "eval_recall-das": 0.9720566318926974,
1470
+ "eval_recall-l1": 0.9643044619422572,
1471
+ "eval_recall-l1l2": 0.9675832127351665,
1472
+ "eval_recall-l2": 0.9693741677762983,
1473
+ "eval_runtime": 6.3479,
1474
+ "eval_samples_per_second": 106.493,
1475
+ "eval_steps_per_second": 6.774,
1476
+ "step": 1400
1477
+ },
1478
+ {
1479
+ "epoch": 3.94,
1480
+ "learning_rate": 7e-05,
1481
+ "loss": 0.1088,
1482
+ "step": 1500
1483
+ },
1484
+ {
1485
+ "epoch": 3.94,
1486
+ "eval_ACT": {
1487
+ "f1": 0.947468958930277,
1488
+ "number": 519,
1489
+ "precision": 0.9393939393939394,
1490
+ "recall": 0.9556840077071291
1491
+ },
1492
+ "eval_ACT_L1": {
1493
+ "f1": 0.962962962962963,
1494
+ "number": 503,
1495
+ "precision": 0.9445506692160612,
1496
+ "recall": 0.9821073558648111
1497
+ },
1498
+ "eval_ACT_L2": {
1499
+ "f1": 0.19047619047619047,
1500
+ "number": 16,
1501
+ "precision": 0.4,
1502
+ "recall": 0.125
1503
+ },
1504
+ "eval_CARDINAL": {
1505
+ "f1": 0.9941089837997055,
1506
+ "number": 678,
1507
+ "precision": 0.9926470588235294,
1508
+ "recall": 0.995575221238938
1509
+ },
1510
+ "eval_DESC": {
1511
+ "f1": 0.3793103448275862,
1512
+ "number": 30,
1513
+ "precision": 0.39285714285714285,
1514
+ "recall": 0.36666666666666664
1515
+ },
1516
+ "eval_FT": {
1517
+ "f1": 0.22222222222222224,
1518
+ "number": 7,
1519
+ "precision": 0.5,
1520
+ "recall": 0.14285714285714285
1521
+ },
1522
+ "eval_LOC": {
1523
+ "f1": 0.9661016949152543,
1524
+ "number": 762,
1525
+ "precision": 0.9598445595854922,
1526
+ "recall": 0.9724409448818898
1527
+ },
1528
+ "eval_PER": {
1529
+ "f1": 0.9867452135493372,
1530
+ "number": 676,
1531
+ "precision": 0.9824046920821115,
1532
+ "recall": 0.9911242603550295
1533
+ },
1534
+ "eval_SPAT": {
1535
+ "f1": 0.9684361549497849,
1536
+ "number": 694,
1537
+ "precision": 0.9642857142857143,
1538
+ "recall": 0.9726224783861671
1539
+ },
1540
+ "eval_TITRE": {
1541
+ "f1": 0.0,
1542
+ "number": 2,
1543
+ "precision": 0.0,
1544
+ "recall": 0.0
1545
+ },
1546
+ "eval_TITREH": {
1547
+ "f1": 0.9142857142857143,
1548
+ "number": 33,
1549
+ "precision": 0.8648648648648649,
1550
+ "recall": 0.9696969696969697
1551
+ },
1552
+ "eval_TITREP": {
1553
+ "f1": 0.5,
1554
+ "number": 6,
1555
+ "precision": 0.5,
1556
+ "recall": 0.5
1557
+ },
1558
+ "eval_accuracy": 0.9623882820258193,
1559
+ "eval_accuracy-all": 0.9726911618669315,
1560
+ "eval_accuracy-das": 0.9746772591857001,
1561
+ "eval_accuracy-l1": 0.967974180734856,
1562
+ "eval_accuracy-l1l2": 0.9631330685203575,
1563
+ "eval_accuracy-l2": 0.9774081429990069,
1564
+ "eval_f1": 0.9703461495095276,
1565
+ "eval_f1-all": 0.9657994738380591,
1566
+ "eval_f1-das": 0.9754738015607581,
1567
+ "eval_f1-l1": 0.9640437727983324,
1568
+ "eval_f1-l1l2": 0.9698107756752853,
1569
+ "eval_f1-l2": 0.9680426098535286,
1570
+ "eval_loss": 0.1590852439403534,
1571
+ "eval_precision": 0.9704555705908886,
1572
+ "eval_precision-all": 0.961863173216885,
1573
+ "eval_precision-das": 0.9729429206819866,
1574
+ "eval_precision-l1": 0.9570615623383342,
1575
+ "eval_precision-l1l2": 0.9679930795847751,
1576
+ "eval_precision-l2": 0.9680426098535286,
1577
+ "eval_recall": 0.9702367531003382,
1578
+ "eval_recall-all": 0.9697681244496624,
1579
+ "eval_recall-das": 0.9780178837555886,
1580
+ "eval_recall-l1": 0.9711286089238845,
1581
+ "eval_recall-l1l2": 0.9716353111432706,
1582
+ "eval_recall-l2": 0.9680426098535286,
1583
+ "eval_runtime": 6.5058,
1584
+ "eval_samples_per_second": 103.908,
1585
+ "eval_steps_per_second": 6.61,
1586
+ "step": 1500
1587
+ }
1588
+ ],
1589
+ "max_steps": 5000,
1590
+ "num_train_epochs": 14,
1591
+ "total_flos": 609170163929712.0,
1592
+ "trial_name": null,
1593
+ "trial_params": null
1594
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fee7b0a5c0cead45cd80a82accf180617d300eb3ff37c6a5e83d93476fdd269
3
+ size 3503