nlpso commited on
Commit
d9298b7
·
1 Parent(s): df51ed7

Load model and tokenizer

Browse files
config.json ADDED
@@ -0,0 +1,91 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "Jean-Baptiste/camembert-ner",
3
+ "architectures": [
4
+ "CamembertForTokenClassification"
5
+ ],
6
+ "attention_probs_dropout_prob": 0.1,
7
+ "bos_token_id": 5,
8
+ "classifier_dropout": null,
9
+ "eos_token_id": 6,
10
+ "gradient_checkpointing": false,
11
+ "hidden_act": "gelu",
12
+ "hidden_dropout_prob": 0.1,
13
+ "hidden_size": 768,
14
+ "id2label": {
15
+ "0": "O+O",
16
+ "1": "I-b_PER+O",
17
+ "2": "I-i_PER+O",
18
+ "3": "I-b_PER+b_TITREH",
19
+ "4": "I-i_PER+b_TITREH",
20
+ "5": "I-i_PER+i_TITREH",
21
+ "6": "I-b_ACT+O",
22
+ "7": "I-i_ACT+O",
23
+ "8": "I-b_DESC+O",
24
+ "9": "I-i_DESC+O",
25
+ "10": "I-b_DESC+b_ACT",
26
+ "11": "I-i_DESC+b_ACT",
27
+ "12": "I-i_DESC+i_ACT",
28
+ "13": "I-b_DESC+b_TITREP",
29
+ "14": "I-i_DESC+b_TITREP",
30
+ "15": "I-i_DESC+i_TITREP",
31
+ "16": "I-b_SPAT+O",
32
+ "17": "I-i_SPAT+O",
33
+ "18": "I-b_SPAT+b_LOC",
34
+ "19": "I-i_SPAT+b_LOC",
35
+ "20": "I-i_SPAT+i_LOC",
36
+ "21": "I-b_SPAT+b_CARDINAL",
37
+ "22": "I-i_SPAT+b_CARDINAL",
38
+ "23": "I-i_SPAT+i_CARDINAL",
39
+ "24": "I-b_SPAT+b_FT",
40
+ "25": "I-i_SPAT+b_FT",
41
+ "26": "I-i_SPAT+i_FT",
42
+ "27": "I-b_TITRE+O",
43
+ "28": "I-i_TITRE+O"
44
+ },
45
+ "initializer_range": 0.02,
46
+ "intermediate_size": 3072,
47
+ "label2id": {
48
+ "I-b_ACT+O": 6,
49
+ "I-b_DESC+O": 8,
50
+ "I-b_DESC+b_ACT": 10,
51
+ "I-b_DESC+b_TITREP": 13,
52
+ "I-b_PER+O": 1,
53
+ "I-b_PER+b_TITREH": 3,
54
+ "I-b_SPAT+O": 16,
55
+ "I-b_SPAT+b_CARDINAL": 21,
56
+ "I-b_SPAT+b_FT": 24,
57
+ "I-b_SPAT+b_LOC": 18,
58
+ "I-b_TITRE+O": 27,
59
+ "I-i_ACT+O": 7,
60
+ "I-i_DESC+O": 9,
61
+ "I-i_DESC+b_ACT": 11,
62
+ "I-i_DESC+b_TITREP": 14,
63
+ "I-i_DESC+i_ACT": 12,
64
+ "I-i_DESC+i_TITREP": 15,
65
+ "I-i_PER+O": 2,
66
+ "I-i_PER+b_TITREH": 4,
67
+ "I-i_PER+i_TITREH": 5,
68
+ "I-i_SPAT+O": 17,
69
+ "I-i_SPAT+b_CARDINAL": 22,
70
+ "I-i_SPAT+b_FT": 25,
71
+ "I-i_SPAT+b_LOC": 19,
72
+ "I-i_SPAT+i_CARDINAL": 23,
73
+ "I-i_SPAT+i_FT": 26,
74
+ "I-i_SPAT+i_LOC": 20,
75
+ "I-i_TITRE+O": 28,
76
+ "O+O": 0
77
+ },
78
+ "layer_norm_eps": 1e-05,
79
+ "max_position_embeddings": 514,
80
+ "model_type": "camembert",
81
+ "num_attention_heads": 12,
82
+ "num_hidden_layers": 12,
83
+ "output_past": true,
84
+ "pad_token_id": 1,
85
+ "position_embedding_type": "absolute",
86
+ "torch_dtype": "float32",
87
+ "transformers_version": "4.25.1",
88
+ "type_vocab_size": 1,
89
+ "use_cache": true,
90
+ "vocab_size": 32005
91
+ }
optimizer.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffb0b74488b6c7f51e4009979a9da81d48e2c37ff1de106f3dd18da1095e18a3
3
+ size 880544613
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73bd9c5e1634f6d07a4bd325f295d84f229ddd978ffeb6a37830aa1b8f613f18
3
+ size 440285681
rng_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:faeb728e59024a5ab1c0ec907ea61fb66dd14a0815881a2e4e4753670bf14047
3
+ size 14503
scheduler.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c1dc559109f5a14fe9958d635fb0eb260fd00c013a8a1d56dd0c334a63c489f
3
+ size 623
sentencepiece.bpe.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:988bc5a00281c6d210a5d34bd143d0363741a432fefe741bf71e61b1869d4314
3
+ size 810912
special_tokens_map.json ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "mask_token": "<mask>",
10
+ "pad_token": "<pad>",
11
+ "sep_token": "</s>",
12
+ "unk_token": "<unk>"
13
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,25 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<s>NOTUSED",
4
+ "</s>NOTUSED"
5
+ ],
6
+ "bos_token": "<s>",
7
+ "cls_token": "<s>",
8
+ "eos_token": "</s>",
9
+ "mask_token": {
10
+ "__type": "AddedToken",
11
+ "content": "<mask>",
12
+ "lstrip": true,
13
+ "normalized": true,
14
+ "rstrip": false,
15
+ "single_word": false
16
+ },
17
+ "model_max_length": 512,
18
+ "name_or_path": "Jean-Baptiste/camembert-ner",
19
+ "pad_token": "<pad>",
20
+ "sep_token": "</s>",
21
+ "sp_model_kwargs": {},
22
+ "special_tokens_map_file": "/lrde/home2/stual/.cache/huggingface/hub/models--Jean-Baptiste--camembert-ner/snapshots/9f8b2203b6a2daba1ad279ac2adb822518caa167/special_tokens_map.json",
23
+ "tokenizer_class": "CamembertTokenizer",
24
+ "unk_token": "<unk>"
25
+ }
trainer_state.json ADDED
@@ -0,0 +1,1698 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.9663580943779635,
3
+ "best_model_checkpoint": "/work/stual/res_ICDAR/method_3/tmp/322-camembert-ner-hierarchical-loss-iob2/checkpoint-1600",
4
+ "epoch": 4.199475065616798,
5
+ "global_step": 1600,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.26,
12
+ "eval_ACT": {
13
+ "f1": 0.8650137741046832,
14
+ "number": 519,
15
+ "precision": 0.8263157894736842,
16
+ "recall": 0.9075144508670521
17
+ },
18
+ "eval_ACT_L1": {
19
+ "f1": 0.8779123951537745,
20
+ "number": 503,
21
+ "precision": 0.8263157894736842,
22
+ "recall": 0.9363817097415507
23
+ },
24
+ "eval_ACT_L2": {
25
+ "f1": 0.0,
26
+ "number": 16,
27
+ "precision": 0.0,
28
+ "recall": 0.0
29
+ },
30
+ "eval_CARDINAL": {
31
+ "f1": 0.9608127721335268,
32
+ "number": 678,
33
+ "precision": 0.9457142857142857,
34
+ "recall": 0.976401179941003
35
+ },
36
+ "eval_DESC": {
37
+ "f1": 0.0,
38
+ "number": 30,
39
+ "precision": 0.0,
40
+ "recall": 0.0
41
+ },
42
+ "eval_FT": {
43
+ "f1": 0.0,
44
+ "number": 7,
45
+ "precision": 0.0,
46
+ "recall": 0.0
47
+ },
48
+ "eval_LOC": {
49
+ "f1": 0.9040207522697795,
50
+ "number": 762,
51
+ "precision": 0.8935897435897436,
52
+ "recall": 0.9146981627296588
53
+ },
54
+ "eval_PER": {
55
+ "f1": 0.9098901098901099,
56
+ "number": 676,
57
+ "precision": 0.9013062409288825,
58
+ "recall": 0.9186390532544378
59
+ },
60
+ "eval_SPAT": {
61
+ "f1": 0.8698060941828255,
62
+ "number": 694,
63
+ "precision": 0.8373333333333334,
64
+ "recall": 0.9048991354466859
65
+ },
66
+ "eval_TITRE": {
67
+ "f1": 0.0,
68
+ "number": 2,
69
+ "precision": 0.0,
70
+ "recall": 0.0
71
+ },
72
+ "eval_TITREH": {
73
+ "f1": 0.0,
74
+ "number": 33,
75
+ "precision": 0.0,
76
+ "recall": 0.0
77
+ },
78
+ "eval_TITREP": {
79
+ "f1": 0.0,
80
+ "number": 6,
81
+ "precision": 0.0,
82
+ "recall": 0.0
83
+ },
84
+ "eval_accuracy": 0.9234371045304987,
85
+ "eval_accuracy-all": 0.9469754492533535,
86
+ "eval_accuracy-das": 0.9468488990129081,
87
+ "eval_accuracy-l1": 0.9316628701594533,
88
+ "eval_accuracy-l1l2": 0.9244495064540622,
89
+ "eval_accuracy-l2": 0.9622880283472539,
90
+ "eval_f1": 0.9209387104123946,
91
+ "eval_f1-all": 0.8929814385150812,
92
+ "eval_f1-das": 0.9186780542146306,
93
+ "eval_f1-l1": 0.8788962698007154,
94
+ "eval_f1-l1l2": 0.9116279069767442,
95
+ "eval_f1-l2": 0.9114688128772636,
96
+ "eval_loss": 0.5969773530960083,
97
+ "eval_precision": 0.9281285878300803,
98
+ "eval_precision-all": 0.882487818859272,
99
+ "eval_precision-das": 0.9159570529433543,
100
+ "eval_precision-l1": 0.8561473369835739,
101
+ "eval_precision-l1l2": 0.9118929921488805,
102
+ "eval_precision-l2": 0.9182432432432432,
103
+ "eval_recall": 0.9138593714673299,
104
+ "eval_recall-all": 0.9037276196066921,
105
+ "eval_recall-das": 0.921415270018622,
106
+ "eval_recall-l1": 0.9028871391076115,
107
+ "eval_recall-l1l2": 0.9113629758791049,
108
+ "eval_recall-l2": 0.9047936085219707,
109
+ "eval_runtime": 6.8404,
110
+ "eval_samples_per_second": 98.825,
111
+ "eval_steps_per_second": 6.286,
112
+ "step": 100
113
+ },
114
+ {
115
+ "epoch": 0.52,
116
+ "eval_ACT": {
117
+ "f1": 0.871889400921659,
118
+ "number": 519,
119
+ "precision": 0.8356890459363958,
120
+ "recall": 0.9113680154142582
121
+ },
122
+ "eval_ACT_L1": {
123
+ "f1": 0.8849391955098223,
124
+ "number": 503,
125
+ "precision": 0.8356890459363958,
126
+ "recall": 0.9403578528827038
127
+ },
128
+ "eval_ACT_L2": {
129
+ "f1": 0.0,
130
+ "number": 16,
131
+ "precision": 0.0,
132
+ "recall": 0.0
133
+ },
134
+ "eval_CARDINAL": {
135
+ "f1": 0.965768390386016,
136
+ "number": 678,
137
+ "precision": 0.9539568345323741,
138
+ "recall": 0.9778761061946902
139
+ },
140
+ "eval_DESC": {
141
+ "f1": 0.0,
142
+ "number": 30,
143
+ "precision": 0.0,
144
+ "recall": 0.0
145
+ },
146
+ "eval_FT": {
147
+ "f1": 0.0,
148
+ "number": 7,
149
+ "precision": 0.0,
150
+ "recall": 0.0
151
+ },
152
+ "eval_LOC": {
153
+ "f1": 0.9341935483870968,
154
+ "number": 762,
155
+ "precision": 0.9187817258883249,
156
+ "recall": 0.9501312335958005
157
+ },
158
+ "eval_PER": {
159
+ "f1": 0.9242089771891097,
160
+ "number": 676,
161
+ "precision": 0.9194729136163983,
162
+ "recall": 0.9289940828402367
163
+ },
164
+ "eval_SPAT": {
165
+ "f1": 0.9322033898305087,
166
+ "number": 694,
167
+ "precision": 0.9141274238227147,
168
+ "recall": 0.9510086455331412
169
+ },
170
+ "eval_TITRE": {
171
+ "f1": 0.0,
172
+ "number": 2,
173
+ "precision": 0.0,
174
+ "recall": 0.0
175
+ },
176
+ "eval_TITREH": {
177
+ "f1": 0.0,
178
+ "number": 33,
179
+ "precision": 0.0,
180
+ "recall": 0.0
181
+ },
182
+ "eval_TITREP": {
183
+ "f1": 0.0,
184
+ "number": 6,
185
+ "precision": 0.0,
186
+ "recall": 0.0
187
+ },
188
+ "eval_accuracy": 0.9330549228043533,
189
+ "eval_accuracy-all": 0.9520374588711719,
190
+ "eval_accuracy-das": 0.9511516071880537,
191
+ "eval_accuracy-l1": 0.9421665401164262,
192
+ "eval_accuracy-l1l2": 0.9338142242470261,
193
+ "eval_accuracy-l2": 0.9619083776259175,
194
+ "eval_f1": 0.9332123823562762,
195
+ "eval_f1-all": 0.9176504882670165,
196
+ "eval_f1-das": 0.9288500835965074,
197
+ "eval_f1-l1": 0.9086687306501549,
198
+ "eval_f1-l1l2": 0.9253947559032305,
199
+ "eval_f1-l2": 0.9293132328308208,
200
+ "eval_loss": 0.38377615809440613,
201
+ "eval_precision": 0.9360782529572339,
202
+ "eval_precision-all": 0.9114070642733063,
203
+ "eval_precision-das": 0.9266123054114158,
204
+ "eval_precision-l1": 0.893455098934551,
205
+ "eval_precision-l1l2": 0.9225880993645291,
206
+ "eval_precision-l2": 0.935266351989211,
207
+ "eval_recall": 0.9303640063305448,
208
+ "eval_recall-all": 0.9239800410918697,
209
+ "eval_recall-das": 0.931098696461825,
210
+ "eval_recall-l1": 0.9244094488188976,
211
+ "eval_recall-l1l2": 0.9282185411217669,
212
+ "eval_recall-l2": 0.9234354194407457,
213
+ "eval_runtime": 6.6668,
214
+ "eval_samples_per_second": 101.398,
215
+ "eval_steps_per_second": 6.45,
216
+ "step": 200
217
+ },
218
+ {
219
+ "epoch": 0.79,
220
+ "eval_ACT": {
221
+ "f1": 0.9262759924385633,
222
+ "number": 519,
223
+ "precision": 0.9090909090909091,
224
+ "recall": 0.9441233140655106
225
+ },
226
+ "eval_ACT_L1": {
227
+ "f1": 0.9404990403071017,
228
+ "number": 503,
229
+ "precision": 0.9090909090909091,
230
+ "recall": 0.974155069582505
231
+ },
232
+ "eval_ACT_L2": {
233
+ "f1": 0.0,
234
+ "number": 16,
235
+ "precision": 0.0,
236
+ "recall": 0.0
237
+ },
238
+ "eval_CARDINAL": {
239
+ "f1": 0.9672250546249092,
240
+ "number": 678,
241
+ "precision": 0.9553956834532374,
242
+ "recall": 0.9793510324483776
243
+ },
244
+ "eval_DESC": {
245
+ "f1": 0.0,
246
+ "number": 30,
247
+ "precision": 0.0,
248
+ "recall": 0.0
249
+ },
250
+ "eval_FT": {
251
+ "f1": 0.0,
252
+ "number": 7,
253
+ "precision": 0.0,
254
+ "recall": 0.0
255
+ },
256
+ "eval_LOC": {
257
+ "f1": 0.9270767279644896,
258
+ "number": 762,
259
+ "precision": 0.8969325153374234,
260
+ "recall": 0.9593175853018373
261
+ },
262
+ "eval_PER": {
263
+ "f1": 0.9270449521002211,
264
+ "number": 676,
265
+ "precision": 0.9236417033773862,
266
+ "recall": 0.9304733727810651
267
+ },
268
+ "eval_SPAT": {
269
+ "f1": 0.9272727272727274,
270
+ "number": 694,
271
+ "precision": 0.9008152173913043,
272
+ "recall": 0.9553314121037464
273
+ },
274
+ "eval_TITRE": {
275
+ "f1": 0.0,
276
+ "number": 2,
277
+ "precision": 0.0,
278
+ "recall": 0.0
279
+ },
280
+ "eval_TITREH": {
281
+ "f1": 0.3181818181818182,
282
+ "number": 33,
283
+ "precision": 0.6363636363636364,
284
+ "recall": 0.21212121212121213
285
+ },
286
+ "eval_TITREP": {
287
+ "f1": 0.0,
288
+ "number": 6,
289
+ "precision": 0.0,
290
+ "recall": 0.0
291
+ },
292
+ "eval_accuracy": 0.9422930903568717,
293
+ "eval_accuracy-all": 0.956656542647431,
294
+ "eval_accuracy-das": 0.9616552771450265,
295
+ "eval_accuracy-l1": 0.9492533535813718,
296
+ "eval_accuracy-l1l2": 0.9425461908377626,
297
+ "eval_accuracy-l2": 0.9640597317134902,
298
+ "eval_f1": 0.9428926834784576,
299
+ "eval_f1-all": 0.9228985507246376,
300
+ "eval_f1-das": 0.9365871695322611,
301
+ "eval_f1-l1": 0.9192674748516895,
302
+ "eval_f1-l1l2": 0.9350086655112652,
303
+ "eval_f1-l2": 0.9275554085345683,
304
+ "eval_loss": 0.2978482246398926,
305
+ "eval_precision": 0.9432126696832579,
306
+ "eval_precision-all": 0.911537360435156,
307
+ "eval_precision-das": 0.9298825256975036,
308
+ "eval_precision-l1": 0.9036511156186613,
309
+ "eval_precision-l1l2": 0.9293712316968131,
310
+ "eval_precision-l2": 0.9217619986850756,
311
+ "eval_recall": 0.9425729143115532,
312
+ "eval_recall-all": 0.9345465218667449,
313
+ "eval_recall-das": 0.943389199255121,
314
+ "eval_recall-l1": 0.9354330708661417,
315
+ "eval_recall-l1l2": 0.9407149084568439,
316
+ "eval_recall-l2": 0.933422103861518,
317
+ "eval_runtime": 6.9078,
318
+ "eval_samples_per_second": 97.861,
319
+ "eval_steps_per_second": 6.225,
320
+ "step": 300
321
+ },
322
+ {
323
+ "epoch": 1.05,
324
+ "eval_ACT": {
325
+ "f1": 0.9080675422138836,
326
+ "number": 519,
327
+ "precision": 0.8848263254113345,
328
+ "recall": 0.9325626204238922
329
+ },
330
+ "eval_ACT_L1": {
331
+ "f1": 0.9219047619047619,
332
+ "number": 503,
333
+ "precision": 0.8848263254113345,
334
+ "recall": 0.9622266401590457
335
+ },
336
+ "eval_ACT_L2": {
337
+ "f1": 0.0,
338
+ "number": 16,
339
+ "precision": 0.0,
340
+ "recall": 0.0
341
+ },
342
+ "eval_CARDINAL": {
343
+ "f1": 0.9860396767083027,
344
+ "number": 678,
345
+ "precision": 0.9824304538799414,
346
+ "recall": 0.9896755162241888
347
+ },
348
+ "eval_DESC": {
349
+ "f1": 0.0,
350
+ "number": 30,
351
+ "precision": 0.0,
352
+ "recall": 0.0
353
+ },
354
+ "eval_FT": {
355
+ "f1": 0.0,
356
+ "number": 7,
357
+ "precision": 0.0,
358
+ "recall": 0.0
359
+ },
360
+ "eval_LOC": {
361
+ "f1": 0.9439374185136897,
362
+ "number": 762,
363
+ "precision": 0.9378238341968912,
364
+ "recall": 0.9501312335958005
365
+ },
366
+ "eval_PER": {
367
+ "f1": 0.9616519174041299,
368
+ "number": 676,
369
+ "precision": 0.9588235294117647,
370
+ "recall": 0.9644970414201184
371
+ },
372
+ "eval_SPAT": {
373
+ "f1": 0.9435310936383131,
374
+ "number": 694,
375
+ "precision": 0.9361702127659575,
376
+ "recall": 0.9510086455331412
377
+ },
378
+ "eval_TITRE": {
379
+ "f1": 0.0,
380
+ "number": 2,
381
+ "precision": 0.0,
382
+ "recall": 0.0
383
+ },
384
+ "eval_TITREH": {
385
+ "f1": 0.32258064516129037,
386
+ "number": 33,
387
+ "precision": 0.3448275862068966,
388
+ "recall": 0.30303030303030304
389
+ },
390
+ "eval_TITREP": {
391
+ "f1": 0.0,
392
+ "number": 6,
393
+ "precision": 0.0,
394
+ "recall": 0.0
395
+ },
396
+ "eval_accuracy": 0.9446975449253353,
397
+ "eval_accuracy-all": 0.9616552771450265,
398
+ "eval_accuracy-das": 0.9641862819539357,
399
+ "eval_accuracy-l1": 0.9526702100733991,
400
+ "eval_accuracy-l1l2": 0.9450771956466717,
401
+ "eval_accuracy-l2": 0.970640344216654,
402
+ "eval_f1": 0.9483929379809869,
403
+ "eval_f1-all": 0.9356913183279743,
404
+ "eval_f1-das": 0.9449814126394052,
405
+ "eval_f1-l1": 0.9315352697095436,
406
+ "eval_f1-l1l2": 0.9384215091066782,
407
+ "eval_f1-l2": 0.9410582719356999,
408
+ "eval_loss": 0.2418714463710785,
409
+ "eval_precision": 0.9494674824382506,
410
+ "eval_precision-all": 0.9318777292576419,
411
+ "eval_precision-das": 0.9432282003710575,
412
+ "eval_precision-l1": 0.920553562275756,
413
+ "eval_precision-l1l2": 0.9335634167385677,
414
+ "eval_precision-l2": 0.9467654986522911,
415
+ "eval_recall": 0.9473208229708343,
416
+ "eval_recall-all": 0.939536248899325,
417
+ "eval_recall-das": 0.9467411545623836,
418
+ "eval_recall-l1": 0.9427821522309712,
419
+ "eval_recall-l1l2": 0.9433304272013949,
420
+ "eval_recall-l2": 0.9354194407456724,
421
+ "eval_runtime": 6.7353,
422
+ "eval_samples_per_second": 100.367,
423
+ "eval_steps_per_second": 6.384,
424
+ "step": 400
425
+ },
426
+ {
427
+ "epoch": 1.31,
428
+ "learning_rate": 9e-05,
429
+ "loss": 0.561,
430
+ "step": 500
431
+ },
432
+ {
433
+ "epoch": 1.31,
434
+ "eval_ACT": {
435
+ "f1": 0.9264150943396225,
436
+ "number": 519,
437
+ "precision": 0.9075785582255084,
438
+ "recall": 0.9460500963391136
439
+ },
440
+ "eval_ACT_L1": {
441
+ "f1": 0.9406130268199234,
442
+ "number": 503,
443
+ "precision": 0.9075785582255084,
444
+ "recall": 0.9761431411530815
445
+ },
446
+ "eval_ACT_L2": {
447
+ "f1": 0.0,
448
+ "number": 16,
449
+ "precision": 0.0,
450
+ "recall": 0.0
451
+ },
452
+ "eval_CARDINAL": {
453
+ "f1": 0.9824561403508772,
454
+ "number": 678,
455
+ "precision": 0.9739130434782609,
456
+ "recall": 0.9911504424778761
457
+ },
458
+ "eval_DESC": {
459
+ "f1": 0.04,
460
+ "number": 30,
461
+ "precision": 0.05,
462
+ "recall": 0.03333333333333333
463
+ },
464
+ "eval_FT": {
465
+ "f1": 0.0,
466
+ "number": 7,
467
+ "precision": 0.0,
468
+ "recall": 0.0
469
+ },
470
+ "eval_LOC": {
471
+ "f1": 0.9362808842652797,
472
+ "number": 762,
473
+ "precision": 0.9278350515463918,
474
+ "recall": 0.9448818897637795
475
+ },
476
+ "eval_PER": {
477
+ "f1": 0.948377581120944,
478
+ "number": 676,
479
+ "precision": 0.9455882352941176,
480
+ "recall": 0.9511834319526628
481
+ },
482
+ "eval_SPAT": {
483
+ "f1": 0.9446022727272728,
484
+ "number": 694,
485
+ "precision": 0.9313725490196079,
486
+ "recall": 0.9582132564841499
487
+ },
488
+ "eval_TITRE": {
489
+ "f1": 0.0,
490
+ "number": 2,
491
+ "precision": 0.0,
492
+ "recall": 0.0
493
+ },
494
+ "eval_TITREH": {
495
+ "f1": 0.40579710144927533,
496
+ "number": 33,
497
+ "precision": 0.3888888888888889,
498
+ "recall": 0.42424242424242425
499
+ },
500
+ "eval_TITREP": {
501
+ "f1": 0.0,
502
+ "number": 6,
503
+ "precision": 0.0,
504
+ "recall": 0.0
505
+ },
506
+ "eval_accuracy": 0.9503923057453809,
507
+ "eval_accuracy-all": 0.964123006833713,
508
+ "eval_accuracy-das": 0.9665907365223994,
509
+ "eval_accuracy-l1": 0.9588711718552265,
510
+ "eval_accuracy-l1l2": 0.9507719564667173,
511
+ "eval_accuracy-l2": 0.9693748418121995,
512
+ "eval_f1": 0.9477367648718816,
513
+ "eval_f1-all": 0.9341491841491842,
514
+ "eval_f1-das": 0.9472511144130759,
515
+ "eval_f1-l1": 0.932642487046632,
516
+ "eval_f1-l1l2": 0.9404624277456647,
517
+ "eval_f1-l2": 0.9360852197070573,
518
+ "eval_loss": 0.2279864400625229,
519
+ "eval_precision": 0.9463480613165014,
520
+ "eval_precision-all": 0.9273936939542956,
521
+ "eval_precision-das": 0.9447943682845499,
522
+ "eval_precision-l1": 0.9207161125319693,
523
+ "eval_precision-l1l2": 0.9353262431733257,
524
+ "eval_precision-l2": 0.9360852197070573,
525
+ "eval_recall": 0.9491295500791318,
526
+ "eval_recall-all": 0.9410038156736131,
527
+ "eval_recall-das": 0.9497206703910615,
528
+ "eval_recall-l1": 0.9448818897637795,
529
+ "eval_recall-l1l2": 0.9456553327521069,
530
+ "eval_recall-l2": 0.9360852197070573,
531
+ "eval_runtime": 6.9814,
532
+ "eval_samples_per_second": 96.828,
533
+ "eval_steps_per_second": 6.159,
534
+ "step": 500
535
+ },
536
+ {
537
+ "epoch": 1.57,
538
+ "eval_ACT": {
539
+ "f1": 0.9343482397716459,
540
+ "number": 519,
541
+ "precision": 0.9229323308270677,
542
+ "recall": 0.9460500963391136
543
+ },
544
+ "eval_ACT_L1": {
545
+ "f1": 0.948792270531401,
546
+ "number": 503,
547
+ "precision": 0.9229323308270677,
548
+ "recall": 0.9761431411530815
549
+ },
550
+ "eval_ACT_L2": {
551
+ "f1": 0.0,
552
+ "number": 16,
553
+ "precision": 0.0,
554
+ "recall": 0.0
555
+ },
556
+ "eval_CARDINAL": {
557
+ "f1": 0.9882179675994109,
558
+ "number": 678,
559
+ "precision": 0.986764705882353,
560
+ "recall": 0.9896755162241888
561
+ },
562
+ "eval_DESC": {
563
+ "f1": 0.07692307692307691,
564
+ "number": 30,
565
+ "precision": 0.09090909090909091,
566
+ "recall": 0.06666666666666667
567
+ },
568
+ "eval_FT": {
569
+ "f1": 0.0,
570
+ "number": 7,
571
+ "precision": 0.0,
572
+ "recall": 0.0
573
+ },
574
+ "eval_LOC": {
575
+ "f1": 0.9483322432962721,
576
+ "number": 762,
577
+ "precision": 0.9452411994784876,
578
+ "recall": 0.9514435695538058
579
+ },
580
+ "eval_PER": {
581
+ "f1": 0.9254612546125461,
582
+ "number": 676,
583
+ "precision": 0.9234167893961709,
584
+ "recall": 0.9275147928994083
585
+ },
586
+ "eval_SPAT": {
587
+ "f1": 0.952108649035025,
588
+ "number": 694,
589
+ "precision": 0.9446808510638298,
590
+ "recall": 0.9596541786743515
591
+ },
592
+ "eval_TITRE": {
593
+ "f1": 0.0,
594
+ "number": 2,
595
+ "precision": 0.0,
596
+ "recall": 0.0
597
+ },
598
+ "eval_TITREH": {
599
+ "f1": 0.3283582089552239,
600
+ "number": 33,
601
+ "precision": 0.3235294117647059,
602
+ "recall": 0.3333333333333333
603
+ },
604
+ "eval_TITREP": {
605
+ "f1": 0.0,
606
+ "number": 6,
607
+ "precision": 0.0,
608
+ "recall": 0.0
609
+ },
610
+ "eval_accuracy": 0.9458364970893445,
611
+ "eval_accuracy-all": 0.9623513034674765,
612
+ "eval_accuracy-das": 0.9616552771450265,
613
+ "eval_accuracy-l1": 0.9564667172867628,
614
+ "eval_accuracy-l1l2": 0.9463426980511263,
615
+ "eval_accuracy-l2": 0.9682358896481903,
616
+ "eval_f1": 0.9478694469628286,
617
+ "eval_f1-all": 0.9355405801347787,
618
+ "eval_f1-das": 0.9418127564341664,
619
+ "eval_f1-l1": 0.9294821753838147,
620
+ "eval_f1-l1l2": 0.9375181633246149,
621
+ "eval_f1-l2": 0.9433456252095207,
622
+ "eval_loss": 0.22755712270736694,
623
+ "eval_precision": 0.9502385821404227,
624
+ "eval_precision-all": 0.9338988008189529,
625
+ "eval_precision-das": 0.9432200224131491,
626
+ "eval_precision-l1": 0.9215686274509803,
627
+ "eval_precision-l1l2": 0.9375181633246149,
628
+ "eval_precision-l2": 0.950033760972316,
629
+ "eval_recall": 0.9455120958625367,
630
+ "eval_recall-all": 0.9371881420604637,
631
+ "eval_recall-das": 0.9404096834264432,
632
+ "eval_recall-l1": 0.9375328083989501,
633
+ "eval_recall-l1l2": 0.9375181633246149,
634
+ "eval_recall-l2": 0.936750998668442,
635
+ "eval_runtime": 6.9231,
636
+ "eval_samples_per_second": 97.644,
637
+ "eval_steps_per_second": 6.211,
638
+ "step": 600
639
+ },
640
+ {
641
+ "epoch": 1.84,
642
+ "eval_ACT": {
643
+ "f1": 0.8997188378631678,
644
+ "number": 519,
645
+ "precision": 0.8759124087591241,
646
+ "recall": 0.9248554913294798
647
+ },
648
+ "eval_ACT_L1": {
649
+ "f1": 0.9239653512993262,
650
+ "number": 503,
651
+ "precision": 0.8955223880597015,
652
+ "recall": 0.9542743538767395
653
+ },
654
+ "eval_ACT_L2": {
655
+ "f1": 0.0,
656
+ "number": 16,
657
+ "precision": 0.0,
658
+ "recall": 0.0
659
+ },
660
+ "eval_CARDINAL": {
661
+ "f1": 0.9882179675994109,
662
+ "number": 678,
663
+ "precision": 0.986764705882353,
664
+ "recall": 0.9896755162241888
665
+ },
666
+ "eval_DESC": {
667
+ "f1": 0.24324324324324326,
668
+ "number": 30,
669
+ "precision": 0.20454545454545456,
670
+ "recall": 0.3
671
+ },
672
+ "eval_FT": {
673
+ "f1": 0.0,
674
+ "number": 7,
675
+ "precision": 0.0,
676
+ "recall": 0.0
677
+ },
678
+ "eval_LOC": {
679
+ "f1": 0.9250645994832041,
680
+ "number": 762,
681
+ "precision": 0.910941475826972,
682
+ "recall": 0.9396325459317585
683
+ },
684
+ "eval_PER": {
685
+ "f1": 0.9712601326455416,
686
+ "number": 676,
687
+ "precision": 0.9676945668135095,
688
+ "recall": 0.9748520710059172
689
+ },
690
+ "eval_SPAT": {
691
+ "f1": 0.9321912919343327,
692
+ "number": 694,
693
+ "precision": 0.9236209335219236,
694
+ "recall": 0.9409221902017291
695
+ },
696
+ "eval_TITRE": {
697
+ "f1": 0.0,
698
+ "number": 2,
699
+ "precision": 0.0,
700
+ "recall": 0.0
701
+ },
702
+ "eval_TITREH": {
703
+ "f1": 0.6666666666666666,
704
+ "number": 33,
705
+ "precision": 0.5625,
706
+ "recall": 0.8181818181818182
707
+ },
708
+ "eval_TITREP": {
709
+ "f1": 0.0,
710
+ "number": 6,
711
+ "precision": 0.0,
712
+ "recall": 0.0
713
+ },
714
+ "eval_accuracy": 0.9505188559858264,
715
+ "eval_accuracy-all": 0.9654517843583903,
716
+ "eval_accuracy-das": 0.9669703872437357,
717
+ "eval_accuracy-l1": 0.9611490761832447,
718
+ "eval_accuracy-l1l2": 0.9510250569476082,
719
+ "eval_accuracy-l2": 0.9697544925335359,
720
+ "eval_f1": 0.9473565804274465,
721
+ "eval_f1-all": 0.9317490218808867,
722
+ "eval_f1-das": 0.9491839762611276,
723
+ "eval_f1-l1": 0.930028401755745,
724
+ "eval_f1-l1l2": 0.9392201834862385,
725
+ "eval_f1-l2": 0.9339498018494057,
726
+ "eval_loss": 0.2043749988079071,
727
+ "eval_precision": 0.9426908439668682,
728
+ "eval_precision-all": 0.9201488265598168,
729
+ "eval_precision-das": 0.9453269301810122,
730
+ "eval_precision-l1": 0.9151422764227642,
731
+ "eval_precision-l1l2": 0.9267326732673268,
732
+ "eval_precision-l2": 0.926605504587156,
733
+ "eval_recall": 0.9520687316301153,
734
+ "eval_recall-all": 0.943645435867332,
735
+ "eval_recall-das": 0.9530726256983241,
736
+ "eval_recall-l1": 0.9454068241469816,
737
+ "eval_recall-l1l2": 0.9520488230165649,
738
+ "eval_recall-l2": 0.9414114513981359,
739
+ "eval_runtime": 6.6319,
740
+ "eval_samples_per_second": 101.932,
741
+ "eval_steps_per_second": 6.484,
742
+ "step": 700
743
+ },
744
+ {
745
+ "epoch": 2.1,
746
+ "eval_ACT": {
747
+ "f1": 0.9188679245283018,
748
+ "number": 519,
749
+ "precision": 0.9001848428835489,
750
+ "recall": 0.9383429672447013
751
+ },
752
+ "eval_ACT_L1": {
753
+ "f1": 0.9427740058195926,
754
+ "number": 503,
755
+ "precision": 0.9204545454545454,
756
+ "recall": 0.9662027833001988
757
+ },
758
+ "eval_ACT_L2": {
759
+ "f1": 0.06896551724137931,
760
+ "number": 16,
761
+ "precision": 0.07692307692307693,
762
+ "recall": 0.0625
763
+ },
764
+ "eval_CARDINAL": {
765
+ "f1": 0.9838472834067548,
766
+ "number": 678,
767
+ "precision": 0.97953216374269,
768
+ "recall": 0.9882005899705014
769
+ },
770
+ "eval_DESC": {
771
+ "f1": 0.29850746268656714,
772
+ "number": 30,
773
+ "precision": 0.2702702702702703,
774
+ "recall": 0.3333333333333333
775
+ },
776
+ "eval_FT": {
777
+ "f1": 0.0,
778
+ "number": 7,
779
+ "precision": 0.0,
780
+ "recall": 0.0
781
+ },
782
+ "eval_LOC": {
783
+ "f1": 0.9433962264150944,
784
+ "number": 762,
785
+ "precision": 0.9354838709677419,
786
+ "recall": 0.9514435695538058
787
+ },
788
+ "eval_PER": {
789
+ "f1": 0.9638376383763838,
790
+ "number": 676,
791
+ "precision": 0.9617083946980854,
792
+ "recall": 0.9659763313609467
793
+ },
794
+ "eval_SPAT": {
795
+ "f1": 0.9472182596291013,
796
+ "number": 694,
797
+ "precision": 0.9378531073446328,
798
+ "recall": 0.9567723342939481
799
+ },
800
+ "eval_TITRE": {
801
+ "f1": 0.0,
802
+ "number": 2,
803
+ "precision": 0.0,
804
+ "recall": 0.0
805
+ },
806
+ "eval_TITREH": {
807
+ "f1": 0.6857142857142857,
808
+ "number": 33,
809
+ "precision": 0.6486486486486487,
810
+ "recall": 0.7272727272727273
811
+ },
812
+ "eval_TITREP": {
813
+ "f1": 0.0,
814
+ "number": 6,
815
+ "precision": 0.0,
816
+ "recall": 0.0
817
+ },
818
+ "eval_accuracy": 0.9502657555049354,
819
+ "eval_accuracy-all": 0.9630473297899266,
820
+ "eval_accuracy-das": 0.9681093394077449,
821
+ "eval_accuracy-l1": 0.9578587699316629,
822
+ "eval_accuracy-l1l2": 0.9507719564667173,
823
+ "eval_accuracy-l2": 0.9682358896481903,
824
+ "eval_f1": 0.953853097145436,
825
+ "eval_f1-all": 0.9413306158101615,
826
+ "eval_f1-das": 0.9552626693892705,
827
+ "eval_f1-l1": 0.9401088929219601,
828
+ "eval_f1-l1l2": 0.9481588447653428,
829
+ "eval_f1-l2": 0.9428950863213811,
830
+ "eval_loss": 0.18969722092151642,
831
+ "eval_precision": 0.952027027027027,
832
+ "eval_precision-all": 0.9338532640092432,
833
+ "eval_precision-das": 0.9522575869726129,
834
+ "eval_precision-l1": 0.9287909836065574,
835
+ "eval_precision-l1l2": 0.9423076923076923,
836
+ "eval_precision-l2": 0.9403973509933775,
837
+ "eval_recall": 0.9556861858467104,
838
+ "eval_recall-all": 0.9489286762547696,
839
+ "eval_recall-das": 0.9582867783985103,
840
+ "eval_recall-l1": 0.9517060367454068,
841
+ "eval_recall-l1l2": 0.9540831153734379,
842
+ "eval_recall-l2": 0.9454061251664447,
843
+ "eval_runtime": 7.376,
844
+ "eval_samples_per_second": 91.648,
845
+ "eval_steps_per_second": 5.83,
846
+ "step": 800
847
+ },
848
+ {
849
+ "epoch": 2.36,
850
+ "eval_ACT": {
851
+ "f1": 0.9351145038167938,
852
+ "number": 519,
853
+ "precision": 0.9262759924385633,
854
+ "recall": 0.9441233140655106
855
+ },
856
+ "eval_ACT_L1": {
857
+ "f1": 0.949514563106796,
858
+ "number": 503,
859
+ "precision": 0.9278937381404174,
860
+ "recall": 0.9721669980119284
861
+ },
862
+ "eval_ACT_L2": {
863
+ "f1": 0.1111111111111111,
864
+ "number": 16,
865
+ "precision": 0.5,
866
+ "recall": 0.0625
867
+ },
868
+ "eval_CARDINAL": {
869
+ "f1": 0.986019131714496,
870
+ "number": 678,
871
+ "precision": 0.9838472834067548,
872
+ "recall": 0.9882005899705014
873
+ },
874
+ "eval_DESC": {
875
+ "f1": 0.32,
876
+ "number": 30,
877
+ "precision": 0.4,
878
+ "recall": 0.26666666666666666
879
+ },
880
+ "eval_FT": {
881
+ "f1": 0.0,
882
+ "number": 7,
883
+ "precision": 0.0,
884
+ "recall": 0.0
885
+ },
886
+ "eval_LOC": {
887
+ "f1": 0.9252577319587628,
888
+ "number": 762,
889
+ "precision": 0.9088607594936708,
890
+ "recall": 0.9422572178477691
891
+ },
892
+ "eval_PER": {
893
+ "f1": 0.9705449189985274,
894
+ "number": 676,
895
+ "precision": 0.966275659824047,
896
+ "recall": 0.9748520710059172
897
+ },
898
+ "eval_SPAT": {
899
+ "f1": 0.9371428571428572,
900
+ "number": 694,
901
+ "precision": 0.9291784702549575,
902
+ "recall": 0.9452449567723343
903
+ },
904
+ "eval_TITRE": {
905
+ "f1": 0.0,
906
+ "number": 2,
907
+ "precision": 0.0,
908
+ "recall": 0.0
909
+ },
910
+ "eval_TITREH": {
911
+ "f1": 0.6666666666666667,
912
+ "number": 33,
913
+ "precision": 0.5952380952380952,
914
+ "recall": 0.7575757575757576
915
+ },
916
+ "eval_TITREP": {
917
+ "f1": 0.0,
918
+ "number": 6,
919
+ "precision": 0.0,
920
+ "recall": 0.0
921
+ },
922
+ "eval_accuracy": 0.9520374588711719,
923
+ "eval_accuracy-all": 0.9636168058719311,
924
+ "eval_accuracy-das": 0.9689951910908631,
925
+ "eval_accuracy-l1": 0.9600101240192357,
926
+ "eval_accuracy-l1l2": 0.9525436598329536,
927
+ "eval_accuracy-l2": 0.9672234877246266,
928
+ "eval_f1": 0.955247435463871,
929
+ "eval_f1-all": 0.9405247813411078,
930
+ "eval_f1-das": 0.9516577143915541,
931
+ "eval_f1-l1": 0.9437500000000001,
932
+ "eval_f1-l1l2": 0.9492994366604072,
933
+ "eval_f1-l2": 0.9364238410596026,
934
+ "eval_loss": 0.20938263833522797,
935
+ "eval_precision": 0.9525629496402878,
936
+ "eval_precision-all": 0.9342600637127135,
937
+ "eval_precision-das": 0.9465733235077377,
938
+ "eval_precision-l1": 0.9364341085271318,
939
+ "eval_precision-l1l2": 0.9437105112004595,
940
+ "eval_precision-l2": 0.9314888010540184,
941
+ "eval_recall": 0.9579470947320823,
942
+ "eval_recall-all": 0.9468740827707661,
943
+ "eval_recall-das": 0.9567970204841714,
944
+ "eval_recall-l1": 0.9511811023622048,
945
+ "eval_recall-l1l2": 0.954954954954955,
946
+ "eval_recall-l2": 0.9414114513981359,
947
+ "eval_runtime": 7.1684,
948
+ "eval_samples_per_second": 94.303,
949
+ "eval_steps_per_second": 5.999,
950
+ "step": 900
951
+ },
952
+ {
953
+ "epoch": 2.62,
954
+ "learning_rate": 8e-05,
955
+ "loss": 0.1912,
956
+ "step": 1000
957
+ },
958
+ {
959
+ "epoch": 2.62,
960
+ "eval_ACT": {
961
+ "f1": 0.9382716049382717,
962
+ "number": 519,
963
+ "precision": 0.9250936329588015,
964
+ "recall": 0.9518304431599229
965
+ },
966
+ "eval_ACT_L1": {
967
+ "f1": 0.960552268244576,
968
+ "number": 503,
969
+ "precision": 0.9530332681017613,
970
+ "recall": 0.9681908548707754
971
+ },
972
+ "eval_ACT_L2": {
973
+ "f1": 0.358974358974359,
974
+ "number": 16,
975
+ "precision": 0.30434782608695654,
976
+ "recall": 0.4375
977
+ },
978
+ "eval_CARDINAL": {
979
+ "f1": 0.9859985261606484,
980
+ "number": 678,
981
+ "precision": 0.9852724594992637,
982
+ "recall": 0.9867256637168141
983
+ },
984
+ "eval_DESC": {
985
+ "f1": 0.4102564102564102,
986
+ "number": 30,
987
+ "precision": 0.3333333333333333,
988
+ "recall": 0.5333333333333333
989
+ },
990
+ "eval_FT": {
991
+ "f1": 0.0,
992
+ "number": 7,
993
+ "precision": 0.0,
994
+ "recall": 0.0
995
+ },
996
+ "eval_LOC": {
997
+ "f1": 0.9557291666666666,
998
+ "number": 762,
999
+ "precision": 0.9483204134366925,
1000
+ "recall": 0.963254593175853
1001
+ },
1002
+ "eval_PER": {
1003
+ "f1": 0.9741697416974169,
1004
+ "number": 676,
1005
+ "precision": 0.9720176730486009,
1006
+ "recall": 0.9763313609467456
1007
+ },
1008
+ "eval_SPAT": {
1009
+ "f1": 0.952108649035025,
1010
+ "number": 694,
1011
+ "precision": 0.9446808510638298,
1012
+ "recall": 0.9596541786743515
1013
+ },
1014
+ "eval_TITRE": {
1015
+ "f1": 0.0,
1016
+ "number": 2,
1017
+ "precision": 0.0,
1018
+ "recall": 0.0
1019
+ },
1020
+ "eval_TITREH": {
1021
+ "f1": 0.7941176470588236,
1022
+ "number": 33,
1023
+ "precision": 0.7714285714285715,
1024
+ "recall": 0.8181818181818182
1025
+ },
1026
+ "eval_TITREP": {
1027
+ "f1": 0.3636363636363636,
1028
+ "number": 6,
1029
+ "precision": 0.4,
1030
+ "recall": 0.3333333333333333
1031
+ },
1032
+ "eval_accuracy": 0.9583649708934447,
1033
+ "eval_accuracy-all": 0.9694381169324222,
1034
+ "eval_accuracy-das": 0.9744368514300177,
1035
+ "eval_accuracy-l1": 0.9646924829157175,
1036
+ "eval_accuracy-l1l2": 0.958997722095672,
1037
+ "eval_accuracy-l2": 0.9741837509491268,
1038
+ "eval_f1": 0.9609921082299888,
1039
+ "eval_f1-all": 0.9517984563856124,
1040
+ "eval_f1-das": 0.9652480951496005,
1041
+ "eval_f1-l1": 0.9506237006237006,
1042
+ "eval_f1-l1l2": 0.9588685235964786,
1043
+ "eval_f1-l2": 0.9532957933090427,
1044
+ "eval_loss": 0.15711340308189392,
1045
+ "eval_precision": 0.9583989206206431,
1046
+ "eval_precision-all": 0.9445086705202312,
1047
+ "eval_precision-das": 0.9632789317507419,
1048
+ "eval_precision-l1": 0.9413278435409161,
1049
+ "eval_precision-l1l2": 0.9524082568807339,
1050
+ "eval_precision-l2": 0.948582729070534,
1051
+ "eval_recall": 0.9635993669455121,
1052
+ "eval_recall-all": 0.9592016436747872,
1053
+ "eval_recall-das": 0.9672253258845438,
1054
+ "eval_recall-l1": 0.9601049868766404,
1055
+ "eval_recall-l1l2": 0.9654170299331589,
1056
+ "eval_recall-l2": 0.9580559254327563,
1057
+ "eval_runtime": 6.9238,
1058
+ "eval_samples_per_second": 97.635,
1059
+ "eval_steps_per_second": 6.21,
1060
+ "step": 1000
1061
+ },
1062
+ {
1063
+ "epoch": 2.89,
1064
+ "eval_ACT": {
1065
+ "f1": 0.9284369114877589,
1066
+ "number": 519,
1067
+ "precision": 0.9079189686924494,
1068
+ "recall": 0.9499036608863198
1069
+ },
1070
+ "eval_ACT_L1": {
1071
+ "f1": 0.9557522123893806,
1072
+ "number": 503,
1073
+ "precision": 0.9455252918287937,
1074
+ "recall": 0.9662027833001988
1075
+ },
1076
+ "eval_ACT_L2": {
1077
+ "f1": 0.3111111111111111,
1078
+ "number": 16,
1079
+ "precision": 0.2413793103448276,
1080
+ "recall": 0.4375
1081
+ },
1082
+ "eval_CARDINAL": {
1083
+ "f1": 0.9904341427520236,
1084
+ "number": 678,
1085
+ "precision": 0.9882525697503671,
1086
+ "recall": 0.9926253687315634
1087
+ },
1088
+ "eval_DESC": {
1089
+ "f1": 0.3611111111111111,
1090
+ "number": 30,
1091
+ "precision": 0.30952380952380953,
1092
+ "recall": 0.43333333333333335
1093
+ },
1094
+ "eval_FT": {
1095
+ "f1": 0.0,
1096
+ "number": 7,
1097
+ "precision": 0.0,
1098
+ "recall": 0.0
1099
+ },
1100
+ "eval_LOC": {
1101
+ "f1": 0.9468911917098446,
1102
+ "number": 762,
1103
+ "precision": 0.9347826086956522,
1104
+ "recall": 0.9593175853018373
1105
+ },
1106
+ "eval_PER": {
1107
+ "f1": 0.9749262536873157,
1108
+ "number": 676,
1109
+ "precision": 0.9720588235294118,
1110
+ "recall": 0.977810650887574
1111
+ },
1112
+ "eval_SPAT": {
1113
+ "f1": 0.9549033643521831,
1114
+ "number": 694,
1115
+ "precision": 0.9487908961593172,
1116
+ "recall": 0.9610951008645533
1117
+ },
1118
+ "eval_TITRE": {
1119
+ "f1": 0.0,
1120
+ "number": 2,
1121
+ "precision": 0.0,
1122
+ "recall": 0.0
1123
+ },
1124
+ "eval_TITREH": {
1125
+ "f1": 0.8181818181818182,
1126
+ "number": 33,
1127
+ "precision": 0.8181818181818182,
1128
+ "recall": 0.8181818181818182
1129
+ },
1130
+ "eval_TITREP": {
1131
+ "f1": 0.15384615384615383,
1132
+ "number": 6,
1133
+ "precision": 0.14285714285714285,
1134
+ "recall": 0.16666666666666666
1135
+ },
1136
+ "eval_accuracy": 0.95292331055429,
1137
+ "eval_accuracy-all": 0.9657048848392812,
1138
+ "eval_accuracy-das": 0.9725385978233358,
1139
+ "eval_accuracy-l1": 0.9620349278663629,
1140
+ "eval_accuracy-l1l2": 0.9538091622374083,
1141
+ "eval_accuracy-l2": 0.9693748418121995,
1142
+ "eval_f1": 0.956971126839681,
1143
+ "eval_f1-all": 0.9494186046511628,
1144
+ "eval_f1-das": 0.9590664937951473,
1145
+ "eval_f1-l1": 0.9505723204994797,
1146
+ "eval_f1-l1l2": 0.9534348950847945,
1147
+ "eval_f1-l2": 0.947957839262187,
1148
+ "eval_loss": 0.16421228647232056,
1149
+ "eval_precision": 0.9510942384993301,
1150
+ "eval_precision-all": 0.9403973509933775,
1151
+ "eval_precision-das": 0.9539425202652911,
1152
+ "eval_precision-l1": 0.9422382671480144,
1153
+ "eval_precision-l1l2": 0.9431333522888826,
1154
+ "eval_precision-l2": 0.9380704041720991,
1155
+ "eval_recall": 0.9629210942799005,
1156
+ "eval_recall-all": 0.9586146169650719,
1157
+ "eval_recall-das": 0.964245810055866,
1158
+ "eval_recall-l1": 0.9590551181102362,
1159
+ "eval_recall-l1l2": 0.963963963963964,
1160
+ "eval_recall-l2": 0.9580559254327563,
1161
+ "eval_runtime": 6.9342,
1162
+ "eval_samples_per_second": 97.488,
1163
+ "eval_steps_per_second": 6.201,
1164
+ "step": 1100
1165
+ },
1166
+ {
1167
+ "epoch": 3.15,
1168
+ "eval_ACT": {
1169
+ "f1": 0.9303201506591338,
1170
+ "number": 519,
1171
+ "precision": 0.9097605893186004,
1172
+ "recall": 0.9518304431599229
1173
+ },
1174
+ "eval_ACT_L1": {
1175
+ "f1": 0.9560975609756097,
1176
+ "number": 503,
1177
+ "precision": 0.9386973180076629,
1178
+ "recall": 0.974155069582505
1179
+ },
1180
+ "eval_ACT_L2": {
1181
+ "f1": 0.2162162162162162,
1182
+ "number": 16,
1183
+ "precision": 0.19047619047619047,
1184
+ "recall": 0.25
1185
+ },
1186
+ "eval_CARDINAL": {
1187
+ "f1": 0.9831006612784717,
1188
+ "number": 678,
1189
+ "precision": 0.9795021961932651,
1190
+ "recall": 0.9867256637168141
1191
+ },
1192
+ "eval_DESC": {
1193
+ "f1": 0.4411764705882353,
1194
+ "number": 30,
1195
+ "precision": 0.39473684210526316,
1196
+ "recall": 0.5
1197
+ },
1198
+ "eval_FT": {
1199
+ "f1": 0.25,
1200
+ "number": 7,
1201
+ "precision": 1.0,
1202
+ "recall": 0.14285714285714285
1203
+ },
1204
+ "eval_LOC": {
1205
+ "f1": 0.9536855838225701,
1206
+ "number": 762,
1207
+ "precision": 0.9481193255512321,
1208
+ "recall": 0.9593175853018373
1209
+ },
1210
+ "eval_PER": {
1211
+ "f1": 0.9741697416974169,
1212
+ "number": 676,
1213
+ "precision": 0.9720176730486009,
1214
+ "recall": 0.9763313609467456
1215
+ },
1216
+ "eval_SPAT": {
1217
+ "f1": 0.9577060931899642,
1218
+ "number": 694,
1219
+ "precision": 0.9529243937232525,
1220
+ "recall": 0.962536023054755
1221
+ },
1222
+ "eval_TITRE": {
1223
+ "f1": 0.0,
1224
+ "number": 2,
1225
+ "precision": 0.0,
1226
+ "recall": 0.0
1227
+ },
1228
+ "eval_TITREH": {
1229
+ "f1": 0.7941176470588236,
1230
+ "number": 33,
1231
+ "precision": 0.7714285714285715,
1232
+ "recall": 0.8181818181818182
1233
+ },
1234
+ "eval_TITREP": {
1235
+ "f1": 0.25,
1236
+ "number": 6,
1237
+ "precision": 0.5,
1238
+ "recall": 0.16666666666666666
1239
+ },
1240
+ "eval_accuracy": 0.9535560617565173,
1241
+ "eval_accuracy-all": 0.9642495570741585,
1242
+ "eval_accuracy-das": 0.975069602632245,
1243
+ "eval_accuracy-l1": 0.960642875221463,
1244
+ "eval_accuracy-l1l2": 0.9536826119969628,
1245
+ "eval_accuracy-l2": 0.9678562389268539,
1246
+ "eval_f1": 0.9631715283252619,
1247
+ "eval_f1-all": 0.9521865889212828,
1248
+ "eval_f1-das": 0.9622886866059818,
1249
+ "eval_f1-l1": 0.953446033810143,
1250
+ "eval_f1-l1l2": 0.9576405956339453,
1251
+ "eval_f1-l2": 0.9505804311774461,
1252
+ "eval_loss": 0.1735592782497406,
1253
+ "eval_precision": 0.9596050269299821,
1254
+ "eval_precision-all": 0.9458441934549667,
1255
+ "eval_precision-das": 0.9599703484062269,
1256
+ "eval_precision-l1": 0.9448453608247422,
1257
+ "eval_precision-l1l2": 0.952819332566168,
1258
+ "eval_precision-l2": 0.9471249173826835,
1259
+ "eval_recall": 0.9667646393850328,
1260
+ "eval_recall-all": 0.9586146169650719,
1261
+ "eval_recall-das": 0.9646182495344506,
1262
+ "eval_recall-l1": 0.9622047244094488,
1263
+ "eval_recall-l1l2": 0.962510897994769,
1264
+ "eval_recall-l2": 0.9540612516644474,
1265
+ "eval_runtime": 6.7491,
1266
+ "eval_samples_per_second": 100.161,
1267
+ "eval_steps_per_second": 6.371,
1268
+ "step": 1200
1269
+ },
1270
+ {
1271
+ "epoch": 3.41,
1272
+ "eval_ACT": {
1273
+ "f1": 0.9385052034058656,
1274
+ "number": 519,
1275
+ "precision": 0.9219330855018587,
1276
+ "recall": 0.9556840077071291
1277
+ },
1278
+ "eval_ACT_L1": {
1279
+ "f1": 0.9571150097465887,
1280
+ "number": 503,
1281
+ "precision": 0.9388145315487572,
1282
+ "recall": 0.9761431411530815
1283
+ },
1284
+ "eval_ACT_L2": {
1285
+ "f1": 0.3225806451612903,
1286
+ "number": 16,
1287
+ "precision": 0.3333333333333333,
1288
+ "recall": 0.3125
1289
+ },
1290
+ "eval_CARDINAL": {
1291
+ "f1": 0.9831254585473221,
1292
+ "number": 678,
1293
+ "precision": 0.9781021897810219,
1294
+ "recall": 0.9882005899705014
1295
+ },
1296
+ "eval_DESC": {
1297
+ "f1": 0.4444444444444445,
1298
+ "number": 30,
1299
+ "precision": 0.42424242424242425,
1300
+ "recall": 0.4666666666666667
1301
+ },
1302
+ "eval_FT": {
1303
+ "f1": 0.16666666666666666,
1304
+ "number": 7,
1305
+ "precision": 0.2,
1306
+ "recall": 0.14285714285714285
1307
+ },
1308
+ "eval_LOC": {
1309
+ "f1": 0.9461388708630759,
1310
+ "number": 762,
1311
+ "precision": 0.9358151476251605,
1312
+ "recall": 0.9566929133858267
1313
+ },
1314
+ "eval_PER": {
1315
+ "f1": 0.9748520710059172,
1316
+ "number": 676,
1317
+ "precision": 0.9748520710059172,
1318
+ "recall": 0.9748520710059172
1319
+ },
1320
+ "eval_SPAT": {
1321
+ "f1": 0.9513590844062948,
1322
+ "number": 694,
1323
+ "precision": 0.9446022727272727,
1324
+ "recall": 0.9582132564841499
1325
+ },
1326
+ "eval_TITRE": {
1327
+ "f1": 0.0,
1328
+ "number": 2,
1329
+ "precision": 0.0,
1330
+ "recall": 0.0
1331
+ },
1332
+ "eval_TITREH": {
1333
+ "f1": 0.8059701492537314,
1334
+ "number": 33,
1335
+ "precision": 0.7941176470588235,
1336
+ "recall": 0.8181818181818182
1337
+ },
1338
+ "eval_TITREP": {
1339
+ "f1": 0.28571428571428575,
1340
+ "number": 6,
1341
+ "precision": 0.25,
1342
+ "recall": 0.3333333333333333
1343
+ },
1344
+ "eval_accuracy": 0.958997722095672,
1345
+ "eval_accuracy-all": 0.9700708681346495,
1346
+ "eval_accuracy-das": 0.9730447987851177,
1347
+ "eval_accuracy-l1": 0.9678562389268539,
1348
+ "eval_accuracy-l1l2": 0.9596304732978993,
1349
+ "eval_accuracy-l2": 0.972285497342445,
1350
+ "eval_f1": 0.9589010246593853,
1351
+ "eval_f1-all": 0.9500655117193187,
1352
+ "eval_f1-das": 0.959614672100778,
1353
+ "eval_f1-l1": 0.952356157250716,
1354
+ "eval_f1-l1l2": 0.953810623556582,
1355
+ "eval_f1-l2": 0.9471598414795245,
1356
+ "eval_loss": 0.17504489421844482,
1357
+ "eval_precision": 0.9551368326603858,
1358
+ "eval_precision-all": 0.9425187752744079,
1359
+ "eval_precision-das": 0.9546627349797272,
1360
+ "eval_precision-l1": 0.9447314049586777,
1361
+ "eval_precision-l1l2": 0.9475193576139949,
1362
+ "eval_precision-l2": 0.9397116644823067,
1363
+ "eval_recall": 0.9626950033913634,
1364
+ "eval_recall-all": 0.9577340769004989,
1365
+ "eval_recall-das": 0.9646182495344506,
1366
+ "eval_recall-l1": 0.9601049868766404,
1367
+ "eval_recall-l1l2": 0.960185992444057,
1368
+ "eval_recall-l2": 0.9547270306258322,
1369
+ "eval_runtime": 6.7727,
1370
+ "eval_samples_per_second": 99.813,
1371
+ "eval_steps_per_second": 6.349,
1372
+ "step": 1300
1373
+ },
1374
+ {
1375
+ "epoch": 3.67,
1376
+ "eval_ACT": {
1377
+ "f1": 0.9466666666666668,
1378
+ "number": 519,
1379
+ "precision": 0.935969868173258,
1380
+ "recall": 0.9576107899807321
1381
+ },
1382
+ "eval_ACT_L1": {
1383
+ "f1": 0.970414201183432,
1384
+ "number": 503,
1385
+ "precision": 0.9628180039138943,
1386
+ "recall": 0.9781312127236581
1387
+ },
1388
+ "eval_ACT_L2": {
1389
+ "f1": 0.2777777777777778,
1390
+ "number": 16,
1391
+ "precision": 0.25,
1392
+ "recall": 0.3125
1393
+ },
1394
+ "eval_CARDINAL": {
1395
+ "f1": 0.9874723655121592,
1396
+ "number": 678,
1397
+ "precision": 0.9867452135493373,
1398
+ "recall": 0.9882005899705014
1399
+ },
1400
+ "eval_DESC": {
1401
+ "f1": 0.5396825396825397,
1402
+ "number": 30,
1403
+ "precision": 0.5151515151515151,
1404
+ "recall": 0.5666666666666667
1405
+ },
1406
+ "eval_FT": {
1407
+ "f1": 0.15384615384615383,
1408
+ "number": 7,
1409
+ "precision": 0.16666666666666666,
1410
+ "recall": 0.14285714285714285
1411
+ },
1412
+ "eval_LOC": {
1413
+ "f1": 0.9500324464633355,
1414
+ "number": 762,
1415
+ "precision": 0.9396662387676509,
1416
+ "recall": 0.9606299212598425
1417
+ },
1418
+ "eval_PER": {
1419
+ "f1": 0.9771554900515844,
1420
+ "number": 676,
1421
+ "precision": 0.973568281938326,
1422
+ "recall": 0.9807692307692307
1423
+ },
1424
+ "eval_SPAT": {
1425
+ "f1": 0.9606299212598425,
1426
+ "number": 694,
1427
+ "precision": 0.9544807965860598,
1428
+ "recall": 0.9668587896253602
1429
+ },
1430
+ "eval_TITRE": {
1431
+ "f1": 0.0,
1432
+ "number": 2,
1433
+ "precision": 0.0,
1434
+ "recall": 0.0
1435
+ },
1436
+ "eval_TITREH": {
1437
+ "f1": 0.8285714285714285,
1438
+ "number": 33,
1439
+ "precision": 0.7837837837837838,
1440
+ "recall": 0.8787878787878788
1441
+ },
1442
+ "eval_TITREP": {
1443
+ "f1": 0.26666666666666666,
1444
+ "number": 6,
1445
+ "precision": 0.2222222222222222,
1446
+ "recall": 0.3333333333333333
1447
+ },
1448
+ "eval_accuracy": 0.9569729182485447,
1449
+ "eval_accuracy-all": 0.9686155403695267,
1450
+ "eval_accuracy-das": 0.973424449506454,
1451
+ "eval_accuracy-l1": 0.9667172867628449,
1452
+ "eval_accuracy-l1l2": 0.9578587699316629,
1453
+ "eval_accuracy-l2": 0.9705137939762085,
1454
+ "eval_f1": 0.96063877642825,
1455
+ "eval_f1-all": 0.9561544064093226,
1456
+ "eval_f1-das": 0.9627846695056471,
1457
+ "eval_f1-l1": 0.9616488390294807,
1458
+ "eval_f1-l1l2": 0.9576612903225806,
1459
+ "eval_f1-l2": 0.9492084432717678,
1460
+ "eval_loss": 0.18832801282405853,
1461
+ "eval_precision": 0.9556947863056612,
1462
+ "eval_precision-all": 0.9491035280508965,
1463
+ "eval_precision-das": 0.9572901325478645,
1464
+ "eval_precision-l1": 0.9559128630705395,
1465
+ "eval_precision-l1l2": 0.9491864116471596,
1466
+ "eval_precision-l2": 0.9405228758169935,
1467
+ "eval_recall": 0.9656341849423469,
1468
+ "eval_recall-all": 0.9633108306427942,
1469
+ "eval_recall-das": 0.9683426443202979,
1470
+ "eval_recall-l1": 0.9674540682414698,
1471
+ "eval_recall-l1l2": 0.966288869514676,
1472
+ "eval_recall-l2": 0.9580559254327563,
1473
+ "eval_runtime": 6.9287,
1474
+ "eval_samples_per_second": 97.565,
1475
+ "eval_steps_per_second": 6.206,
1476
+ "step": 1400
1477
+ },
1478
+ {
1479
+ "epoch": 3.94,
1480
+ "learning_rate": 7e-05,
1481
+ "loss": 0.1156,
1482
+ "step": 1500
1483
+ },
1484
+ {
1485
+ "epoch": 3.94,
1486
+ "eval_ACT": {
1487
+ "f1": 0.9324452901998097,
1488
+ "number": 519,
1489
+ "precision": 0.9210526315789473,
1490
+ "recall": 0.9441233140655106
1491
+ },
1492
+ "eval_ACT_L1": {
1493
+ "f1": 0.9452054794520548,
1494
+ "number": 503,
1495
+ "precision": 0.930635838150289,
1496
+ "recall": 0.9602385685884692
1497
+ },
1498
+ "eval_ACT_L2": {
1499
+ "f1": 0.4827586206896552,
1500
+ "number": 16,
1501
+ "precision": 0.5384615384615384,
1502
+ "recall": 0.4375
1503
+ },
1504
+ "eval_CARDINAL": {
1505
+ "f1": 0.9882179675994109,
1506
+ "number": 678,
1507
+ "precision": 0.986764705882353,
1508
+ "recall": 0.9896755162241888
1509
+ },
1510
+ "eval_DESC": {
1511
+ "f1": 0.39393939393939387,
1512
+ "number": 30,
1513
+ "precision": 0.3611111111111111,
1514
+ "recall": 0.43333333333333335
1515
+ },
1516
+ "eval_FT": {
1517
+ "f1": 0.16666666666666666,
1518
+ "number": 7,
1519
+ "precision": 0.2,
1520
+ "recall": 0.14285714285714285
1521
+ },
1522
+ "eval_LOC": {
1523
+ "f1": 0.9561805101373447,
1524
+ "number": 762,
1525
+ "precision": 0.9530638852672751,
1526
+ "recall": 0.9593175853018373
1527
+ },
1528
+ "eval_PER": {
1529
+ "f1": 0.9800443458980044,
1530
+ "number": 676,
1531
+ "precision": 0.9793205317577548,
1532
+ "recall": 0.9807692307692307
1533
+ },
1534
+ "eval_SPAT": {
1535
+ "f1": 0.9633883704235463,
1536
+ "number": 694,
1537
+ "precision": 0.9599427753934192,
1538
+ "recall": 0.9668587896253602
1539
+ },
1540
+ "eval_TITRE": {
1541
+ "f1": 0.0,
1542
+ "number": 2,
1543
+ "precision": 0.0,
1544
+ "recall": 0.0
1545
+ },
1546
+ "eval_TITREH": {
1547
+ "f1": 0.8615384615384615,
1548
+ "number": 33,
1549
+ "precision": 0.875,
1550
+ "recall": 0.8484848484848485
1551
+ },
1552
+ "eval_TITREP": {
1553
+ "f1": 0.3333333333333333,
1554
+ "number": 6,
1555
+ "precision": 0.3333333333333333,
1556
+ "recall": 0.3333333333333333
1557
+ },
1558
+ "eval_accuracy": 0.961781827385472,
1559
+ "eval_accuracy-all": 0.9729182485446722,
1560
+ "eval_accuracy-das": 0.973424449506454,
1561
+ "eval_accuracy-l1": 0.9698810427739812,
1562
+ "eval_accuracy-l1l2": 0.9626676790685902,
1563
+ "eval_accuracy-l2": 0.9759554543153632,
1564
+ "eval_f1": 0.9647298213881981,
1565
+ "eval_f1-all": 0.9560005847098376,
1566
+ "eval_f1-das": 0.9639405204460967,
1567
+ "eval_f1-l1": 0.9541188738269031,
1568
+ "eval_f1-l1l2": 0.960046323103648,
1569
+ "eval_f1-l2": 0.9584026622296173,
1570
+ "eval_loss": 0.169138103723526,
1571
+ "eval_precision": 0.9647298213881981,
1572
+ "eval_precision-all": 0.9522422830518346,
1573
+ "eval_precision-das": 0.9621521335807051,
1574
+ "eval_precision-l1": 0.9476954945624029,
1575
+ "eval_precision-l1l2": 0.9564464955292761,
1576
+ "eval_precision-l2": 0.9580838323353293,
1577
+ "eval_recall": 0.9647298213881981,
1578
+ "eval_recall-all": 0.9597886703845024,
1579
+ "eval_recall-das": 0.9657355679702049,
1580
+ "eval_recall-l1": 0.9606299212598425,
1581
+ "eval_recall-l1l2": 0.963673350770125,
1582
+ "eval_recall-l2": 0.9587217043941412,
1583
+ "eval_runtime": 7.001,
1584
+ "eval_samples_per_second": 96.558,
1585
+ "eval_steps_per_second": 6.142,
1586
+ "step": 1500
1587
+ },
1588
+ {
1589
+ "epoch": 4.2,
1590
+ "eval_ACT": {
1591
+ "f1": 0.9484732824427481,
1592
+ "number": 519,
1593
+ "precision": 0.9395085066162571,
1594
+ "recall": 0.9576107899807321
1595
+ },
1596
+ "eval_ACT_L1": {
1597
+ "f1": 0.9619512195121951,
1598
+ "number": 503,
1599
+ "precision": 0.9444444444444444,
1600
+ "recall": 0.9801192842942346
1601
+ },
1602
+ "eval_ACT_L2": {
1603
+ "f1": 0.34782608695652173,
1604
+ "number": 16,
1605
+ "precision": 0.5714285714285714,
1606
+ "recall": 0.25
1607
+ },
1608
+ "eval_CARDINAL": {
1609
+ "f1": 0.9867256637168141,
1610
+ "number": 678,
1611
+ "precision": 0.9867256637168141,
1612
+ "recall": 0.9867256637168141
1613
+ },
1614
+ "eval_DESC": {
1615
+ "f1": 0.5263157894736842,
1616
+ "number": 30,
1617
+ "precision": 0.5555555555555556,
1618
+ "recall": 0.5
1619
+ },
1620
+ "eval_FT": {
1621
+ "f1": 0.2,
1622
+ "number": 7,
1623
+ "precision": 0.3333333333333333,
1624
+ "recall": 0.14285714285714285
1625
+ },
1626
+ "eval_LOC": {
1627
+ "f1": 0.9601567602873938,
1628
+ "number": 762,
1629
+ "precision": 0.9557867360208062,
1630
+ "recall": 0.9645669291338582
1631
+ },
1632
+ "eval_PER": {
1633
+ "f1": 0.9778434268833086,
1634
+ "number": 676,
1635
+ "precision": 0.976401179941003,
1636
+ "recall": 0.9792899408284024
1637
+ },
1638
+ "eval_SPAT": {
1639
+ "f1": 0.9597701149425288,
1640
+ "number": 694,
1641
+ "precision": 0.9570200573065902,
1642
+ "recall": 0.962536023054755
1643
+ },
1644
+ "eval_TITRE": {
1645
+ "f1": 0.0,
1646
+ "number": 2,
1647
+ "precision": 0.0,
1648
+ "recall": 0.0
1649
+ },
1650
+ "eval_TITREH": {
1651
+ "f1": 0.8571428571428572,
1652
+ "number": 33,
1653
+ "precision": 0.9,
1654
+ "recall": 0.8181818181818182
1655
+ },
1656
+ "eval_TITREP": {
1657
+ "f1": 0.30769230769230765,
1658
+ "number": 6,
1659
+ "precision": 0.2857142857142857,
1660
+ "recall": 0.3333333333333333
1661
+ },
1662
+ "eval_accuracy": 0.9630473297899266,
1663
+ "eval_accuracy-all": 0.9731713490255631,
1664
+ "eval_accuracy-das": 0.976461655277145,
1665
+ "eval_accuracy-l1": 0.9705137939762085,
1666
+ "eval_accuracy-l1l2": 0.9635535307517085,
1667
+ "eval_accuracy-l2": 0.9758289040749177,
1668
+ "eval_f1": 0.9663580943779635,
1669
+ "eval_f1-all": 0.9598593612657487,
1670
+ "eval_f1-das": 0.9657992565055762,
1671
+ "eval_f1-l1": 0.9597911227154047,
1672
+ "eval_f1-l1l2": 0.9638973466724663,
1673
+ "eval_f1-l2": 0.9599465954606141,
1674
+ "eval_loss": 0.17647188901901245,
1675
+ "eval_precision": 0.9650507328072153,
1676
+ "eval_precision-all": 0.9581749049429658,
1677
+ "eval_precision-das": 0.9640074211502783,
1678
+ "eval_precision-l1": 0.9548051948051948,
1679
+ "eval_precision-l1l2": 0.9618055555555556,
1680
+ "eval_precision-l2": 0.9625167336010709,
1681
+ "eval_recall": 0.9676690029391816,
1682
+ "eval_recall-all": 0.9615497505136483,
1683
+ "eval_recall-das": 0.9675977653631285,
1684
+ "eval_recall-l1": 0.9648293963254593,
1685
+ "eval_recall-l1l2": 0.9659982563208369,
1686
+ "eval_recall-l2": 0.9573901464713716,
1687
+ "eval_runtime": 6.873,
1688
+ "eval_samples_per_second": 98.356,
1689
+ "eval_steps_per_second": 6.256,
1690
+ "step": 1600
1691
+ }
1692
+ ],
1693
+ "max_steps": 5000,
1694
+ "num_train_epochs": 14,
1695
+ "total_flos": 651216540910320.0,
1696
+ "trial_name": null,
1697
+ "trial_params": null
1698
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:faab69dc4a6e7da77af20ba5e7a5083a3bab77b2015e853e2bbd5cb839ae498b
3
+ size 3503