tieandrews commited on
Commit
f4165ec
·
1 Parent(s): 47d82aa

Update Roberta v6 Model as Outlined in Final Report (#3)

Browse files

- Update Roberta v6 Model as Outlined in Final Report (92c53b230b8240d37dfed955e7c444daab1e53b2)

all_results.json ADDED
@@ -0,0 +1,53 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 14.72,
3
+ "eval_AGE_f1": 0.7025495750708216,
4
+ "eval_AGE_number": 159,
5
+ "eval_AGE_precision": 0.6391752577319587,
6
+ "eval_AGE_recall": 0.779874213836478,
7
+ "eval_ALTI_f1": 0.3225806451612903,
8
+ "eval_ALTI_number": 16,
9
+ "eval_ALTI_precision": 0.3333333333333333,
10
+ "eval_ALTI_recall": 0.3125,
11
+ "eval_EMAIL_f1": 0.7819548872180451,
12
+ "eval_EMAIL_number": 52,
13
+ "eval_EMAIL_precision": 0.6419753086419753,
14
+ "eval_EMAIL_recall": 1.0,
15
+ "eval_GEOG_f1": 0.4,
16
+ "eval_GEOG_number": 9,
17
+ "eval_GEOG_precision": 0.2857142857142857,
18
+ "eval_GEOG_recall": 0.6666666666666666,
19
+ "eval_REGION_f1": 0.5511811023622047,
20
+ "eval_REGION_number": 351,
21
+ "eval_REGION_precision": 0.45539033457249073,
22
+ "eval_REGION_recall": 0.698005698005698,
23
+ "eval_SITE_f1": 0.4936530324400564,
24
+ "eval_SITE_number": 330,
25
+ "eval_SITE_precision": 0.46174142480211083,
26
+ "eval_SITE_recall": 0.5303030303030303,
27
+ "eval_TAXA_f1": 0.8047445255474452,
28
+ "eval_TAXA_number": 525,
29
+ "eval_TAXA_precision": 0.7723292469352014,
30
+ "eval_TAXA_recall": 0.84,
31
+ "eval_accuracy_entity": 0.9571207347679821,
32
+ "eval_accuracy_token": 0.9571207347679821,
33
+ "eval_f1_entity": 0.7682700421940929,
34
+ "eval_f1_token": 0.7682700421940929,
35
+ "eval_loss": 0.154266357421875,
36
+ "eval_overall_accuracy": 0.9559993592139692,
37
+ "eval_overall_f1": 0.646713977167541,
38
+ "eval_overall_precision": 0.5825458588104503,
39
+ "eval_overall_recall": 0.7267683772538142,
40
+ "eval_precision_entity": 0.7118060985144644,
41
+ "eval_precision_token": 0.7118060985144644,
42
+ "eval_recall_entity": 0.8344637946837764,
43
+ "eval_recall_token": 0.8344637946837764,
44
+ "eval_runtime": 10.2775,
45
+ "eval_samples": 189,
46
+ "eval_samples_per_second": 18.39,
47
+ "eval_steps_per_second": 2.335,
48
+ "train_loss": 0.23708797097206116,
49
+ "train_runtime": 1988.5186,
50
+ "train_samples": 1269,
51
+ "train_samples_per_second": 9.572,
52
+ "train_steps_per_second": 0.294
53
+ }
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "/content/drive/MyDrive/Colab Notebooks/ffossils/roberta-finetune-v3/models/",
3
  "architectures": [
4
  "RobertaForTokenClassification"
5
  ],
@@ -53,7 +53,7 @@
53
  "pad_token_id": 1,
54
  "position_embedding_type": "absolute",
55
  "torch_dtype": "float32",
56
- "transformers_version": "4.29.2",
57
  "type_vocab_size": 1,
58
  "use_cache": true,
59
  "vocab_size": 50265
 
1
  {
2
+ "_name_or_path": "roberta-base",
3
  "architectures": [
4
  "RobertaForTokenClassification"
5
  ],
 
53
  "pad_token_id": 1,
54
  "position_embedding_type": "absolute",
55
  "torch_dtype": "float32",
56
+ "transformers_version": "4.30.2",
57
  "type_vocab_size": 1,
58
  "use_cache": true,
59
  "vocab_size": 50265
eval_results.json ADDED
@@ -0,0 +1,48 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 14.72,
3
+ "eval_AGE_f1": 0.7025495750708216,
4
+ "eval_AGE_number": 159,
5
+ "eval_AGE_precision": 0.6391752577319587,
6
+ "eval_AGE_recall": 0.779874213836478,
7
+ "eval_ALTI_f1": 0.3225806451612903,
8
+ "eval_ALTI_number": 16,
9
+ "eval_ALTI_precision": 0.3333333333333333,
10
+ "eval_ALTI_recall": 0.3125,
11
+ "eval_EMAIL_f1": 0.7819548872180451,
12
+ "eval_EMAIL_number": 52,
13
+ "eval_EMAIL_precision": 0.6419753086419753,
14
+ "eval_EMAIL_recall": 1.0,
15
+ "eval_GEOG_f1": 0.4,
16
+ "eval_GEOG_number": 9,
17
+ "eval_GEOG_precision": 0.2857142857142857,
18
+ "eval_GEOG_recall": 0.6666666666666666,
19
+ "eval_REGION_f1": 0.5511811023622047,
20
+ "eval_REGION_number": 351,
21
+ "eval_REGION_precision": 0.45539033457249073,
22
+ "eval_REGION_recall": 0.698005698005698,
23
+ "eval_SITE_f1": 0.4936530324400564,
24
+ "eval_SITE_number": 330,
25
+ "eval_SITE_precision": 0.46174142480211083,
26
+ "eval_SITE_recall": 0.5303030303030303,
27
+ "eval_TAXA_f1": 0.8047445255474452,
28
+ "eval_TAXA_number": 525,
29
+ "eval_TAXA_precision": 0.7723292469352014,
30
+ "eval_TAXA_recall": 0.84,
31
+ "eval_accuracy_entity": 0.9571207347679821,
32
+ "eval_accuracy_token": 0.9571207347679821,
33
+ "eval_f1_entity": 0.7682700421940929,
34
+ "eval_f1_token": 0.7682700421940929,
35
+ "eval_loss": 0.154266357421875,
36
+ "eval_overall_accuracy": 0.9559993592139692,
37
+ "eval_overall_f1": 0.646713977167541,
38
+ "eval_overall_precision": 0.5825458588104503,
39
+ "eval_overall_recall": 0.7267683772538142,
40
+ "eval_precision_entity": 0.7118060985144644,
41
+ "eval_precision_token": 0.7118060985144644,
42
+ "eval_recall_entity": 0.8344637946837764,
43
+ "eval_recall_token": 0.8344637946837764,
44
+ "eval_runtime": 10.2775,
45
+ "eval_samples": 189,
46
+ "eval_samples_per_second": 18.39,
47
+ "eval_steps_per_second": 2.335
48
+ }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c4f40c00bc3c9f9fd0866974d99d9726182a68afb3a6aee234f75e7091d33b9f
3
- size 496333165
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:58e6d0c505cadb3389a805ec9b08e579725be60ea75b3f73f899f289832fb437
3
+ size 496335917
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 14.72,
3
+ "train_loss": 0.23708797097206116,
4
+ "train_runtime": 1988.5186,
5
+ "train_samples": 1269,
6
+ "train_samples_per_second": 9.572,
7
+ "train_steps_per_second": 0.294
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,1477 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.646713977167541,
3
+ "best_model_checkpoint": "/content/drive/MyDrive/Colab Notebooks/ffossils/roberta-finetuned-v6/models/checkpoint-400",
4
+ "epoch": 14.716981132075471,
5
+ "global_step": 585,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.25,
12
+ "learning_rate": 2.0000000000000003e-06,
13
+ "loss": 2.785,
14
+ "step": 10
15
+ },
16
+ {
17
+ "epoch": 0.5,
18
+ "learning_rate": 4.000000000000001e-06,
19
+ "loss": 2.592,
20
+ "step": 20
21
+ },
22
+ {
23
+ "epoch": 0.63,
24
+ "eval_AGE_f1": 0.0,
25
+ "eval_AGE_number": 159,
26
+ "eval_AGE_precision": 0.0,
27
+ "eval_AGE_recall": 0.0,
28
+ "eval_ALTI_f1": 0.0,
29
+ "eval_ALTI_number": 16,
30
+ "eval_ALTI_precision": 0.0,
31
+ "eval_ALTI_recall": 0.0,
32
+ "eval_EMAIL_f1": 0.013565891472868219,
33
+ "eval_EMAIL_number": 52,
34
+ "eval_EMAIL_precision": 0.006958250497017893,
35
+ "eval_EMAIL_recall": 0.2692307692307692,
36
+ "eval_GEOG_f1": 0.0,
37
+ "eval_GEOG_number": 9,
38
+ "eval_GEOG_precision": 0.0,
39
+ "eval_GEOG_recall": 0.0,
40
+ "eval_REGION_f1": 0.0,
41
+ "eval_REGION_number": 351,
42
+ "eval_REGION_precision": 0.0,
43
+ "eval_REGION_recall": 0.0,
44
+ "eval_SITE_f1": 0.0,
45
+ "eval_SITE_number": 330,
46
+ "eval_SITE_precision": 0.0,
47
+ "eval_SITE_recall": 0.0,
48
+ "eval_TAXA_f1": 0.0,
49
+ "eval_TAXA_number": 525,
50
+ "eval_TAXA_precision": 0.0,
51
+ "eval_TAXA_recall": 0.0,
52
+ "eval_accuracy_entity": 0.8152934266033001,
53
+ "eval_accuracy_token": 0.8152934266033001,
54
+ "eval_f1_entity": 0.022789506227365072,
55
+ "eval_f1_token": 0.022789506227365072,
56
+ "eval_loss": 2.0357258319854736,
57
+ "eval_overall_accuracy": 0.8141186522133818,
58
+ "eval_overall_f1": 0.004022988505747126,
59
+ "eval_overall_precision": 0.0025371511417180137,
60
+ "eval_overall_recall": 0.009708737864077669,
61
+ "eval_precision_entity": 0.02199113535629049,
62
+ "eval_precision_token": 0.02199113535629049,
63
+ "eval_recall_entity": 0.02364802933088909,
64
+ "eval_recall_token": 0.02364802933088909,
65
+ "eval_runtime": 10.2464,
66
+ "eval_samples_per_second": 18.446,
67
+ "eval_steps_per_second": 2.342,
68
+ "step": 25
69
+ },
70
+ {
71
+ "epoch": 0.75,
72
+ "learning_rate": 6e-06,
73
+ "loss": 1.9963,
74
+ "step": 30
75
+ },
76
+ {
77
+ "epoch": 1.01,
78
+ "learning_rate": 8.000000000000001e-06,
79
+ "loss": 0.8245,
80
+ "step": 40
81
+ },
82
+ {
83
+ "epoch": 1.26,
84
+ "learning_rate": 1e-05,
85
+ "loss": 0.5512,
86
+ "step": 50
87
+ },
88
+ {
89
+ "epoch": 1.26,
90
+ "eval_AGE_f1": 0.0,
91
+ "eval_AGE_number": 159,
92
+ "eval_AGE_precision": 0.0,
93
+ "eval_AGE_recall": 0.0,
94
+ "eval_ALTI_f1": 0.0,
95
+ "eval_ALTI_number": 16,
96
+ "eval_ALTI_precision": 0.0,
97
+ "eval_ALTI_recall": 0.0,
98
+ "eval_EMAIL_f1": 0.0,
99
+ "eval_EMAIL_number": 52,
100
+ "eval_EMAIL_precision": 0.0,
101
+ "eval_EMAIL_recall": 0.0,
102
+ "eval_GEOG_f1": 0.0,
103
+ "eval_GEOG_number": 9,
104
+ "eval_GEOG_precision": 0.0,
105
+ "eval_GEOG_recall": 0.0,
106
+ "eval_REGION_f1": 0.0,
107
+ "eval_REGION_number": 351,
108
+ "eval_REGION_precision": 0.0,
109
+ "eval_REGION_recall": 0.0,
110
+ "eval_SITE_f1": 0.0,
111
+ "eval_SITE_number": 330,
112
+ "eval_SITE_precision": 0.0,
113
+ "eval_SITE_recall": 0.0,
114
+ "eval_TAXA_f1": 0.0,
115
+ "eval_TAXA_number": 525,
116
+ "eval_TAXA_precision": 0.0,
117
+ "eval_TAXA_recall": 0.0,
118
+ "eval_accuracy_entity": 0.9028853171000872,
119
+ "eval_accuracy_token": 0.9028853171000872,
120
+ "eval_f1_entity": 0.0,
121
+ "eval_f1_token": 0.0,
122
+ "eval_loss": 0.4787032902240753,
123
+ "eval_overall_accuracy": 0.9028853171000872,
124
+ "eval_overall_f1": 0.0,
125
+ "eval_overall_precision": 0.0,
126
+ "eval_overall_recall": 0.0,
127
+ "eval_precision_entity": 0.0,
128
+ "eval_precision_token": 0.0,
129
+ "eval_recall_entity": 0.0,
130
+ "eval_recall_token": 0.0,
131
+ "eval_runtime": 10.1567,
132
+ "eval_samples_per_second": 18.608,
133
+ "eval_steps_per_second": 2.363,
134
+ "step": 50
135
+ },
136
+ {
137
+ "epoch": 1.51,
138
+ "learning_rate": 1.2e-05,
139
+ "loss": 0.4716,
140
+ "step": 60
141
+ },
142
+ {
143
+ "epoch": 1.76,
144
+ "learning_rate": 1.4e-05,
145
+ "loss": 0.3759,
146
+ "step": 70
147
+ },
148
+ {
149
+ "epoch": 1.89,
150
+ "eval_AGE_f1": 0.0,
151
+ "eval_AGE_number": 159,
152
+ "eval_AGE_precision": 0.0,
153
+ "eval_AGE_recall": 0.0,
154
+ "eval_ALTI_f1": 0.0,
155
+ "eval_ALTI_number": 16,
156
+ "eval_ALTI_precision": 0.0,
157
+ "eval_ALTI_recall": 0.0,
158
+ "eval_EMAIL_f1": 0.0,
159
+ "eval_EMAIL_number": 52,
160
+ "eval_EMAIL_precision": 0.0,
161
+ "eval_EMAIL_recall": 0.0,
162
+ "eval_GEOG_f1": 0.0,
163
+ "eval_GEOG_number": 9,
164
+ "eval_GEOG_precision": 0.0,
165
+ "eval_GEOG_recall": 0.0,
166
+ "eval_REGION_f1": 0.0,
167
+ "eval_REGION_number": 351,
168
+ "eval_REGION_precision": 0.0,
169
+ "eval_REGION_recall": 0.0,
170
+ "eval_SITE_f1": 0.0,
171
+ "eval_SITE_number": 330,
172
+ "eval_SITE_precision": 0.0,
173
+ "eval_SITE_recall": 0.0,
174
+ "eval_TAXA_f1": 0.4575645756457565,
175
+ "eval_TAXA_number": 525,
176
+ "eval_TAXA_precision": 0.44364937388193204,
177
+ "eval_TAXA_recall": 0.4723809523809524,
178
+ "eval_accuracy_entity": 0.9267723963617593,
179
+ "eval_accuracy_token": 0.9267723963617593,
180
+ "eval_f1_entity": 0.45445053510832684,
181
+ "eval_f1_token": 0.45445053510832684,
182
+ "eval_loss": 0.28952518105506897,
183
+ "eval_overall_accuracy": 0.9190651643794165,
184
+ "eval_overall_f1": 0.23732057416267943,
185
+ "eval_overall_precision": 0.38271604938271603,
186
+ "eval_overall_recall": 0.17198335644937587,
187
+ "eval_precision_entity": 0.7888536474852741,
188
+ "eval_precision_token": 0.7888536474852741,
189
+ "eval_recall_entity": 0.3191567369385884,
190
+ "eval_recall_token": 0.3191567369385884,
191
+ "eval_runtime": 10.7946,
192
+ "eval_samples_per_second": 17.509,
193
+ "eval_steps_per_second": 2.223,
194
+ "step": 75
195
+ },
196
+ {
197
+ "epoch": 2.01,
198
+ "learning_rate": 1.6000000000000003e-05,
199
+ "loss": 0.3221,
200
+ "step": 80
201
+ },
202
+ {
203
+ "epoch": 2.26,
204
+ "learning_rate": 1.8e-05,
205
+ "loss": 0.2555,
206
+ "step": 90
207
+ },
208
+ {
209
+ "epoch": 2.52,
210
+ "learning_rate": 2e-05,
211
+ "loss": 0.2161,
212
+ "step": 100
213
+ },
214
+ {
215
+ "epoch": 2.52,
216
+ "eval_AGE_f1": 0.36414565826330536,
217
+ "eval_AGE_number": 159,
218
+ "eval_AGE_precision": 0.3282828282828283,
219
+ "eval_AGE_recall": 0.4088050314465409,
220
+ "eval_ALTI_f1": 0.0,
221
+ "eval_ALTI_number": 16,
222
+ "eval_ALTI_precision": 0.0,
223
+ "eval_ALTI_recall": 0.0,
224
+ "eval_EMAIL_f1": 0.0,
225
+ "eval_EMAIL_number": 52,
226
+ "eval_EMAIL_precision": 0.0,
227
+ "eval_EMAIL_recall": 0.0,
228
+ "eval_GEOG_f1": 0.058823529411764705,
229
+ "eval_GEOG_number": 9,
230
+ "eval_GEOG_precision": 0.04,
231
+ "eval_GEOG_recall": 0.1111111111111111,
232
+ "eval_REGION_f1": 0.25806451612903225,
233
+ "eval_REGION_number": 351,
234
+ "eval_REGION_precision": 0.1907356948228883,
235
+ "eval_REGION_recall": 0.39886039886039887,
236
+ "eval_SITE_f1": 0.028925619834710745,
237
+ "eval_SITE_number": 330,
238
+ "eval_SITE_precision": 0.045454545454545456,
239
+ "eval_SITE_recall": 0.021212121212121213,
240
+ "eval_TAXA_f1": 0.6412859560067682,
241
+ "eval_TAXA_number": 525,
242
+ "eval_TAXA_precision": 0.5768645357686454,
243
+ "eval_TAXA_recall": 0.7219047619047619,
244
+ "eval_accuracy_entity": 0.943005642476994,
245
+ "eval_accuracy_token": 0.943005642476994,
246
+ "eval_f1_entity": 0.654824165915239,
247
+ "eval_f1_token": 0.654824165915239,
248
+ "eval_loss": 0.20675021409988403,
249
+ "eval_overall_accuracy": 0.9366867802281911,
250
+ "eval_overall_f1": 0.3688473520249221,
251
+ "eval_overall_precision": 0.334841628959276,
252
+ "eval_overall_recall": 0.4105409153952843,
253
+ "eval_precision_entity": 0.6443655723158829,
254
+ "eval_precision_token": 0.6443655723158829,
255
+ "eval_recall_entity": 0.6656278643446379,
256
+ "eval_recall_token": 0.6656278643446379,
257
+ "eval_runtime": 11.4868,
258
+ "eval_samples_per_second": 16.454,
259
+ "eval_steps_per_second": 2.089,
260
+ "step": 100
261
+ },
262
+ {
263
+ "epoch": 2.77,
264
+ "learning_rate": 1.9587628865979382e-05,
265
+ "loss": 0.1805,
266
+ "step": 110
267
+ },
268
+ {
269
+ "epoch": 3.02,
270
+ "learning_rate": 1.9175257731958766e-05,
271
+ "loss": 0.1729,
272
+ "step": 120
273
+ },
274
+ {
275
+ "epoch": 3.14,
276
+ "eval_AGE_f1": 0.47398843930635837,
277
+ "eval_AGE_number": 159,
278
+ "eval_AGE_precision": 0.4385026737967914,
279
+ "eval_AGE_recall": 0.5157232704402516,
280
+ "eval_ALTI_f1": 0.0,
281
+ "eval_ALTI_number": 16,
282
+ "eval_ALTI_precision": 0.0,
283
+ "eval_ALTI_recall": 0.0,
284
+ "eval_EMAIL_f1": 0.0,
285
+ "eval_EMAIL_number": 52,
286
+ "eval_EMAIL_precision": 0.0,
287
+ "eval_EMAIL_recall": 0.0,
288
+ "eval_GEOG_f1": 0.2758620689655173,
289
+ "eval_GEOG_number": 9,
290
+ "eval_GEOG_precision": 0.2,
291
+ "eval_GEOG_recall": 0.4444444444444444,
292
+ "eval_REGION_f1": 0.3544813695871098,
293
+ "eval_REGION_number": 351,
294
+ "eval_REGION_precision": 0.27414330218068533,
295
+ "eval_REGION_recall": 0.5014245014245015,
296
+ "eval_SITE_f1": 0.14779874213836475,
297
+ "eval_SITE_number": 330,
298
+ "eval_SITE_precision": 0.15359477124183007,
299
+ "eval_SITE_recall": 0.14242424242424243,
300
+ "eval_TAXA_f1": 0.7314578005115089,
301
+ "eval_TAXA_number": 525,
302
+ "eval_TAXA_precision": 0.6620370370370371,
303
+ "eval_TAXA_recall": 0.8171428571428572,
304
+ "eval_accuracy_entity": 0.9479539346042256,
305
+ "eval_accuracy_token": 0.9479539346042256,
306
+ "eval_f1_entity": 0.7052475850665739,
307
+ "eval_f1_token": 0.7052475850665739,
308
+ "eval_loss": 0.16586871445178986,
309
+ "eval_overall_accuracy": 0.9440380199711647,
310
+ "eval_overall_f1": 0.4548536209553159,
311
+ "eval_overall_precision": 0.40931780366056575,
312
+ "eval_overall_recall": 0.5117891816920943,
313
+ "eval_precision_entity": 0.6713055003313453,
314
+ "eval_precision_token": 0.6713055003313453,
315
+ "eval_recall_entity": 0.7428047662694776,
316
+ "eval_recall_token": 0.7428047662694776,
317
+ "eval_runtime": 12.6888,
318
+ "eval_samples_per_second": 14.895,
319
+ "eval_steps_per_second": 1.891,
320
+ "step": 125
321
+ },
322
+ {
323
+ "epoch": 3.27,
324
+ "learning_rate": 1.8762886597938147e-05,
325
+ "loss": 0.1471,
326
+ "step": 130
327
+ },
328
+ {
329
+ "epoch": 3.52,
330
+ "learning_rate": 1.8350515463917527e-05,
331
+ "loss": 0.1384,
332
+ "step": 140
333
+ },
334
+ {
335
+ "epoch": 3.77,
336
+ "learning_rate": 1.793814432989691e-05,
337
+ "loss": 0.1233,
338
+ "step": 150
339
+ },
340
+ {
341
+ "epoch": 3.77,
342
+ "eval_AGE_f1": 0.42245989304812837,
343
+ "eval_AGE_number": 159,
344
+ "eval_AGE_precision": 0.3674418604651163,
345
+ "eval_AGE_recall": 0.4968553459119497,
346
+ "eval_ALTI_f1": 0.0,
347
+ "eval_ALTI_number": 16,
348
+ "eval_ALTI_precision": 0.0,
349
+ "eval_ALTI_recall": 0.0,
350
+ "eval_EMAIL_f1": 0.17543859649122806,
351
+ "eval_EMAIL_number": 52,
352
+ "eval_EMAIL_precision": 1.0,
353
+ "eval_EMAIL_recall": 0.09615384615384616,
354
+ "eval_GEOG_f1": 0.3703703703703704,
355
+ "eval_GEOG_number": 9,
356
+ "eval_GEOG_precision": 0.2777777777777778,
357
+ "eval_GEOG_recall": 0.5555555555555556,
358
+ "eval_REGION_f1": 0.43149946062567424,
359
+ "eval_REGION_number": 351,
360
+ "eval_REGION_precision": 0.3472222222222222,
361
+ "eval_REGION_recall": 0.5698005698005698,
362
+ "eval_SITE_f1": 0.2934472934472935,
363
+ "eval_SITE_number": 330,
364
+ "eval_SITE_precision": 0.2768817204301075,
365
+ "eval_SITE_recall": 0.31212121212121213,
366
+ "eval_TAXA_f1": 0.7345890410958905,
367
+ "eval_TAXA_number": 525,
368
+ "eval_TAXA_precision": 0.6671850699844479,
369
+ "eval_TAXA_recall": 0.8171428571428572,
370
+ "eval_accuracy_entity": 0.9522080418646873,
371
+ "eval_accuracy_token": 0.9522080418646873,
372
+ "eval_f1_entity": 0.7402282947077135,
373
+ "eval_f1_token": 0.7402282947077135,
374
+ "eval_loss": 0.14876657724380493,
375
+ "eval_overall_accuracy": 0.9501076876524092,
376
+ "eval_overall_f1": 0.5018337408312958,
377
+ "eval_overall_precision": 0.4486338797814208,
378
+ "eval_overall_recall": 0.5693481276005548,
379
+ "eval_precision_entity": 0.7006056637747585,
380
+ "eval_precision_token": 0.7006056637747585,
381
+ "eval_recall_entity": 0.7846012832263978,
382
+ "eval_recall_token": 0.7846012832263978,
383
+ "eval_runtime": 11.4316,
384
+ "eval_samples_per_second": 16.533,
385
+ "eval_steps_per_second": 2.099,
386
+ "step": 150
387
+ },
388
+ {
389
+ "epoch": 4.03,
390
+ "learning_rate": 1.752577319587629e-05,
391
+ "loss": 0.1231,
392
+ "step": 160
393
+ },
394
+ {
395
+ "epoch": 4.28,
396
+ "learning_rate": 1.7113402061855672e-05,
397
+ "loss": 0.1084,
398
+ "step": 170
399
+ },
400
+ {
401
+ "epoch": 4.4,
402
+ "eval_AGE_f1": 0.6049046321525886,
403
+ "eval_AGE_number": 159,
404
+ "eval_AGE_precision": 0.5336538461538461,
405
+ "eval_AGE_recall": 0.6981132075471698,
406
+ "eval_ALTI_f1": 0.0,
407
+ "eval_ALTI_number": 16,
408
+ "eval_ALTI_precision": 0.0,
409
+ "eval_ALTI_recall": 0.0,
410
+ "eval_EMAIL_f1": 0.5555555555555556,
411
+ "eval_EMAIL_number": 52,
412
+ "eval_EMAIL_precision": 1.0,
413
+ "eval_EMAIL_recall": 0.38461538461538464,
414
+ "eval_GEOG_f1": 0.33333333333333326,
415
+ "eval_GEOG_number": 9,
416
+ "eval_GEOG_precision": 0.23809523809523808,
417
+ "eval_GEOG_recall": 0.5555555555555556,
418
+ "eval_REGION_f1": 0.4647887323943662,
419
+ "eval_REGION_number": 351,
420
+ "eval_REGION_precision": 0.39520958083832336,
421
+ "eval_REGION_recall": 0.5641025641025641,
422
+ "eval_SITE_f1": 0.3371104815864023,
423
+ "eval_SITE_number": 330,
424
+ "eval_SITE_precision": 0.31648936170212766,
425
+ "eval_SITE_recall": 0.3606060606060606,
426
+ "eval_TAXA_f1": 0.776173285198556,
427
+ "eval_TAXA_number": 525,
428
+ "eval_TAXA_precision": 0.7375643224699828,
429
+ "eval_TAXA_recall": 0.819047619047619,
430
+ "eval_accuracy_entity": 0.955144977839483,
431
+ "eval_accuracy_token": 0.955144977839483,
432
+ "eval_f1_entity": 0.7561658212349135,
433
+ "eval_f1_token": 0.7561658212349135,
434
+ "eval_loss": 0.137845978140831,
435
+ "eval_overall_accuracy": 0.9533828162546056,
436
+ "eval_overall_f1": 0.5576255131038838,
437
+ "eval_overall_precision": 0.5118840579710144,
438
+ "eval_overall_recall": 0.6123439667128987,
439
+ "eval_precision_entity": 0.7230306071249373,
440
+ "eval_precision_token": 0.7230306071249373,
441
+ "eval_recall_entity": 0.7924839596700275,
442
+ "eval_recall_token": 0.7924839596700275,
443
+ "eval_runtime": 12.8578,
444
+ "eval_samples_per_second": 14.699,
445
+ "eval_steps_per_second": 1.867,
446
+ "step": 175
447
+ },
448
+ {
449
+ "epoch": 4.53,
450
+ "learning_rate": 1.6701030927835052e-05,
451
+ "loss": 0.1,
452
+ "step": 180
453
+ },
454
+ {
455
+ "epoch": 4.78,
456
+ "learning_rate": 1.6288659793814433e-05,
457
+ "loss": 0.1068,
458
+ "step": 190
459
+ },
460
+ {
461
+ "epoch": 5.03,
462
+ "learning_rate": 1.5876288659793813e-05,
463
+ "loss": 0.0984,
464
+ "step": 200
465
+ },
466
+ {
467
+ "epoch": 5.03,
468
+ "eval_AGE_f1": 0.672316384180791,
469
+ "eval_AGE_number": 159,
470
+ "eval_AGE_precision": 0.6102564102564103,
471
+ "eval_AGE_recall": 0.7484276729559748,
472
+ "eval_ALTI_f1": 0.06060606060606061,
473
+ "eval_ALTI_number": 16,
474
+ "eval_ALTI_precision": 0.058823529411764705,
475
+ "eval_ALTI_recall": 0.0625,
476
+ "eval_EMAIL_f1": 0.7826086956521738,
477
+ "eval_EMAIL_number": 52,
478
+ "eval_EMAIL_precision": 0.9,
479
+ "eval_EMAIL_recall": 0.6923076923076923,
480
+ "eval_GEOG_f1": 0.42857142857142855,
481
+ "eval_GEOG_number": 9,
482
+ "eval_GEOG_precision": 0.3157894736842105,
483
+ "eval_GEOG_recall": 0.6666666666666666,
484
+ "eval_REGION_f1": 0.44173140954495005,
485
+ "eval_REGION_number": 351,
486
+ "eval_REGION_precision": 0.3618181818181818,
487
+ "eval_REGION_recall": 0.5669515669515669,
488
+ "eval_SITE_f1": 0.4200792602377807,
489
+ "eval_SITE_number": 330,
490
+ "eval_SITE_precision": 0.37236533957845436,
491
+ "eval_SITE_recall": 0.4818181818181818,
492
+ "eval_TAXA_f1": 0.7944954128440367,
493
+ "eval_TAXA_number": 525,
494
+ "eval_TAXA_precision": 0.7663716814159292,
495
+ "eval_TAXA_recall": 0.8247619047619048,
496
+ "eval_accuracy_entity": 0.9572097328278244,
497
+ "eval_accuracy_token": 0.9572097328278244,
498
+ "eval_f1_entity": 0.7708746230073245,
499
+ "eval_f1_token": 0.7708746230073245,
500
+ "eval_loss": 0.13383713364601135,
501
+ "eval_overall_accuracy": 0.9555721685267261,
502
+ "eval_overall_f1": 0.5855606758832566,
503
+ "eval_overall_precision": 0.5256480970766685,
504
+ "eval_overall_recall": 0.6608876560332871,
505
+ "eval_precision_entity": 0.7273170731707317,
506
+ "eval_precision_token": 0.7273170731707317,
507
+ "eval_recall_entity": 0.8199816681943172,
508
+ "eval_recall_token": 0.8199816681943172,
509
+ "eval_runtime": 9.949,
510
+ "eval_samples_per_second": 18.997,
511
+ "eval_steps_per_second": 2.412,
512
+ "step": 200
513
+ },
514
+ {
515
+ "epoch": 5.28,
516
+ "learning_rate": 1.5463917525773197e-05,
517
+ "loss": 0.0887,
518
+ "step": 210
519
+ },
520
+ {
521
+ "epoch": 5.53,
522
+ "learning_rate": 1.5051546391752578e-05,
523
+ "loss": 0.0872,
524
+ "step": 220
525
+ },
526
+ {
527
+ "epoch": 5.66,
528
+ "eval_AGE_f1": 0.6319018404907976,
529
+ "eval_AGE_number": 159,
530
+ "eval_AGE_precision": 0.6167664670658682,
531
+ "eval_AGE_recall": 0.6477987421383647,
532
+ "eval_ALTI_f1": 0.07407407407407407,
533
+ "eval_ALTI_number": 16,
534
+ "eval_ALTI_precision": 0.09090909090909091,
535
+ "eval_ALTI_recall": 0.0625,
536
+ "eval_EMAIL_f1": 0.9622641509433962,
537
+ "eval_EMAIL_number": 52,
538
+ "eval_EMAIL_precision": 0.9444444444444444,
539
+ "eval_EMAIL_recall": 0.9807692307692307,
540
+ "eval_GEOG_f1": 0.3870967741935484,
541
+ "eval_GEOG_number": 9,
542
+ "eval_GEOG_precision": 0.2727272727272727,
543
+ "eval_GEOG_recall": 0.6666666666666666,
544
+ "eval_REGION_f1": 0.4956709956709957,
545
+ "eval_REGION_number": 351,
546
+ "eval_REGION_precision": 0.39965095986038396,
547
+ "eval_REGION_recall": 0.6524216524216524,
548
+ "eval_SITE_f1": 0.4276048714479026,
549
+ "eval_SITE_number": 330,
550
+ "eval_SITE_precision": 0.3863080684596577,
551
+ "eval_SITE_recall": 0.47878787878787876,
552
+ "eval_TAXA_f1": 0.7708703374777975,
553
+ "eval_TAXA_number": 525,
554
+ "eval_TAXA_precision": 0.7221297836938436,
555
+ "eval_TAXA_recall": 0.8266666666666667,
556
+ "eval_accuracy_entity": 0.9552339758993253,
557
+ "eval_accuracy_token": 0.9552339758993253,
558
+ "eval_f1_entity": 0.7587956698240865,
559
+ "eval_f1_token": 0.7587956698240865,
560
+ "eval_loss": 0.14531326293945312,
561
+ "eval_overall_accuracy": 0.9539702034495648,
562
+ "eval_overall_f1": 0.598963098505642,
563
+ "eval_overall_precision": 0.5345672291780076,
564
+ "eval_overall_recall": 0.680998613037448,
565
+ "eval_precision_entity": 0.7043491913958235,
566
+ "eval_precision_token": 0.7043491913958235,
567
+ "eval_recall_entity": 0.8223648029330889,
568
+ "eval_recall_token": 0.8223648029330889,
569
+ "eval_runtime": 10.0713,
570
+ "eval_samples_per_second": 18.766,
571
+ "eval_steps_per_second": 2.383,
572
+ "step": 225
573
+ },
574
+ {
575
+ "epoch": 5.79,
576
+ "learning_rate": 1.4639175257731958e-05,
577
+ "loss": 0.086,
578
+ "step": 230
579
+ },
580
+ {
581
+ "epoch": 6.04,
582
+ "learning_rate": 1.4226804123711342e-05,
583
+ "loss": 0.0789,
584
+ "step": 240
585
+ },
586
+ {
587
+ "epoch": 6.29,
588
+ "learning_rate": 1.3814432989690723e-05,
589
+ "loss": 0.0713,
590
+ "step": 250
591
+ },
592
+ {
593
+ "epoch": 6.29,
594
+ "eval_AGE_f1": 0.6857142857142857,
595
+ "eval_AGE_number": 159,
596
+ "eval_AGE_precision": 0.6282722513089005,
597
+ "eval_AGE_recall": 0.7547169811320755,
598
+ "eval_ALTI_f1": 0.07142857142857144,
599
+ "eval_ALTI_number": 16,
600
+ "eval_ALTI_precision": 0.08333333333333333,
601
+ "eval_ALTI_recall": 0.0625,
602
+ "eval_EMAIL_f1": 0.859504132231405,
603
+ "eval_EMAIL_number": 52,
604
+ "eval_EMAIL_precision": 0.7536231884057971,
605
+ "eval_EMAIL_recall": 1.0,
606
+ "eval_GEOG_f1": 0.4,
607
+ "eval_GEOG_number": 9,
608
+ "eval_GEOG_precision": 0.2857142857142857,
609
+ "eval_GEOG_recall": 0.6666666666666666,
610
+ "eval_REGION_f1": 0.49940262843488653,
611
+ "eval_REGION_number": 351,
612
+ "eval_REGION_precision": 0.43004115226337447,
613
+ "eval_REGION_recall": 0.5954415954415955,
614
+ "eval_SITE_f1": 0.4341736694677871,
615
+ "eval_SITE_number": 330,
616
+ "eval_SITE_precision": 0.4036458333333333,
617
+ "eval_SITE_recall": 0.4696969696969697,
618
+ "eval_TAXA_f1": 0.7922437673130194,
619
+ "eval_TAXA_number": 525,
620
+ "eval_TAXA_precision": 0.7688172043010753,
621
+ "eval_TAXA_recall": 0.8171428571428572,
622
+ "eval_accuracy_entity": 0.9578683184706573,
623
+ "eval_accuracy_token": 0.9578683184706573,
624
+ "eval_f1_entity": 0.768325871301905,
625
+ "eval_f1_token": 0.768325871301905,
626
+ "eval_loss": 0.1395871937274933,
627
+ "eval_overall_accuracy": 0.9568181413645183,
628
+ "eval_overall_f1": 0.6146063863420803,
629
+ "eval_overall_precision": 0.5647879140034864,
630
+ "eval_overall_recall": 0.6740638002773925,
631
+ "eval_precision_entity": 0.7371967654986523,
632
+ "eval_precision_token": 0.7371967654986523,
633
+ "eval_recall_entity": 0.8021998166819432,
634
+ "eval_recall_token": 0.8021998166819432,
635
+ "eval_runtime": 12.126,
636
+ "eval_samples_per_second": 15.586,
637
+ "eval_steps_per_second": 1.979,
638
+ "step": 250
639
+ },
640
+ {
641
+ "epoch": 6.54,
642
+ "learning_rate": 1.3402061855670103e-05,
643
+ "loss": 0.0761,
644
+ "step": 260
645
+ },
646
+ {
647
+ "epoch": 6.79,
648
+ "learning_rate": 1.2989690721649485e-05,
649
+ "loss": 0.0715,
650
+ "step": 270
651
+ },
652
+ {
653
+ "epoch": 6.92,
654
+ "eval_AGE_f1": 0.7211267605633802,
655
+ "eval_AGE_number": 159,
656
+ "eval_AGE_precision": 0.6530612244897959,
657
+ "eval_AGE_recall": 0.8050314465408805,
658
+ "eval_ALTI_f1": 0.13333333333333333,
659
+ "eval_ALTI_number": 16,
660
+ "eval_ALTI_precision": 0.14285714285714285,
661
+ "eval_ALTI_recall": 0.125,
662
+ "eval_EMAIL_f1": 0.8455284552845529,
663
+ "eval_EMAIL_number": 52,
664
+ "eval_EMAIL_precision": 0.7323943661971831,
665
+ "eval_EMAIL_recall": 1.0,
666
+ "eval_GEOG_f1": 0.3870967741935484,
667
+ "eval_GEOG_number": 9,
668
+ "eval_GEOG_precision": 0.2727272727272727,
669
+ "eval_GEOG_recall": 0.6666666666666666,
670
+ "eval_REGION_f1": 0.5431818181818181,
671
+ "eval_REGION_number": 351,
672
+ "eval_REGION_precision": 0.45179584120982985,
673
+ "eval_REGION_recall": 0.6809116809116809,
674
+ "eval_SITE_f1": 0.45517241379310347,
675
+ "eval_SITE_number": 330,
676
+ "eval_SITE_precision": 0.4177215189873418,
677
+ "eval_SITE_recall": 0.5,
678
+ "eval_TAXA_f1": 0.7958412098298677,
679
+ "eval_TAXA_number": 525,
680
+ "eval_TAXA_precision": 0.7898686679174484,
681
+ "eval_TAXA_recall": 0.8019047619047619,
682
+ "eval_accuracy_entity": 0.9568893398123921,
683
+ "eval_accuracy_token": 0.9568893398123921,
684
+ "eval_f1_entity": 0.7651905252317198,
685
+ "eval_f1_token": 0.7651905252317198,
686
+ "eval_loss": 0.14375238120555878,
687
+ "eval_overall_accuracy": 0.9557857638703476,
688
+ "eval_overall_f1": 0.6327295440349782,
689
+ "eval_overall_precision": 0.5755681818181818,
690
+ "eval_overall_recall": 0.70249653259362,
691
+ "eval_precision_entity": 0.7193803453283847,
692
+ "eval_precision_token": 0.7193803453283847,
693
+ "eval_recall_entity": 0.8172318973418882,
694
+ "eval_recall_token": 0.8172318973418882,
695
+ "eval_runtime": 12.8036,
696
+ "eval_samples_per_second": 14.761,
697
+ "eval_steps_per_second": 1.874,
698
+ "step": 275
699
+ },
700
+ {
701
+ "epoch": 7.04,
702
+ "learning_rate": 1.2577319587628866e-05,
703
+ "loss": 0.0779,
704
+ "step": 280
705
+ },
706
+ {
707
+ "epoch": 7.3,
708
+ "learning_rate": 1.2164948453608248e-05,
709
+ "loss": 0.0652,
710
+ "step": 290
711
+ },
712
+ {
713
+ "epoch": 7.55,
714
+ "learning_rate": 1.175257731958763e-05,
715
+ "loss": 0.0651,
716
+ "step": 300
717
+ },
718
+ {
719
+ "epoch": 7.55,
720
+ "eval_AGE_f1": 0.7202380952380952,
721
+ "eval_AGE_number": 159,
722
+ "eval_AGE_precision": 0.6836158192090396,
723
+ "eval_AGE_recall": 0.7610062893081762,
724
+ "eval_ALTI_f1": 0.06896551724137931,
725
+ "eval_ALTI_number": 16,
726
+ "eval_ALTI_precision": 0.07692307692307693,
727
+ "eval_ALTI_recall": 0.0625,
728
+ "eval_EMAIL_f1": 0.7428571428571429,
729
+ "eval_EMAIL_number": 52,
730
+ "eval_EMAIL_precision": 0.5909090909090909,
731
+ "eval_EMAIL_recall": 1.0,
732
+ "eval_GEOG_f1": 0.42857142857142855,
733
+ "eval_GEOG_number": 9,
734
+ "eval_GEOG_precision": 0.3157894736842105,
735
+ "eval_GEOG_recall": 0.6666666666666666,
736
+ "eval_REGION_f1": 0.5471478463329453,
737
+ "eval_REGION_number": 351,
738
+ "eval_REGION_precision": 0.4625984251968504,
739
+ "eval_REGION_recall": 0.6695156695156695,
740
+ "eval_SITE_f1": 0.4159544159544159,
741
+ "eval_SITE_number": 330,
742
+ "eval_SITE_precision": 0.3924731182795699,
743
+ "eval_SITE_recall": 0.44242424242424244,
744
+ "eval_TAXA_f1": 0.8036697247706422,
745
+ "eval_TAXA_number": 525,
746
+ "eval_TAXA_precision": 0.7752212389380531,
747
+ "eval_TAXA_recall": 0.8342857142857143,
748
+ "eval_accuracy_entity": 0.9569427386482975,
749
+ "eval_accuracy_token": 0.9569427386482975,
750
+ "eval_f1_entity": 0.7655160390516038,
751
+ "eval_f1_token": 0.7655160390516038,
752
+ "eval_loss": 0.13883507251739502,
753
+ "eval_overall_accuracy": 0.9559281607660953,
754
+ "eval_overall_f1": 0.6275125628140703,
755
+ "eval_overall_precision": 0.5734787600459242,
756
+ "eval_overall_recall": 0.6927877947295423,
757
+ "eval_precision_entity": 0.7297656639521356,
758
+ "eval_precision_token": 0.7297656639521356,
759
+ "eval_recall_entity": 0.8049495875343722,
760
+ "eval_recall_token": 0.8049495875343722,
761
+ "eval_runtime": 10.0268,
762
+ "eval_samples_per_second": 18.85,
763
+ "eval_steps_per_second": 2.394,
764
+ "step": 300
765
+ },
766
+ {
767
+ "epoch": 7.8,
768
+ "learning_rate": 1.134020618556701e-05,
769
+ "loss": 0.0616,
770
+ "step": 310
771
+ },
772
+ {
773
+ "epoch": 8.05,
774
+ "learning_rate": 1.0927835051546391e-05,
775
+ "loss": 0.0629,
776
+ "step": 320
777
+ },
778
+ {
779
+ "epoch": 8.18,
780
+ "eval_AGE_f1": 0.702857142857143,
781
+ "eval_AGE_number": 159,
782
+ "eval_AGE_precision": 0.643979057591623,
783
+ "eval_AGE_recall": 0.7735849056603774,
784
+ "eval_ALTI_f1": 0.07692307692307693,
785
+ "eval_ALTI_number": 16,
786
+ "eval_ALTI_precision": 0.1,
787
+ "eval_ALTI_recall": 0.0625,
788
+ "eval_EMAIL_f1": 0.787878787878788,
789
+ "eval_EMAIL_number": 52,
790
+ "eval_EMAIL_precision": 0.65,
791
+ "eval_EMAIL_recall": 1.0,
792
+ "eval_GEOG_f1": 0.41379310344827586,
793
+ "eval_GEOG_number": 9,
794
+ "eval_GEOG_precision": 0.3,
795
+ "eval_GEOG_recall": 0.6666666666666666,
796
+ "eval_REGION_f1": 0.5244040862656072,
797
+ "eval_REGION_number": 351,
798
+ "eval_REGION_precision": 0.4358490566037736,
799
+ "eval_REGION_recall": 0.6581196581196581,
800
+ "eval_SITE_f1": 0.39538239538239534,
801
+ "eval_SITE_number": 330,
802
+ "eval_SITE_precision": 0.3774104683195592,
803
+ "eval_SITE_recall": 0.41515151515151516,
804
+ "eval_TAXA_f1": 0.7945701357466064,
805
+ "eval_TAXA_number": 525,
806
+ "eval_TAXA_precision": 0.756896551724138,
807
+ "eval_TAXA_recall": 0.8361904761904762,
808
+ "eval_accuracy_entity": 0.9557857638703476,
809
+ "eval_accuracy_token": 0.9557857638703476,
810
+ "eval_f1_entity": 0.7590018133149123,
811
+ "eval_f1_token": 0.7590018133149123,
812
+ "eval_loss": 0.14412528276443481,
813
+ "eval_overall_accuracy": 0.9548245848240509,
814
+ "eval_overall_f1": 0.6150497512437811,
815
+ "eval_overall_precision": 0.5574971815107103,
816
+ "eval_overall_recall": 0.6858529819694869,
817
+ "eval_precision_entity": 0.7174338883447601,
818
+ "eval_precision_token": 0.7174338883447601,
819
+ "eval_recall_entity": 0.8056828597616865,
820
+ "eval_recall_token": 0.8056828597616865,
821
+ "eval_runtime": 10.4306,
822
+ "eval_samples_per_second": 18.12,
823
+ "eval_steps_per_second": 2.301,
824
+ "step": 325
825
+ },
826
+ {
827
+ "epoch": 8.3,
828
+ "learning_rate": 1.0515463917525775e-05,
829
+ "loss": 0.0556,
830
+ "step": 330
831
+ },
832
+ {
833
+ "epoch": 8.55,
834
+ "learning_rate": 1.0103092783505156e-05,
835
+ "loss": 0.0609,
836
+ "step": 340
837
+ },
838
+ {
839
+ "epoch": 8.81,
840
+ "learning_rate": 9.690721649484536e-06,
841
+ "loss": 0.0558,
842
+ "step": 350
843
+ },
844
+ {
845
+ "epoch": 8.81,
846
+ "eval_AGE_f1": 0.6822157434402333,
847
+ "eval_AGE_number": 159,
848
+ "eval_AGE_precision": 0.6358695652173914,
849
+ "eval_AGE_recall": 0.7358490566037735,
850
+ "eval_ALTI_f1": 0.12121212121212122,
851
+ "eval_ALTI_number": 16,
852
+ "eval_ALTI_precision": 0.11764705882352941,
853
+ "eval_ALTI_recall": 0.125,
854
+ "eval_EMAIL_f1": 0.7482014388489209,
855
+ "eval_EMAIL_number": 52,
856
+ "eval_EMAIL_precision": 0.5977011494252874,
857
+ "eval_EMAIL_recall": 1.0,
858
+ "eval_GEOG_f1": 0.37500000000000006,
859
+ "eval_GEOG_number": 9,
860
+ "eval_GEOG_precision": 0.2608695652173913,
861
+ "eval_GEOG_recall": 0.6666666666666666,
862
+ "eval_REGION_f1": 0.5439429928741093,
863
+ "eval_REGION_number": 351,
864
+ "eval_REGION_precision": 0.4663951120162933,
865
+ "eval_REGION_recall": 0.6524216524216524,
866
+ "eval_SITE_f1": 0.4425531914893617,
867
+ "eval_SITE_number": 330,
868
+ "eval_SITE_precision": 0.416,
869
+ "eval_SITE_recall": 0.4727272727272727,
870
+ "eval_TAXA_f1": 0.7924865831842576,
871
+ "eval_TAXA_number": 525,
872
+ "eval_TAXA_precision": 0.7470489038785835,
873
+ "eval_TAXA_recall": 0.8438095238095238,
874
+ "eval_accuracy_entity": 0.9551983766753884,
875
+ "eval_accuracy_token": 0.9551983766753884,
876
+ "eval_f1_entity": 0.7571195044308698,
877
+ "eval_f1_token": 0.7571195044308698,
878
+ "eval_loss": 0.14811000227928162,
879
+ "eval_overall_accuracy": 0.9542371976290916,
880
+ "eval_overall_f1": 0.6257783312577834,
881
+ "eval_overall_precision": 0.5677966101694916,
882
+ "eval_overall_recall": 0.6969486823855756,
883
+ "eval_precision_entity": 0.7133592736705577,
884
+ "eval_precision_token": 0.7133592736705577,
885
+ "eval_recall_entity": 0.8065994500458296,
886
+ "eval_recall_token": 0.8065994500458296,
887
+ "eval_runtime": 11.3308,
888
+ "eval_samples_per_second": 16.68,
889
+ "eval_steps_per_second": 2.118,
890
+ "step": 350
891
+ },
892
+ {
893
+ "epoch": 9.06,
894
+ "learning_rate": 9.278350515463918e-06,
895
+ "loss": 0.0597,
896
+ "step": 360
897
+ },
898
+ {
899
+ "epoch": 9.31,
900
+ "learning_rate": 8.865979381443299e-06,
901
+ "loss": 0.056,
902
+ "step": 370
903
+ },
904
+ {
905
+ "epoch": 9.43,
906
+ "eval_AGE_f1": 0.7079646017699115,
907
+ "eval_AGE_number": 159,
908
+ "eval_AGE_precision": 0.6666666666666666,
909
+ "eval_AGE_recall": 0.7547169811320755,
910
+ "eval_ALTI_f1": 0.15384615384615385,
911
+ "eval_ALTI_number": 16,
912
+ "eval_ALTI_precision": 0.2,
913
+ "eval_ALTI_recall": 0.125,
914
+ "eval_EMAIL_f1": 0.6666666666666666,
915
+ "eval_EMAIL_number": 52,
916
+ "eval_EMAIL_precision": 0.5,
917
+ "eval_EMAIL_recall": 1.0,
918
+ "eval_GEOG_f1": 0.4,
919
+ "eval_GEOG_number": 9,
920
+ "eval_GEOG_precision": 0.2857142857142857,
921
+ "eval_GEOG_recall": 0.6666666666666666,
922
+ "eval_REGION_f1": 0.5555555555555556,
923
+ "eval_REGION_number": 351,
924
+ "eval_REGION_precision": 0.4613935969868173,
925
+ "eval_REGION_recall": 0.698005698005698,
926
+ "eval_SITE_f1": 0.47632311977715874,
927
+ "eval_SITE_number": 330,
928
+ "eval_SITE_precision": 0.44072164948453607,
929
+ "eval_SITE_recall": 0.5181818181818182,
930
+ "eval_TAXA_f1": 0.8040109389243391,
931
+ "eval_TAXA_number": 525,
932
+ "eval_TAXA_precision": 0.7709790209790209,
933
+ "eval_TAXA_recall": 0.84,
934
+ "eval_accuracy_entity": 0.9559993592139692,
935
+ "eval_accuracy_token": 0.9559993592139692,
936
+ "eval_f1_entity": 0.7634735597229263,
937
+ "eval_f1_token": 0.7634735597229263,
938
+ "eval_loss": 0.15191707015037537,
939
+ "eval_overall_accuracy": 0.9548779836599562,
940
+ "eval_overall_f1": 0.6385467980295567,
941
+ "eval_overall_precision": 0.5741971207087486,
942
+ "eval_overall_recall": 0.7191400832177531,
943
+ "eval_precision_entity": 0.7079743067523109,
944
+ "eval_precision_token": 0.7079743067523109,
945
+ "eval_recall_entity": 0.8284142988084326,
946
+ "eval_recall_token": 0.8284142988084326,
947
+ "eval_runtime": 9.9604,
948
+ "eval_samples_per_second": 18.975,
949
+ "eval_steps_per_second": 2.41,
950
+ "step": 375
951
+ },
952
+ {
953
+ "epoch": 9.56,
954
+ "learning_rate": 8.453608247422681e-06,
955
+ "loss": 0.0579,
956
+ "step": 380
957
+ },
958
+ {
959
+ "epoch": 9.81,
960
+ "learning_rate": 8.041237113402063e-06,
961
+ "loss": 0.0499,
962
+ "step": 390
963
+ },
964
+ {
965
+ "epoch": 10.06,
966
+ "learning_rate": 7.628865979381444e-06,
967
+ "loss": 0.0529,
968
+ "step": 400
969
+ },
970
+ {
971
+ "epoch": 10.06,
972
+ "eval_AGE_f1": 0.7025495750708216,
973
+ "eval_AGE_number": 159,
974
+ "eval_AGE_precision": 0.6391752577319587,
975
+ "eval_AGE_recall": 0.779874213836478,
976
+ "eval_ALTI_f1": 0.3225806451612903,
977
+ "eval_ALTI_number": 16,
978
+ "eval_ALTI_precision": 0.3333333333333333,
979
+ "eval_ALTI_recall": 0.3125,
980
+ "eval_EMAIL_f1": 0.7819548872180451,
981
+ "eval_EMAIL_number": 52,
982
+ "eval_EMAIL_precision": 0.6419753086419753,
983
+ "eval_EMAIL_recall": 1.0,
984
+ "eval_GEOG_f1": 0.4,
985
+ "eval_GEOG_number": 9,
986
+ "eval_GEOG_precision": 0.2857142857142857,
987
+ "eval_GEOG_recall": 0.6666666666666666,
988
+ "eval_REGION_f1": 0.5511811023622047,
989
+ "eval_REGION_number": 351,
990
+ "eval_REGION_precision": 0.45539033457249073,
991
+ "eval_REGION_recall": 0.698005698005698,
992
+ "eval_SITE_f1": 0.4936530324400564,
993
+ "eval_SITE_number": 330,
994
+ "eval_SITE_precision": 0.46174142480211083,
995
+ "eval_SITE_recall": 0.5303030303030303,
996
+ "eval_TAXA_f1": 0.8047445255474452,
997
+ "eval_TAXA_number": 525,
998
+ "eval_TAXA_precision": 0.7723292469352014,
999
+ "eval_TAXA_recall": 0.84,
1000
+ "eval_accuracy_entity": 0.9571207347679821,
1001
+ "eval_accuracy_token": 0.9571207347679821,
1002
+ "eval_f1_entity": 0.7682700421940929,
1003
+ "eval_f1_token": 0.7682700421940929,
1004
+ "eval_loss": 0.154266357421875,
1005
+ "eval_overall_accuracy": 0.9559993592139692,
1006
+ "eval_overall_f1": 0.646713977167541,
1007
+ "eval_overall_precision": 0.5825458588104503,
1008
+ "eval_overall_recall": 0.7267683772538142,
1009
+ "eval_precision_entity": 0.7118060985144644,
1010
+ "eval_precision_token": 0.7118060985144644,
1011
+ "eval_recall_entity": 0.8344637946837764,
1012
+ "eval_recall_token": 0.8344637946837764,
1013
+ "eval_runtime": 10.1935,
1014
+ "eval_samples_per_second": 18.541,
1015
+ "eval_steps_per_second": 2.354,
1016
+ "step": 400
1017
+ },
1018
+ {
1019
+ "epoch": 10.31,
1020
+ "learning_rate": 7.216494845360825e-06,
1021
+ "loss": 0.0504,
1022
+ "step": 410
1023
+ },
1024
+ {
1025
+ "epoch": 10.57,
1026
+ "learning_rate": 6.804123711340207e-06,
1027
+ "loss": 0.0527,
1028
+ "step": 420
1029
+ },
1030
+ {
1031
+ "epoch": 10.69,
1032
+ "eval_AGE_f1": 0.6966292134831462,
1033
+ "eval_AGE_number": 159,
1034
+ "eval_AGE_precision": 0.6294416243654822,
1035
+ "eval_AGE_recall": 0.779874213836478,
1036
+ "eval_ALTI_f1": 0.2962962962962963,
1037
+ "eval_ALTI_number": 16,
1038
+ "eval_ALTI_precision": 0.36363636363636365,
1039
+ "eval_ALTI_recall": 0.25,
1040
+ "eval_EMAIL_f1": 0.7938931297709924,
1041
+ "eval_EMAIL_number": 52,
1042
+ "eval_EMAIL_precision": 0.6582278481012658,
1043
+ "eval_EMAIL_recall": 1.0,
1044
+ "eval_GEOG_f1": 0.37500000000000006,
1045
+ "eval_GEOG_number": 9,
1046
+ "eval_GEOG_precision": 0.2608695652173913,
1047
+ "eval_GEOG_recall": 0.6666666666666666,
1048
+ "eval_REGION_f1": 0.5187878787878788,
1049
+ "eval_REGION_number": 351,
1050
+ "eval_REGION_precision": 0.45147679324894513,
1051
+ "eval_REGION_recall": 0.6096866096866097,
1052
+ "eval_SITE_f1": 0.36940836940836935,
1053
+ "eval_SITE_number": 330,
1054
+ "eval_SITE_precision": 0.3526170798898072,
1055
+ "eval_SITE_recall": 0.3878787878787879,
1056
+ "eval_TAXA_f1": 0.7914735866543096,
1057
+ "eval_TAXA_number": 525,
1058
+ "eval_TAXA_precision": 0.7707581227436823,
1059
+ "eval_TAXA_recall": 0.8133333333333334,
1060
+ "eval_accuracy_entity": 0.9547355867642086,
1061
+ "eval_accuracy_token": 0.9547355867642086,
1062
+ "eval_f1_entity": 0.7530343007915568,
1063
+ "eval_f1_token": 0.7530343007915568,
1064
+ "eval_loss": 0.15111711621284485,
1065
+ "eval_overall_accuracy": 0.9537744077179118,
1066
+ "eval_overall_f1": 0.6076996500159084,
1067
+ "eval_overall_precision": 0.5614344503233392,
1068
+ "eval_overall_recall": 0.6622746185852982,
1069
+ "eval_precision_entity": 0.7237531699070161,
1070
+ "eval_precision_token": 0.7237531699070161,
1071
+ "eval_recall_entity": 0.7847846012832264,
1072
+ "eval_recall_token": 0.7847846012832264,
1073
+ "eval_runtime": 10.0406,
1074
+ "eval_samples_per_second": 18.824,
1075
+ "eval_steps_per_second": 2.39,
1076
+ "step": 425
1077
+ },
1078
+ {
1079
+ "epoch": 10.82,
1080
+ "learning_rate": 6.391752577319588e-06,
1081
+ "loss": 0.0483,
1082
+ "step": 430
1083
+ },
1084
+ {
1085
+ "epoch": 11.07,
1086
+ "learning_rate": 5.979381443298969e-06,
1087
+ "loss": 0.0487,
1088
+ "step": 440
1089
+ },
1090
+ {
1091
+ "epoch": 11.32,
1092
+ "learning_rate": 5.567010309278351e-06,
1093
+ "loss": 0.0508,
1094
+ "step": 450
1095
+ },
1096
+ {
1097
+ "epoch": 11.32,
1098
+ "eval_AGE_f1": 0.7130434782608696,
1099
+ "eval_AGE_number": 159,
1100
+ "eval_AGE_precision": 0.6612903225806451,
1101
+ "eval_AGE_recall": 0.7735849056603774,
1102
+ "eval_ALTI_f1": 0.21428571428571427,
1103
+ "eval_ALTI_number": 16,
1104
+ "eval_ALTI_precision": 0.25,
1105
+ "eval_ALTI_recall": 0.1875,
1106
+ "eval_EMAIL_f1": 0.7428571428571429,
1107
+ "eval_EMAIL_number": 52,
1108
+ "eval_EMAIL_precision": 0.5909090909090909,
1109
+ "eval_EMAIL_recall": 1.0,
1110
+ "eval_GEOG_f1": 0.4,
1111
+ "eval_GEOG_number": 9,
1112
+ "eval_GEOG_precision": 0.2857142857142857,
1113
+ "eval_GEOG_recall": 0.6666666666666666,
1114
+ "eval_REGION_f1": 0.525030525030525,
1115
+ "eval_REGION_number": 351,
1116
+ "eval_REGION_precision": 0.4594017094017094,
1117
+ "eval_REGION_recall": 0.6125356125356125,
1118
+ "eval_SITE_f1": 0.38904899135446686,
1119
+ "eval_SITE_number": 330,
1120
+ "eval_SITE_precision": 0.3708791208791209,
1121
+ "eval_SITE_recall": 0.4090909090909091,
1122
+ "eval_TAXA_f1": 0.7802197802197802,
1123
+ "eval_TAXA_number": 525,
1124
+ "eval_TAXA_precision": 0.7513227513227513,
1125
+ "eval_TAXA_recall": 0.8114285714285714,
1126
+ "eval_accuracy_entity": 0.9558925615421584,
1127
+ "eval_accuracy_token": 0.9558925615421584,
1128
+ "eval_f1_entity": 0.7576967438559136,
1129
+ "eval_f1_token": 0.7576967438559136,
1130
+ "eval_loss": 0.15142428874969482,
1131
+ "eval_overall_accuracy": 0.9549135828838932,
1132
+ "eval_overall_f1": 0.6099110546378654,
1133
+ "eval_overall_precision": 0.5627198124267292,
1134
+ "eval_overall_recall": 0.665742024965326,
1135
+ "eval_precision_entity": 0.734181568088033,
1136
+ "eval_precision_token": 0.734181568088033,
1137
+ "eval_recall_entity": 0.7827681026581118,
1138
+ "eval_recall_token": 0.7827681026581118,
1139
+ "eval_runtime": 9.85,
1140
+ "eval_samples_per_second": 19.188,
1141
+ "eval_steps_per_second": 2.437,
1142
+ "step": 450
1143
+ },
1144
+ {
1145
+ "epoch": 11.57,
1146
+ "learning_rate": 5.154639175257732e-06,
1147
+ "loss": 0.0464,
1148
+ "step": 460
1149
+ },
1150
+ {
1151
+ "epoch": 11.82,
1152
+ "learning_rate": 4.742268041237113e-06,
1153
+ "loss": 0.0459,
1154
+ "step": 470
1155
+ },
1156
+ {
1157
+ "epoch": 11.95,
1158
+ "eval_AGE_f1": 0.6956521739130435,
1159
+ "eval_AGE_number": 159,
1160
+ "eval_AGE_precision": 0.6451612903225806,
1161
+ "eval_AGE_recall": 0.7547169811320755,
1162
+ "eval_ALTI_f1": 0.13793103448275862,
1163
+ "eval_ALTI_number": 16,
1164
+ "eval_ALTI_precision": 0.15384615384615385,
1165
+ "eval_ALTI_recall": 0.125,
1166
+ "eval_EMAIL_f1": 0.732394366197183,
1167
+ "eval_EMAIL_number": 52,
1168
+ "eval_EMAIL_precision": 0.5777777777777777,
1169
+ "eval_EMAIL_recall": 1.0,
1170
+ "eval_GEOG_f1": 0.3870967741935484,
1171
+ "eval_GEOG_number": 9,
1172
+ "eval_GEOG_precision": 0.2727272727272727,
1173
+ "eval_GEOG_recall": 0.6666666666666666,
1174
+ "eval_REGION_f1": 0.5467980295566502,
1175
+ "eval_REGION_number": 351,
1176
+ "eval_REGION_precision": 0.48156182212581344,
1177
+ "eval_REGION_recall": 0.6324786324786325,
1178
+ "eval_SITE_f1": 0.41466854724964736,
1179
+ "eval_SITE_number": 330,
1180
+ "eval_SITE_precision": 0.38786279683377306,
1181
+ "eval_SITE_recall": 0.44545454545454544,
1182
+ "eval_TAXA_f1": 0.7944700460829494,
1183
+ "eval_TAXA_number": 525,
1184
+ "eval_TAXA_precision": 0.7696428571428572,
1185
+ "eval_TAXA_recall": 0.820952380952381,
1186
+ "eval_accuracy_entity": 0.9552161762873569,
1187
+ "eval_accuracy_token": 0.9552161762873569,
1188
+ "eval_f1_entity": 0.7573407684935088,
1189
+ "eval_f1_token": 0.7573407684935088,
1190
+ "eval_loss": 0.15560036897659302,
1191
+ "eval_overall_accuracy": 0.9541481995692493,
1192
+ "eval_overall_f1": 0.6216301934665398,
1193
+ "eval_overall_precision": 0.5727644652250146,
1194
+ "eval_overall_recall": 0.6796116504854369,
1195
+ "eval_precision_entity": 0.7216871471272003,
1196
+ "eval_precision_token": 0.7216871471272003,
1197
+ "eval_recall_entity": 0.7967002749770853,
1198
+ "eval_recall_token": 0.7967002749770853,
1199
+ "eval_runtime": 10.1795,
1200
+ "eval_samples_per_second": 18.567,
1201
+ "eval_steps_per_second": 2.358,
1202
+ "step": 475
1203
+ },
1204
+ {
1205
+ "epoch": 12.08,
1206
+ "learning_rate": 4.329896907216495e-06,
1207
+ "loss": 0.0418,
1208
+ "step": 480
1209
+ },
1210
+ {
1211
+ "epoch": 12.33,
1212
+ "learning_rate": 3.917525773195877e-06,
1213
+ "loss": 0.045,
1214
+ "step": 490
1215
+ },
1216
+ {
1217
+ "epoch": 12.58,
1218
+ "learning_rate": 3.5051546391752577e-06,
1219
+ "loss": 0.0484,
1220
+ "step": 500
1221
+ },
1222
+ {
1223
+ "epoch": 12.58,
1224
+ "eval_AGE_f1": 0.7134502923976608,
1225
+ "eval_AGE_number": 159,
1226
+ "eval_AGE_precision": 0.6666666666666666,
1227
+ "eval_AGE_recall": 0.7672955974842768,
1228
+ "eval_ALTI_f1": 0.20689655172413793,
1229
+ "eval_ALTI_number": 16,
1230
+ "eval_ALTI_precision": 0.23076923076923078,
1231
+ "eval_ALTI_recall": 0.1875,
1232
+ "eval_EMAIL_f1": 0.7172413793103448,
1233
+ "eval_EMAIL_number": 52,
1234
+ "eval_EMAIL_precision": 0.5591397849462365,
1235
+ "eval_EMAIL_recall": 1.0,
1236
+ "eval_GEOG_f1": 0.3870967741935484,
1237
+ "eval_GEOG_number": 9,
1238
+ "eval_GEOG_precision": 0.2727272727272727,
1239
+ "eval_GEOG_recall": 0.6666666666666666,
1240
+ "eval_REGION_f1": 0.560093348891482,
1241
+ "eval_REGION_number": 351,
1242
+ "eval_REGION_precision": 0.4743083003952569,
1243
+ "eval_REGION_recall": 0.6837606837606838,
1244
+ "eval_SITE_f1": 0.44044321329639885,
1245
+ "eval_SITE_number": 330,
1246
+ "eval_SITE_precision": 0.40561224489795916,
1247
+ "eval_SITE_recall": 0.4818181818181818,
1248
+ "eval_TAXA_f1": 0.7956600361663652,
1249
+ "eval_TAXA_number": 525,
1250
+ "eval_TAXA_precision": 0.7573149741824441,
1251
+ "eval_TAXA_recall": 0.8380952380952381,
1252
+ "eval_accuracy_entity": 0.9561061568857799,
1253
+ "eval_accuracy_token": 0.9561061568857799,
1254
+ "eval_f1_entity": 0.7653287788215201,
1255
+ "eval_f1_token": 0.7653287788215201,
1256
+ "eval_loss": 0.15589508414268494,
1257
+ "eval_overall_accuracy": 0.9551271782275147,
1258
+ "eval_overall_f1": 0.6324257425742574,
1259
+ "eval_overall_precision": 0.5709497206703911,
1260
+ "eval_overall_recall": 0.7087378640776699,
1261
+ "eval_precision_entity": 0.71638689048761,
1262
+ "eval_precision_token": 0.71638689048761,
1263
+ "eval_recall_entity": 0.821448212648946,
1264
+ "eval_recall_token": 0.821448212648946,
1265
+ "eval_runtime": 12.7467,
1266
+ "eval_samples_per_second": 14.827,
1267
+ "eval_steps_per_second": 1.883,
1268
+ "step": 500
1269
+ },
1270
+ {
1271
+ "epoch": 12.83,
1272
+ "learning_rate": 3.0927835051546395e-06,
1273
+ "loss": 0.0461,
1274
+ "step": 510
1275
+ },
1276
+ {
1277
+ "epoch": 13.08,
1278
+ "learning_rate": 2.680412371134021e-06,
1279
+ "loss": 0.0386,
1280
+ "step": 520
1281
+ },
1282
+ {
1283
+ "epoch": 13.21,
1284
+ "eval_AGE_f1": 0.7055393586005833,
1285
+ "eval_AGE_number": 159,
1286
+ "eval_AGE_precision": 0.657608695652174,
1287
+ "eval_AGE_recall": 0.7610062893081762,
1288
+ "eval_ALTI_f1": 0.0,
1289
+ "eval_ALTI_number": 16,
1290
+ "eval_ALTI_precision": 0.0,
1291
+ "eval_ALTI_recall": 0.0,
1292
+ "eval_EMAIL_f1": 0.6933333333333334,
1293
+ "eval_EMAIL_number": 52,
1294
+ "eval_EMAIL_precision": 0.5306122448979592,
1295
+ "eval_EMAIL_recall": 1.0,
1296
+ "eval_GEOG_f1": 0.41379310344827586,
1297
+ "eval_GEOG_number": 9,
1298
+ "eval_GEOG_precision": 0.3,
1299
+ "eval_GEOG_recall": 0.6666666666666666,
1300
+ "eval_REGION_f1": 0.558858501783591,
1301
+ "eval_REGION_number": 351,
1302
+ "eval_REGION_precision": 0.47959183673469385,
1303
+ "eval_REGION_recall": 0.6695156695156695,
1304
+ "eval_SITE_f1": 0.42758620689655175,
1305
+ "eval_SITE_number": 330,
1306
+ "eval_SITE_precision": 0.3924050632911392,
1307
+ "eval_SITE_recall": 0.4696969696969697,
1308
+ "eval_TAXA_f1": 0.7948951686417502,
1309
+ "eval_TAXA_number": 525,
1310
+ "eval_TAXA_precision": 0.7622377622377622,
1311
+ "eval_TAXA_recall": 0.8304761904761905,
1312
+ "eval_accuracy_entity": 0.9557679642583792,
1313
+ "eval_accuracy_token": 0.9557679642583792,
1314
+ "eval_f1_entity": 0.7621009268795055,
1315
+ "eval_f1_token": 0.7621009268795055,
1316
+ "eval_loss": 0.15739484131336212,
1317
+ "eval_overall_accuracy": 0.9548245848240509,
1318
+ "eval_overall_f1": 0.6255835667600373,
1319
+ "eval_overall_precision": 0.567476002258611,
1320
+ "eval_overall_recall": 0.6969486823855756,
1321
+ "eval_precision_entity": 0.716475714055188,
1322
+ "eval_precision_token": 0.716475714055188,
1323
+ "eval_recall_entity": 0.8139321723189734,
1324
+ "eval_recall_token": 0.8139321723189734,
1325
+ "eval_runtime": 10.5618,
1326
+ "eval_samples_per_second": 17.895,
1327
+ "eval_steps_per_second": 2.272,
1328
+ "step": 525
1329
+ },
1330
+ {
1331
+ "epoch": 13.33,
1332
+ "learning_rate": 2.268041237113402e-06,
1333
+ "loss": 0.0405,
1334
+ "step": 530
1335
+ },
1336
+ {
1337
+ "epoch": 13.58,
1338
+ "learning_rate": 1.8556701030927837e-06,
1339
+ "loss": 0.0438,
1340
+ "step": 540
1341
+ },
1342
+ {
1343
+ "epoch": 13.84,
1344
+ "learning_rate": 1.4432989690721649e-06,
1345
+ "loss": 0.0464,
1346
+ "step": 550
1347
+ },
1348
+ {
1349
+ "epoch": 13.84,
1350
+ "eval_AGE_f1": 0.7045454545454547,
1351
+ "eval_AGE_number": 159,
1352
+ "eval_AGE_precision": 0.6424870466321243,
1353
+ "eval_AGE_recall": 0.779874213836478,
1354
+ "eval_ALTI_f1": 0.20689655172413793,
1355
+ "eval_ALTI_number": 16,
1356
+ "eval_ALTI_precision": 0.23076923076923078,
1357
+ "eval_ALTI_recall": 0.1875,
1358
+ "eval_EMAIL_f1": 0.7027027027027027,
1359
+ "eval_EMAIL_number": 52,
1360
+ "eval_EMAIL_precision": 0.5416666666666666,
1361
+ "eval_EMAIL_recall": 1.0,
1362
+ "eval_GEOG_f1": 0.36363636363636365,
1363
+ "eval_GEOG_number": 9,
1364
+ "eval_GEOG_precision": 0.25,
1365
+ "eval_GEOG_recall": 0.6666666666666666,
1366
+ "eval_REGION_f1": 0.5545023696682464,
1367
+ "eval_REGION_number": 351,
1368
+ "eval_REGION_precision": 0.4746450304259635,
1369
+ "eval_REGION_recall": 0.6666666666666666,
1370
+ "eval_SITE_f1": 0.41408450704225347,
1371
+ "eval_SITE_number": 330,
1372
+ "eval_SITE_precision": 0.3868421052631579,
1373
+ "eval_SITE_recall": 0.44545454545454544,
1374
+ "eval_TAXA_f1": 0.7978241160471441,
1375
+ "eval_TAXA_number": 525,
1376
+ "eval_TAXA_precision": 0.7612456747404844,
1377
+ "eval_TAXA_recall": 0.8380952380952381,
1378
+ "eval_accuracy_entity": 0.955144977839483,
1379
+ "eval_accuracy_token": 0.955144977839483,
1380
+ "eval_f1_entity": 0.7586857682079438,
1381
+ "eval_f1_token": 0.7586857682079438,
1382
+ "eval_loss": 0.1583557277917862,
1383
+ "eval_overall_accuracy": 0.9541481995692493,
1384
+ "eval_overall_f1": 0.6250388319353837,
1385
+ "eval_overall_precision": 0.566122678671919,
1386
+ "eval_overall_recall": 0.6976421636615812,
1387
+ "eval_precision_entity": 0.7129958078039342,
1388
+ "eval_precision_token": 0.7129958078039342,
1389
+ "eval_recall_entity": 0.8106324472960587,
1390
+ "eval_recall_token": 0.8106324472960587,
1391
+ "eval_runtime": 12.1366,
1392
+ "eval_samples_per_second": 15.573,
1393
+ "eval_steps_per_second": 1.977,
1394
+ "step": 550
1395
+ },
1396
+ {
1397
+ "epoch": 14.09,
1398
+ "learning_rate": 1.0309278350515464e-06,
1399
+ "loss": 0.0405,
1400
+ "step": 560
1401
+ },
1402
+ {
1403
+ "epoch": 14.34,
1404
+ "learning_rate": 6.185567010309279e-07,
1405
+ "loss": 0.0448,
1406
+ "step": 570
1407
+ },
1408
+ {
1409
+ "epoch": 14.47,
1410
+ "eval_AGE_f1": 0.7163323782234957,
1411
+ "eval_AGE_number": 159,
1412
+ "eval_AGE_precision": 0.6578947368421053,
1413
+ "eval_AGE_recall": 0.7861635220125787,
1414
+ "eval_ALTI_f1": 0.20689655172413793,
1415
+ "eval_ALTI_number": 16,
1416
+ "eval_ALTI_precision": 0.23076923076923078,
1417
+ "eval_ALTI_recall": 0.1875,
1418
+ "eval_EMAIL_f1": 0.732394366197183,
1419
+ "eval_EMAIL_number": 52,
1420
+ "eval_EMAIL_precision": 0.5777777777777777,
1421
+ "eval_EMAIL_recall": 1.0,
1422
+ "eval_GEOG_f1": 0.36363636363636365,
1423
+ "eval_GEOG_number": 9,
1424
+ "eval_GEOG_precision": 0.25,
1425
+ "eval_GEOG_recall": 0.6666666666666666,
1426
+ "eval_REGION_f1": 0.56,
1427
+ "eval_REGION_number": 351,
1428
+ "eval_REGION_precision": 0.47695390781563124,
1429
+ "eval_REGION_recall": 0.6780626780626781,
1430
+ "eval_SITE_f1": 0.41310541310541316,
1431
+ "eval_SITE_number": 330,
1432
+ "eval_SITE_precision": 0.3897849462365591,
1433
+ "eval_SITE_recall": 0.4393939393939394,
1434
+ "eval_TAXA_f1": 0.7981735159817351,
1435
+ "eval_TAXA_number": 525,
1436
+ "eval_TAXA_precision": 0.7666666666666667,
1437
+ "eval_TAXA_recall": 0.8323809523809523,
1438
+ "eval_accuracy_entity": 0.9550203805557039,
1439
+ "eval_accuracy_token": 0.9550203805557039,
1440
+ "eval_f1_entity": 0.7577735784229513,
1441
+ "eval_f1_token": 0.7577735784229513,
1442
+ "eval_loss": 0.1591457575559616,
1443
+ "eval_overall_accuracy": 0.9540236022854702,
1444
+ "eval_overall_f1": 0.62875,
1445
+ "eval_overall_precision": 0.5722411831626849,
1446
+ "eval_overall_recall": 0.6976421636615812,
1447
+ "eval_precision_entity": 0.7129465007273315,
1448
+ "eval_precision_token": 0.7129465007273315,
1449
+ "eval_recall_entity": 0.8086159486709441,
1450
+ "eval_recall_token": 0.8086159486709441,
1451
+ "eval_runtime": 10.2385,
1452
+ "eval_samples_per_second": 18.46,
1453
+ "eval_steps_per_second": 2.344,
1454
+ "step": 575
1455
+ },
1456
+ {
1457
+ "epoch": 14.59,
1458
+ "learning_rate": 2.061855670103093e-07,
1459
+ "loss": 0.0413,
1460
+ "step": 580
1461
+ },
1462
+ {
1463
+ "epoch": 14.72,
1464
+ "step": 585,
1465
+ "total_flos": 4125504727794096.0,
1466
+ "train_loss": 0.23708797097206116,
1467
+ "train_runtime": 1988.5186,
1468
+ "train_samples_per_second": 9.572,
1469
+ "train_steps_per_second": 0.294
1470
+ }
1471
+ ],
1472
+ "max_steps": 585,
1473
+ "num_train_epochs": 15,
1474
+ "total_flos": 4125504727794096.0,
1475
+ "trial_name": null,
1476
+ "trial_params": null
1477
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3522745422ae3121f4d463384271ae3a8147e5e16a9d8b1cf4888806843b7d3f
3
+ size 4091