Adriane Boyd committed on
Commit
6b01c7e
·
1 Parent(s): 87aba3e

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -14,13 +14,13 @@ model-index:
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
- value: 0.8450704225
18
  - name: NER Recall
19
  type: recall
20
- value: 0.8301886792
21
  - name: NER F Score
22
  type: f_score
23
- value: 0.8375634518
24
  - task:
25
  name: TAG
26
  type: token-classification
@@ -34,7 +34,7 @@ model-index:
34
  metrics:
35
  - name: POS (UPOS) Accuracy
36
  type: accuracy
37
- value: 0.9793295403
38
  - task:
39
  name: MORPH
40
  type: token-classification
@@ -48,28 +48,28 @@ model-index:
48
  metrics:
49
  - name: Lemma Accuracy
50
  type: accuracy
51
- value: 0.965013864
52
  - task:
53
  name: UNLABELED_DEPENDENCIES
54
  type: token-classification
55
  metrics:
56
  - name: Unlabeled Attachment Score (UAS)
57
  type: f_score
58
- value: 0.9318744653
59
  - task:
60
  name: LABELED_DEPENDENCIES
61
  type: token-classification
62
  metrics:
63
  - name: Labeled Attachment Score (LAS)
64
  type: f_score
65
- value: 0.9208335209
66
  - task:
67
  name: SENTS
68
  type: token-classification
69
  metrics:
70
  - name: Sentences F-Score
71
  type: f_score
72
- value: 0.9469623915
73
  ---
74
  ### Details: https://spacy.io/models/ja#ja_core_news_trf
75
 
@@ -78,8 +78,8 @@ Japanese transformer pipeline (cl-tohoku/bert-base-japanese-char-v2). Components
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `ja_core_news_trf` |
81
- | **Version** | `3.3.0` |
82
- | **spaCy** | `>=3.3.0.dev0,<3.4.0` |
83
  | **Default Pipeline** | `transformer`, `morphologizer`, `parser`, `attribute_ruler`, `ner` |
84
  | **Components** | `transformer`, `morphologizer`, `parser`, `attribute_ruler`, `ner` |
85
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
@@ -109,18 +109,18 @@ Japanese transformer pipeline (cl-tohoku/bert-base-japanese-char-v2). Components
109
  | `TOKEN_P` | 97.65 |
110
  | `TOKEN_R` | 97.90 |
111
  | `TOKEN_F` | 97.77 |
112
- | `POS_ACC` | 97.93 |
113
  | `MORPH_ACC` | 0.00 |
114
  | `MORPH_MICRO_P` | 34.01 |
115
  | `MORPH_MICRO_R` | 98.04 |
116
  | `MORPH_MICRO_F` | 50.51 |
117
- | `SENTS_P` | 92.64 |
118
- | `SENTS_R` | 96.84 |
119
- | `SENTS_F` | 94.70 |
120
- | `DEP_UAS` | 93.19 |
121
- | `DEP_LAS` | 92.08 |
122
  | `TAG_ACC` | 97.12 |
123
- | `LEMMA_ACC` | 96.50 |
124
- | `ENTS_P` | 84.51 |
125
- | `ENTS_R` | 83.02 |
126
- | `ENTS_F` | 83.76 |
 
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
+ value: 0.8443037975
18
  - name: NER Recall
19
  type: recall
20
+ value: 0.8389937107
21
  - name: NER F Score
22
  type: f_score
23
+ value: 0.8416403785
24
  - task:
25
  name: TAG
26
  type: token-classification
 
34
  metrics:
35
  - name: POS (UPOS) Accuracy
36
  type: accuracy
37
+ value: 0.9806393516
38
  - task:
39
  name: MORPH
40
  type: token-classification
 
48
  metrics:
49
  - name: Lemma Accuracy
50
  type: accuracy
51
+ value: 0.9670526831
52
  - task:
53
  name: UNLABELED_DEPENDENCIES
54
  type: token-classification
55
  metrics:
56
  - name: Unlabeled Attachment Score (UAS)
57
  type: f_score
58
+ value: 0.9318325079
59
  - task:
60
  name: LABELED_DEPENDENCIES
61
  type: token-classification
62
  metrics:
63
  - name: Labeled Attachment Score (LAS)
64
  type: f_score
65
+ value: 0.9202448465
66
  - task:
67
  name: SENTS
68
  type: token-classification
69
  metrics:
70
  - name: Sentences F-Score
71
  type: f_score
72
+ value: 0.9794319295
73
  ---
74
  ### Details: https://spacy.io/models/ja#ja_core_news_trf
75
 
 
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `ja_core_news_trf` |
81
+ | **Version** | `3.4.0` |
82
+ | **spaCy** | `>=3.4.0,<3.5.0` |
83
  | **Default Pipeline** | `transformer`, `morphologizer`, `parser`, `attribute_ruler`, `ner` |
84
  | **Components** | `transformer`, `morphologizer`, `parser`, `attribute_ruler`, `ner` |
85
  | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
 
109
  | `TOKEN_P` | 97.65 |
110
  | `TOKEN_R` | 97.90 |
111
  | `TOKEN_F` | 97.77 |
112
+ | `POS_ACC` | 98.06 |
113
  | `MORPH_ACC` | 0.00 |
114
  | `MORPH_MICRO_P` | 34.01 |
115
  | `MORPH_MICRO_R` | 98.04 |
116
  | `MORPH_MICRO_F` | 50.51 |
117
+ | `SENTS_P` | 97.28 |
118
+ | `SENTS_R` | 98.62 |
119
+ | `SENTS_F` | 97.94 |
120
+ | `DEP_UAS` | 93.18 |
121
+ | `DEP_LAS` | 92.02 |
122
  | `TAG_ACC` | 97.12 |
123
+ | `LEMMA_ACC` | 96.71 |
124
+ | `ENTS_P` | 84.43 |
125
+ | `ENTS_R` | 83.90 |
126
+ | `ENTS_F` | 84.16 |
accuracy.json CHANGED
@@ -3,7 +3,7 @@
3
  "token_p": 0.9764591282,
4
  "token_r": 0.9790021974,
5
  "token_f": 0.9777290092,
6
- "pos_acc": 0.9793295403,
7
  "morph_acc": 0.0,
8
  "morph_micro_p": 0.3401360544,
9
  "morph_micro_r": 0.9803921569,
@@ -25,31 +25,31 @@
25
  "f": 0.0
26
  }
27
  },
28
- "sents_p": 0.9264150943,
29
- "sents_r": 0.9684418146,
30
- "sents_f": 0.9469623915,
31
- "dep_uas": 0.9318744653,
32
- "dep_las": 0.9208335209,
33
  "dep_las_per_type": {
34
  "cc": {
35
- "p": 0.9130434783,
36
- "r": 0.875,
37
- "f": 0.8936170213
38
  },
39
  "compound": {
40
- "p": 0.953364817,
41
- "r": 0.9103720406,
42
- "f": 0.931372549
43
  },
44
  "obl": {
45
- "p": 0.8539325843,
46
- "r": 0.8539325843,
47
- "f": 0.8539325843
48
  },
49
  "case": {
50
- "p": 0.9843630816,
51
  "r": 0.9806231003,
52
- "f": 0.9824895318
53
  },
54
  "dislocated": {
55
  "p": 0.7,
@@ -57,74 +57,74 @@
57
  "f": 0.6086956522
58
  },
59
  "nsubj": {
60
- "p": 0.8560460653,
61
- "r": 0.8560460653,
62
- "f": 0.8560460653
63
  },
64
  "nmod": {
65
- "p": 0.9140722291,
66
- "r": 0.8584795322,
67
- "f": 0.8854041013
68
  },
69
  "root": {
70
- "p": 0.9259962049,
71
- "r": 0.9625246548,
72
- "f": 0.9439071567
73
  },
74
  "aux": {
75
- "p": 0.9820075758,
76
- "r": 0.9628597957,
77
- "f": 0.972339428
78
  },
79
  "advcl": {
80
- "p": 0.7400881057,
81
- "r": 0.7550561798,
82
- "f": 0.7474972191
83
  },
84
  "mark": {
85
- "p": 0.9754098361,
86
- "r": 0.952,
87
- "f": 0.963562753
88
  },
89
  "fixed": {
90
- "p": 0.9642218247,
91
  "r": 0.98,
92
- "f": 0.9720468891
93
  },
94
  "acl": {
95
- "p": 0.8886414254,
96
- "r": 0.8769230769,
97
- "f": 0.8827433628
98
  },
99
  "obj": {
100
- "p": 0.9635258359,
101
- "r": 0.9577039275,
102
- "f": 0.9606060606
103
  },
104
  "nummod": {
105
- "p": 0.9868421053,
106
- "r": 0.8875739645,
107
- "f": 0.9345794393
108
  },
109
  "advmod": {
110
- "p": 0.78125,
111
- "r": 0.7142857143,
112
- "f": 0.7462686567
113
  },
114
  "amod": {
115
- "p": 0.9333333333,
116
- "r": 0.7567567568,
117
- "f": 0.8358208955
118
  },
119
  "cop": {
120
- "p": 0.9653179191,
121
- "r": 0.9709302326,
122
- "f": 0.968115942
123
  },
124
  "ccomp": {
125
- "p": 0.9047619048,
126
- "r": 0.8636363636,
127
- "f": 0.8837209302
128
  },
129
  "det": {
130
  "p": 1.0,
@@ -132,111 +132,111 @@
132
  "f": 0.9904761905
133
  },
134
  "csubj": {
135
- "p": 0.7142857143,
136
  "r": 0.8333333333,
137
- "f": 0.7692307692
138
  },
139
  "dep": {
140
- "p": 0.375,
141
  "r": 0.4285714286,
142
- "f": 0.4
143
  }
144
  },
145
  "tag_acc": 0.9712488769,
146
- "lemma_acc": 0.965013864,
147
- "ents_p": 0.8450704225,
148
- "ents_r": 0.8301886792,
149
- "ents_f": 0.8375634518,
150
  "ents_per_type": {
151
  "DATE": {
152
- "p": 0.9722222222,
153
- "r": 0.9633027523,
154
- "f": 0.9677419355
155
  },
156
  "ORG": {
157
- "p": 0.7633587786,
158
- "r": 0.7299270073,
159
- "f": 0.7462686567
160
  },
161
  "TITLE_AFFIX": {
162
- "p": 0.8214285714,
163
- "r": 0.7666666667,
164
- "f": 0.7931034483
165
  },
166
  "PERSON": {
167
- "p": 0.9124087591,
168
- "r": 0.8992805755,
169
- "f": 0.9057971014
170
  },
171
  "GPE": {
172
- "p": 0.82,
173
- "r": 0.8723404255,
174
- "f": 0.8453608247
175
- },
176
- "PRODUCT": {
177
- "p": 0.6666666667,
178
- "r": 0.619047619,
179
- "f": 0.6419753086
180
  },
181
  "TIME": {
182
- "p": 0.8,
183
  "r": 1.0,
184
- "f": 0.8888888889
185
  },
186
  "QUANTITY": {
187
- "p": 0.84,
188
- "r": 0.9545454545,
189
- "f": 0.8936170213
190
  },
191
  "NORP": {
192
- "p": 0.6666666667,
193
- "r": 0.625,
194
- "f": 0.6451612903
195
  },
196
  "ORDINAL": {
197
- "p": 0.7619047619,
198
  "r": 0.7272727273,
199
- "f": 0.7441860465
200
  },
201
  "WORK_OF_ART": {
202
- "p": 0.9285714286,
203
- "r": 0.7647058824,
204
- "f": 0.8387096774
205
- },
206
- "CARDINAL": {
207
- "p": 1.0,
208
- "r": 0.5,
209
- "f": 0.6666666667
210
  },
211
  "PERCENT": {
212
  "p": 1.0,
213
- "r": 0.7142857143,
214
- "f": 0.8333333333
 
 
 
 
 
215
  },
216
  "EVENT": {
217
- "p": 0.9565217391,
218
- "r": 0.8461538462,
219
- "f": 0.8979591837
 
 
 
 
 
220
  },
221
  "FAC": {
222
- "p": 0.875,
223
- "r": 0.7567567568,
224
- "f": 0.8115942029
225
  },
226
  "LOC": {
227
- "p": 0.7272727273,
228
  "r": 0.8,
229
- "f": 0.7619047619
230
  },
231
  "MOVEMENT": {
232
- "p": 0.75,
233
- "r": 0.6,
234
- "f": 0.6666666667
235
  },
236
  "LAW": {
237
- "p": 0.75,
238
- "r": 1.0,
239
- "f": 0.8571428571
240
  },
241
  "MONEY": {
242
  "p": 1.0,
@@ -247,7 +247,12 @@
247
  "p": 1.0,
248
  "r": 1.0,
249
  "f": 1.0
 
 
 
 
 
250
  }
251
  },
252
- "speed": 535.904305803
253
  }
 
3
  "token_p": 0.9764591282,
4
  "token_r": 0.9790021974,
5
  "token_f": 0.9777290092,
6
+ "pos_acc": 0.9806393516,
7
  "morph_acc": 0.0,
8
  "morph_micro_p": 0.3401360544,
9
  "morph_micro_r": 0.9803921569,
 
25
  "f": 0.0
26
  }
27
  },
28
+ "sents_p": 0.9727626459,
29
+ "sents_r": 0.9861932939,
30
+ "sents_f": 0.9794319295,
31
+ "dep_uas": 0.9318325079,
32
+ "dep_las": 0.9202448465,
33
  "dep_las_per_type": {
34
  "cc": {
35
+ "p": 0.8958333333,
36
+ "r": 0.8958333333,
37
+ "f": 0.8958333333
38
  },
39
  "compound": {
40
+ "p": 0.9542755344,
41
+ "r": 0.9058624577,
42
+ "f": 0.9294389821
43
  },
44
  "obl": {
45
+ "p": 0.8513513514,
46
+ "r": 0.8651685393,
47
+ "f": 0.8582043344
48
  },
49
  "case": {
50
+ "p": 0.9873756695,
51
  "r": 0.9806231003,
52
+ "f": 0.9839878002
53
  },
54
  "dislocated": {
55
  "p": 0.7,
 
57
  "f": 0.6086956522
58
  },
59
  "nsubj": {
60
+ "p": 0.8549323017,
61
+ "r": 0.8483685221,
62
+ "f": 0.8516377649
63
  },
64
  "nmod": {
65
+ "p": 0.9195979899,
66
+ "r": 0.8561403509,
67
+ "f": 0.8867353119
68
  },
69
  "root": {
70
+ "p": 0.9486166008,
71
+ "r": 0.9467455621,
72
+ "f": 0.9476801579
73
  },
74
  "aux": {
75
+ "p": 0.9794776119,
76
+ "r": 0.9749303621,
77
+ "f": 0.9771986971
78
  },
79
  "advcl": {
80
+ "p": 0.7342342342,
81
+ "r": 0.7325842697,
82
+ "f": 0.733408324
83
  },
84
  "mark": {
85
+ "p": 0.9757575758,
86
+ "r": 0.966,
87
+ "f": 0.9708542714
88
  },
89
  "fixed": {
90
+ "p": 0.9659498208,
91
  "r": 0.98,
92
+ "f": 0.9729241877
93
  },
94
  "acl": {
95
+ "p": 0.8608695652,
96
+ "r": 0.8703296703,
97
+ "f": 0.8655737705
98
  },
99
  "obj": {
100
+ "p": 0.9386503067,
101
+ "r": 0.9244712991,
102
+ "f": 0.9315068493
103
  },
104
  "nummod": {
105
+ "p": 0.9871794872,
106
+ "r": 0.9112426036,
107
+ "f": 0.9476923077
108
  },
109
  "advmod": {
110
+ "p": 0.7851851852,
111
+ "r": 0.7571428571,
112
+ "f": 0.7709090909
113
  },
114
  "amod": {
115
+ "p": 0.9666666667,
116
+ "r": 0.7837837838,
117
+ "f": 0.8656716418
118
  },
119
  "cop": {
120
+ "p": 0.9822485207,
121
+ "r": 0.9651162791,
122
+ "f": 0.9736070381
123
  },
124
  "ccomp": {
125
+ "p": 1.0,
126
+ "r": 0.8181818182,
127
+ "f": 0.9
128
  },
129
  "det": {
130
  "p": 1.0,
 
132
  "f": 0.9904761905
133
  },
134
  "csubj": {
135
+ "p": 0.6666666667,
136
  "r": 0.8333333333,
137
+ "f": 0.7407407407
138
  },
139
  "dep": {
140
+ "p": 0.3,
141
  "r": 0.4285714286,
142
+ "f": 0.3529411765
143
  }
144
  },
145
  "tag_acc": 0.9712488769,
146
+ "lemma_acc": 0.9670526831,
147
+ "ents_p": 0.8443037975,
148
+ "ents_r": 0.8389937107,
149
+ "ents_f": 0.8416403785,
150
  "ents_per_type": {
151
  "DATE": {
152
+ "p": 0.9907407407,
153
+ "r": 0.9816513761,
154
+ "f": 0.9861751152
155
  },
156
  "ORG": {
157
+ "p": 0.7941176471,
158
+ "r": 0.7883211679,
159
+ "f": 0.7912087912
160
  },
161
  "TITLE_AFFIX": {
162
+ "p": 0.8695652174,
163
+ "r": 0.6666666667,
164
+ "f": 0.7547169811
165
  },
166
  "PERSON": {
167
+ "p": 0.9007092199,
168
+ "r": 0.9136690647,
169
+ "f": 0.9071428571
170
  },
171
  "GPE": {
172
+ "p": 0.8315789474,
173
+ "r": 0.8404255319,
174
+ "f": 0.835978836
 
 
 
 
 
175
  },
176
  "TIME": {
177
+ "p": 1.0,
178
  "r": 1.0,
179
+ "f": 1.0
180
  },
181
  "QUANTITY": {
182
+ "p": 0.8533333333,
183
+ "r": 0.9696969697,
184
+ "f": 0.9078014184
185
  },
186
  "NORP": {
187
+ "p": 0.7419354839,
188
+ "r": 0.71875,
189
+ "f": 0.7301587302
190
  },
191
  "ORDINAL": {
192
+ "p": 0.6956521739,
193
  "r": 0.7272727273,
194
+ "f": 0.7111111111
195
  },
196
  "WORK_OF_ART": {
197
+ "p": 0.8235294118,
198
+ "r": 0.8235294118,
199
+ "f": 0.8235294118
 
 
 
 
 
200
  },
201
  "PERCENT": {
202
  "p": 1.0,
203
+ "r": 0.8571428571,
204
+ "f": 0.9230769231
205
+ },
206
+ "CARDINAL": {
207
+ "p": 0.0,
208
+ "r": 0.0,
209
+ "f": 0.0
210
  },
211
  "EVENT": {
212
+ "p": 1.0,
213
+ "r": 0.9230769231,
214
+ "f": 0.96
215
+ },
216
+ "PRODUCT": {
217
+ "p": 0.6216216216,
218
+ "r": 0.5476190476,
219
+ "f": 0.582278481
220
  },
221
  "FAC": {
222
+ "p": 0.7941176471,
223
+ "r": 0.7297297297,
224
+ "f": 0.7605633803
225
  },
226
  "LOC": {
227
+ "p": 0.5714285714,
228
  "r": 0.8,
229
+ "f": 0.6666666667
230
  },
231
  "MOVEMENT": {
232
+ "p": 0.4,
233
+ "r": 0.4,
234
+ "f": 0.4
235
  },
236
  "LAW": {
237
+ "p": 0.6666666667,
238
+ "r": 0.6666666667,
239
+ "f": 0.6666666667
240
  },
241
  "MONEY": {
242
  "p": 1.0,
 
247
  "p": 1.0,
248
  "r": 1.0,
249
  "f": 1.0
250
+ },
251
+ "PET_NAME": {
252
+ "p": 0.0,
253
+ "r": 0.0,
254
+ "f": 0.0
255
  }
256
  },
257
+ "speed": 2829.1916919204
258
  }
ja_core_news_trf-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e447967dc1d3f4f2c344157bf13b07b39122e9235c8189405cc377aef5010bd7
3
- size 337884057
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:51f0142b124a407acdd90fa60ec9eb4a4908fa9c85c98dfe50d83b827208f3d7
3
+ size 337884760
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"ja",
3
  "name":"core_news_trf",
4
- "version":"3.3.0",
5
  "description":"Japanese transformer pipeline (cl-tohoku/bert-base-japanese-char-v2). Components: transformer, morphologizer, parser, ner.",
6
  "author":"Explosion",
7
  "email":"[email protected]",
8
  "url":"https://explosion.ai",
9
  "license":"CC BY-SA 3.0",
10
- "spacy_version":">=3.3.0.dev0,<3.4.0",
11
- "spacy_git_version":"849bef2de",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
@@ -115,7 +115,7 @@
115
  "token_p":0.9764591282,
116
  "token_r":0.9790021974,
117
  "token_f":0.9777290092,
118
- "pos_acc":0.9793295403,
119
  "morph_acc":0.0,
120
  "morph_micro_p":0.3401360544,
121
  "morph_micro_r":0.9803921569,
@@ -137,31 +137,31 @@
137
  "f":0.0
138
  }
139
  },
140
- "sents_p":0.9264150943,
141
- "sents_r":0.9684418146,
142
- "sents_f":0.9469623915,
143
- "dep_uas":0.9318744653,
144
- "dep_las":0.9208335209,
145
  "dep_las_per_type":{
146
  "cc":{
147
- "p":0.9130434783,
148
- "r":0.875,
149
- "f":0.8936170213
150
  },
151
  "compound":{
152
- "p":0.953364817,
153
- "r":0.9103720406,
154
- "f":0.931372549
155
  },
156
  "obl":{
157
- "p":0.8539325843,
158
- "r":0.8539325843,
159
- "f":0.8539325843
160
  },
161
  "case":{
162
- "p":0.9843630816,
163
  "r":0.9806231003,
164
- "f":0.9824895318
165
  },
166
  "dislocated":{
167
  "p":0.7,
@@ -169,74 +169,74 @@
169
  "f":0.6086956522
170
  },
171
  "nsubj":{
172
- "p":0.8560460653,
173
- "r":0.8560460653,
174
- "f":0.8560460653
175
  },
176
  "nmod":{
177
- "p":0.9140722291,
178
- "r":0.8584795322,
179
- "f":0.8854041013
180
  },
181
  "root":{
182
- "p":0.9259962049,
183
- "r":0.9625246548,
184
- "f":0.9439071567
185
  },
186
  "aux":{
187
- "p":0.9820075758,
188
- "r":0.9628597957,
189
- "f":0.972339428
190
  },
191
  "advcl":{
192
- "p":0.7400881057,
193
- "r":0.7550561798,
194
- "f":0.7474972191
195
  },
196
  "mark":{
197
- "p":0.9754098361,
198
- "r":0.952,
199
- "f":0.963562753
200
  },
201
  "fixed":{
202
- "p":0.9642218247,
203
  "r":0.98,
204
- "f":0.9720468891
205
  },
206
  "acl":{
207
- "p":0.8886414254,
208
- "r":0.8769230769,
209
- "f":0.8827433628
210
  },
211
  "obj":{
212
- "p":0.9635258359,
213
- "r":0.9577039275,
214
- "f":0.9606060606
215
  },
216
  "nummod":{
217
- "p":0.9868421053,
218
- "r":0.8875739645,
219
- "f":0.9345794393
220
  },
221
  "advmod":{
222
- "p":0.78125,
223
- "r":0.7142857143,
224
- "f":0.7462686567
225
  },
226
  "amod":{
227
- "p":0.9333333333,
228
- "r":0.7567567568,
229
- "f":0.8358208955
230
  },
231
  "cop":{
232
- "p":0.9653179191,
233
- "r":0.9709302326,
234
- "f":0.968115942
235
  },
236
  "ccomp":{
237
- "p":0.9047619048,
238
- "r":0.8636363636,
239
- "f":0.8837209302
240
  },
241
  "det":{
242
  "p":1.0,
@@ -244,111 +244,111 @@
244
  "f":0.9904761905
245
  },
246
  "csubj":{
247
- "p":0.7142857143,
248
  "r":0.8333333333,
249
- "f":0.7692307692
250
  },
251
  "dep":{
252
- "p":0.375,
253
  "r":0.4285714286,
254
- "f":0.4
255
  }
256
  },
257
  "tag_acc":0.9712488769,
258
- "lemma_acc":0.965013864,
259
- "ents_p":0.8450704225,
260
- "ents_r":0.8301886792,
261
- "ents_f":0.8375634518,
262
  "ents_per_type":{
263
  "DATE":{
264
- "p":0.9722222222,
265
- "r":0.9633027523,
266
- "f":0.9677419355
267
  },
268
  "ORG":{
269
- "p":0.7633587786,
270
- "r":0.7299270073,
271
- "f":0.7462686567
272
  },
273
  "TITLE_AFFIX":{
274
- "p":0.8214285714,
275
- "r":0.7666666667,
276
- "f":0.7931034483
277
  },
278
  "PERSON":{
279
- "p":0.9124087591,
280
- "r":0.8992805755,
281
- "f":0.9057971014
282
  },
283
  "GPE":{
284
- "p":0.82,
285
- "r":0.8723404255,
286
- "f":0.8453608247
287
- },
288
- "PRODUCT":{
289
- "p":0.6666666667,
290
- "r":0.619047619,
291
- "f":0.6419753086
292
  },
293
  "TIME":{
294
- "p":0.8,
295
  "r":1.0,
296
- "f":0.8888888889
297
  },
298
  "QUANTITY":{
299
- "p":0.84,
300
- "r":0.9545454545,
301
- "f":0.8936170213
302
  },
303
  "NORP":{
304
- "p":0.6666666667,
305
- "r":0.625,
306
- "f":0.6451612903
307
  },
308
  "ORDINAL":{
309
- "p":0.7619047619,
310
  "r":0.7272727273,
311
- "f":0.7441860465
312
  },
313
  "WORK_OF_ART":{
314
- "p":0.9285714286,
315
- "r":0.7647058824,
316
- "f":0.8387096774
317
- },
318
- "CARDINAL":{
319
- "p":1.0,
320
- "r":0.5,
321
- "f":0.6666666667
322
  },
323
  "PERCENT":{
324
  "p":1.0,
325
- "r":0.7142857143,
326
- "f":0.8333333333
 
 
 
 
 
327
  },
328
  "EVENT":{
329
- "p":0.9565217391,
330
- "r":0.8461538462,
331
- "f":0.8979591837
 
 
 
 
 
332
  },
333
  "FAC":{
334
- "p":0.875,
335
- "r":0.7567567568,
336
- "f":0.8115942029
337
  },
338
  "LOC":{
339
- "p":0.7272727273,
340
  "r":0.8,
341
- "f":0.7619047619
342
  },
343
  "MOVEMENT":{
344
- "p":0.75,
345
- "r":0.6,
346
- "f":0.6666666667
347
  },
348
  "LAW":{
349
- "p":0.75,
350
- "r":1.0,
351
- "f":0.8571428571
352
  },
353
  "MONEY":{
354
  "p":1.0,
@@ -359,9 +359,14 @@
359
  "p":1.0,
360
  "r":1.0,
361
  "f":1.0
 
 
 
 
 
362
  }
363
  },
364
- "speed":535.904305803
365
  },
366
  "sources":[
367
  {
 
1
  {
2
  "lang":"ja",
3
  "name":"core_news_trf",
4
+ "version":"3.4.0",
5
  "description":"Japanese transformer pipeline (cl-tohoku/bert-base-japanese-char-v2). Components: transformer, morphologizer, parser, ner.",
6
  "author":"Explosion",
7
  "email":"[email protected]",
8
  "url":"https://explosion.ai",
9
  "license":"CC BY-SA 3.0",
10
+ "spacy_version":">=3.4.0,<3.5.0",
11
+ "spacy_git_version":"dd038b536",
12
  "vectors":{
13
  "width":0,
14
  "vectors":0,
 
115
  "token_p":0.9764591282,
116
  "token_r":0.9790021974,
117
  "token_f":0.9777290092,
118
+ "pos_acc":0.9806393516,
119
  "morph_acc":0.0,
120
  "morph_micro_p":0.3401360544,
121
  "morph_micro_r":0.9803921569,
 
137
  "f":0.0
138
  }
139
  },
140
+ "sents_p":0.9727626459,
141
+ "sents_r":0.9861932939,
142
+ "sents_f":0.9794319295,
143
+ "dep_uas":0.9318325079,
144
+ "dep_las":0.9202448465,
145
  "dep_las_per_type":{
146
  "cc":{
147
+ "p":0.8958333333,
148
+ "r":0.8958333333,
149
+ "f":0.8958333333
150
  },
151
  "compound":{
152
+ "p":0.9542755344,
153
+ "r":0.9058624577,
154
+ "f":0.9294389821
155
  },
156
  "obl":{
157
+ "p":0.8513513514,
158
+ "r":0.8651685393,
159
+ "f":0.8582043344
160
  },
161
  "case":{
162
+ "p":0.9873756695,
163
  "r":0.9806231003,
164
+ "f":0.9839878002
165
  },
166
  "dislocated":{
167
  "p":0.7,
 
169
  "f":0.6086956522
170
  },
171
  "nsubj":{
172
+ "p":0.8549323017,
173
+ "r":0.8483685221,
174
+ "f":0.8516377649
175
  },
176
  "nmod":{
177
+ "p":0.9195979899,
178
+ "r":0.8561403509,
179
+ "f":0.8867353119
180
  },
181
  "root":{
182
+ "p":0.9486166008,
183
+ "r":0.9467455621,
184
+ "f":0.9476801579
185
  },
186
  "aux":{
187
+ "p":0.9794776119,
188
+ "r":0.9749303621,
189
+ "f":0.9771986971
190
  },
191
  "advcl":{
192
+ "p":0.7342342342,
193
+ "r":0.7325842697,
194
+ "f":0.733408324
195
  },
196
  "mark":{
197
+ "p":0.9757575758,
198
+ "r":0.966,
199
+ "f":0.9708542714
200
  },
201
  "fixed":{
202
+ "p":0.9659498208,
203
  "r":0.98,
204
+ "f":0.9729241877
205
  },
206
  "acl":{
207
+ "p":0.8608695652,
208
+ "r":0.8703296703,
209
+ "f":0.8655737705
210
  },
211
  "obj":{
212
+ "p":0.9386503067,
213
+ "r":0.9244712991,
214
+ "f":0.9315068493
215
  },
216
  "nummod":{
217
+ "p":0.9871794872,
218
+ "r":0.9112426036,
219
+ "f":0.9476923077
220
  },
221
  "advmod":{
222
+ "p":0.7851851852,
223
+ "r":0.7571428571,
224
+ "f":0.7709090909
225
  },
226
  "amod":{
227
+ "p":0.9666666667,
228
+ "r":0.7837837838,
229
+ "f":0.8656716418
230
  },
231
  "cop":{
232
+ "p":0.9822485207,
233
+ "r":0.9651162791,
234
+ "f":0.9736070381
235
  },
236
  "ccomp":{
237
+ "p":1.0,
238
+ "r":0.8181818182,
239
+ "f":0.9
240
  },
241
  "det":{
242
  "p":1.0,
 
244
  "f":0.9904761905
245
  },
246
  "csubj":{
247
+ "p":0.6666666667,
248
  "r":0.8333333333,
249
+ "f":0.7407407407
250
  },
251
  "dep":{
252
+ "p":0.3,
253
  "r":0.4285714286,
254
+ "f":0.3529411765
255
  }
256
  },
257
  "tag_acc":0.9712488769,
258
+ "lemma_acc":0.9670526831,
259
+ "ents_p":0.8443037975,
260
+ "ents_r":0.8389937107,
261
+ "ents_f":0.8416403785,
262
  "ents_per_type":{
263
  "DATE":{
264
+ "p":0.9907407407,
265
+ "r":0.9816513761,
266
+ "f":0.9861751152
267
  },
268
  "ORG":{
269
+ "p":0.7941176471,
270
+ "r":0.7883211679,
271
+ "f":0.7912087912
272
  },
273
  "TITLE_AFFIX":{
274
+ "p":0.8695652174,
275
+ "r":0.6666666667,
276
+ "f":0.7547169811
277
  },
278
  "PERSON":{
279
+ "p":0.9007092199,
280
+ "r":0.9136690647,
281
+ "f":0.9071428571
282
  },
283
  "GPE":{
284
+ "p":0.8315789474,
285
+ "r":0.8404255319,
286
+ "f":0.835978836
 
 
 
 
 
287
  },
288
  "TIME":{
289
+ "p":1.0,
290
  "r":1.0,
291
+ "f":1.0
292
  },
293
  "QUANTITY":{
294
+ "p":0.8533333333,
295
+ "r":0.9696969697,
296
+ "f":0.9078014184
297
  },
298
  "NORP":{
299
+ "p":0.7419354839,
300
+ "r":0.71875,
301
+ "f":0.7301587302
302
  },
303
  "ORDINAL":{
304
+ "p":0.6956521739,
305
  "r":0.7272727273,
306
+ "f":0.7111111111
307
  },
308
  "WORK_OF_ART":{
309
+ "p":0.8235294118,
310
+ "r":0.8235294118,
311
+ "f":0.8235294118
 
 
 
 
 
312
  },
313
  "PERCENT":{
314
  "p":1.0,
315
+ "r":0.8571428571,
316
+ "f":0.9230769231
317
+ },
318
+ "CARDINAL":{
319
+ "p":0.0,
320
+ "r":0.0,
321
+ "f":0.0
322
  },
323
  "EVENT":{
324
+ "p":1.0,
325
+ "r":0.9230769231,
326
+ "f":0.96
327
+ },
328
+ "PRODUCT":{
329
+ "p":0.6216216216,
330
+ "r":0.5476190476,
331
+ "f":0.582278481
332
  },
333
  "FAC":{
334
+ "p":0.7941176471,
335
+ "r":0.7297297297,
336
+ "f":0.7605633803
337
  },
338
  "LOC":{
339
+ "p":0.5714285714,
340
  "r":0.8,
341
+ "f":0.6666666667
342
  },
343
  "MOVEMENT":{
344
+ "p":0.4,
345
+ "r":0.4,
346
+ "f":0.4
347
  },
348
  "LAW":{
349
+ "p":0.6666666667,
350
+ "r":0.6666666667,
351
+ "f":0.6666666667
352
  },
353
  "MONEY":{
354
  "p":1.0,
 
359
  "p":1.0,
360
  "r":1.0,
361
  "f":1.0
362
+ },
363
+ "PET_NAME":{
364
+ "p":0.0,
365
+ "r":0.0,
366
+ "f":0.0
367
  }
368
  },
369
+ "speed":2829.1916919204
370
  },
371
  "sources":[
372
  {
morphologizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f550659b90f141f19c15eadc29e768f3ab3acdf443be69351a0954215a011887
3
  size 59084
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c2d8ebad0d05f95532763df7e037c200a53b3d967a4780ce3b200376e0b9b7e
3
  size 59084
ner/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:61adab28c0b15f08b8326b9f611f369f9b42a0a5c5760c91ce21b4ed41fd1d7d
3
  size 338861
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d88fa5c2720aa1ab707719d91fdd75ea8303709f648f5cd8df889235cd294ed8
3
  size 338861
parser/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e1360ceabe0f7737e425e42270b8767811c89aec5602ed52d753f9de6521f42c
3
  size 318612
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c420287c381609578c2f76348243a44c556d2471fef08cbaf03c42d4b7203045
3
  size 318612
transformer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:62c9c29146b6c9f19aaa658d4972cb6f20fc45f4b7bf7bf820e2aae397f306c8
3
- size 363145603
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb035744014008c4e09ccf237f08798a9265a4aed19e93828f47f30270674813
3
+ size 363145638
vocab/strings.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0a7f2048b4765a1e1ef23263c78eff7d7a3037be7018e269628c21833a476d8b
3
- size 1601276
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8c4c085e460d965216188fcf475275929e8562fdc40ea14f82e344c84faed30
3
+ size 1600684