Frenchizer committed on
Commit
36f3e0c
·
verified ·
1 Parent(s): 0f76bc2

Upload meta.json

Browse files
Files changed (1) hide show
  1. en_core_web_sm/meta.json +522 -0
en_core_web_sm/meta.json ADDED
@@ -0,0 +1,522 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "lang":"en",
3
+ "name":"core_web_sm",
4
+ "version":"3.8.0",
5
+ "description":"English pipeline optimized for CPU. Components: tok2vec, tagger, parser, senter, ner, attribute_ruler, lemmatizer.",
6
+ "author":"Explosion",
7
+ "email":"contact@explosion.ai",
8
+ "url":"https://explosion.ai",
9
+ "license":"MIT",
10
+ "spacy_version":">=3.8.0,<3.9.0",
11
+ "spacy_git_version":"5010fcbd3",
12
+ "vectors":{
13
+ "width":0,
14
+ "vectors":0,
15
+ "keys":0,
16
+ "name":null,
17
+ "mode":"default"
18
+ },
19
+ "labels":{
20
+ "tok2vec":[
21
+
22
+ ],
23
+ "tagger":[
24
+ "$",
25
+ "''",
26
+ ",",
27
+ "-LRB-",
28
+ "-RRB-",
29
+ ".",
30
+ ":",
31
+ "ADD",
32
+ "AFX",
33
+ "CC",
34
+ "CD",
35
+ "DT",
36
+ "EX",
37
+ "FW",
38
+ "HYPH",
39
+ "IN",
40
+ "JJ",
41
+ "JJR",
42
+ "JJS",
43
+ "LS",
44
+ "MD",
45
+ "NFP",
46
+ "NN",
47
+ "NNP",
48
+ "NNPS",
49
+ "NNS",
50
+ "PDT",
51
+ "POS",
52
+ "PRP",
53
+ "PRP$",
54
+ "RB",
55
+ "RBR",
56
+ "RBS",
57
+ "RP",
58
+ "SYM",
59
+ "TO",
60
+ "UH",
61
+ "VB",
62
+ "VBD",
63
+ "VBG",
64
+ "VBN",
65
+ "VBP",
66
+ "VBZ",
67
+ "WDT",
68
+ "WP",
69
+ "WP$",
70
+ "WRB",
71
+ "XX",
72
+ "_SP",
73
+ "``"
74
+ ],
75
+ "parser":[
76
+ "ROOT",
77
+ "acl",
78
+ "acomp",
79
+ "advcl",
80
+ "advmod",
81
+ "agent",
82
+ "amod",
83
+ "appos",
84
+ "attr",
85
+ "aux",
86
+ "auxpass",
87
+ "case",
88
+ "cc",
89
+ "ccomp",
90
+ "compound",
91
+ "conj",
92
+ "csubj",
93
+ "csubjpass",
94
+ "dative",
95
+ "dep",
96
+ "det",
97
+ "dobj",
98
+ "expl",
99
+ "intj",
100
+ "mark",
101
+ "meta",
102
+ "neg",
103
+ "nmod",
104
+ "npadvmod",
105
+ "nsubj",
106
+ "nsubjpass",
107
+ "nummod",
108
+ "oprd",
109
+ "parataxis",
110
+ "pcomp",
111
+ "pobj",
112
+ "poss",
113
+ "preconj",
114
+ "predet",
115
+ "prep",
116
+ "prt",
117
+ "punct",
118
+ "quantmod",
119
+ "relcl",
120
+ "xcomp"
121
+ ],
122
+ "attribute_ruler":[
123
+
124
+ ],
125
+ "lemmatizer":[
126
+
127
+ ],
128
+ "ner":[
129
+ "CARDINAL",
130
+ "DATE",
131
+ "EVENT",
132
+ "FAC",
133
+ "GPE",
134
+ "LANGUAGE",
135
+ "LAW",
136
+ "LOC",
137
+ "MONEY",
138
+ "NORP",
139
+ "ORDINAL",
140
+ "ORG",
141
+ "PERCENT",
142
+ "PERSON",
143
+ "PRODUCT",
144
+ "QUANTITY",
145
+ "TIME",
146
+ "WORK_OF_ART"
147
+ ]
148
+ },
149
+ "pipeline":[
150
+ "tok2vec",
151
+ "tagger",
152
+ "parser",
153
+ "attribute_ruler",
154
+ "lemmatizer",
155
+ "ner"
156
+ ],
157
+ "components":[
158
+ "tok2vec",
159
+ "tagger",
160
+ "parser",
161
+ "senter",
162
+ "attribute_ruler",
163
+ "lemmatizer",
164
+ "ner"
165
+ ],
166
+ "disabled":[
167
+ "senter"
168
+ ],
169
+ "performance":{
170
+ "token_acc":0.9986194413,
171
+ "token_p":0.9956819193,
172
+ "token_r":0.9957659295,
173
+ "token_f":0.9957239226,
174
+ "tag_acc":0.972937262,
175
+ "sents_p":0.9200841934,
176
+ "sents_r":0.8939244013,
177
+ "sents_f":0.9068156724,
178
+ "dep_uas":0.9176955214,
179
+ "dep_las":0.8991533598,
180
+ "dep_las_per_type":{
181
+ "prep":{
182
+ "p":0.8541604085,
183
+ "r":0.8631379245,
184
+ "f":0.8586257006
185
+ },
186
+ "det":{
187
+ "p":0.9768729642,
188
+ "r":0.9782271875,
189
+ "f":0.9775496068
190
+ },
191
+ "pobj":{
192
+ "p":0.9620664033,
193
+ "r":0.966071078,
194
+ "f":0.9640645819
195
+ },
196
+ "nsubj":{
197
+ "p":0.9573684677,
198
+ "r":0.9454983571,
199
+ "f":0.9513963894
200
+ },
201
+ "aux":{
202
+ "p":0.9792295402,
203
+ "r":0.982106294,
204
+ "f":0.9806658074
205
+ },
206
+ "advmod":{
207
+ "p":0.8525198045,
208
+ "r":0.8510853104,
209
+ "f":0.8518019535
210
+ },
211
+ "relcl":{
212
+ "p":0.7660107335,
213
+ "r":0.776850508,
214
+ "f":0.7713925419
215
+ },
216
+ "root":{
217
+ "p":0.9179682195,
218
+ "r":0.8917474767,
219
+ "f":0.9046678936
220
+ },
221
+ "xcomp":{
222
+ "p":0.8814035088,
223
+ "r":0.9016511127,
224
+ "f":0.8914123492
225
+ },
226
+ "amod":{
227
+ "p":0.9161996611,
228
+ "r":0.9109167477,
229
+ "f":0.9135505669
230
+ },
231
+ "compound":{
232
+ "p":0.916113822,
233
+ "r":0.9305524616,
234
+ "f":0.9232766957
235
+ },
236
+ "poss":{
237
+ "p":0.9741586538,
238
+ "r":0.9788647343,
239
+ "f":0.9765060241
240
+ },
241
+ "ccomp":{
242
+ "p":0.7786216062,
243
+ "r":0.8352342159,
244
+ "f":0.8059349514
245
+ },
246
+ "attr":{
247
+ "p":0.8972491909,
248
+ "r":0.9327165685,
249
+ "f":0.9146391753
250
+ },
251
+ "case":{
252
+ "p":0.9782608696,
253
+ "r":0.990990991,
254
+ "f":0.9845847837
255
+ },
256
+ "mark":{
257
+ "p":0.9028511088,
258
+ "r":0.906200318,
259
+ "f":0.9045226131
260
+ },
261
+ "intj":{
262
+ "p":0.6679841897,
263
+ "r":0.619047619,
264
+ "f":0.6425855513
265
+ },
266
+ "advcl":{
267
+ "p":0.6656519533,
268
+ "r":0.6607907328,
269
+ "f":0.6632124352
270
+ },
271
+ "cc":{
272
+ "p":0.8345964153,
273
+ "r":0.8298050472,
274
+ "f":0.8321938347
275
+ },
276
+ "neg":{
277
+ "p":0.9475786321,
278
+ "r":0.9523331661,
279
+ "f":0.9499499499
280
+ },
281
+ "conj":{
282
+ "p":0.7649689441,
283
+ "r":0.7751762336,
284
+ "f":0.7700387645
285
+ },
286
+ "nsubjpass":{
287
+ "p":0.9159021407,
288
+ "r":0.9215384615,
289
+ "f":0.9187116564
290
+ },
291
+ "auxpass":{
292
+ "p":0.9494232476,
293
+ "r":0.9749430524,
294
+ "f":0.9620139357
295
+ },
296
+ "dobj":{
297
+ "p":0.9231431478,
298
+ "r":0.9399155311,
299
+ "f":0.9314538419
300
+ },
301
+ "nummod":{
302
+ "p":0.9353284301,
303
+ "r":0.9313131313,
304
+ "f":0.9333164621
305
+ },
306
+ "npadvmod":{
307
+ "p":0.7748267898,
308
+ "r":0.7150976909,
309
+ "f":0.7437650102
310
+ },
311
+ "prt":{
312
+ "p":0.8148760331,
313
+ "r":0.8835125448,
314
+ "f":0.8478073947
315
+ },
316
+ "pcomp":{
317
+ "p":0.8693820225,
318
+ "r":0.8669467787,
319
+ "f":0.8681626928
320
+ },
321
+ "expl":{
322
+ "p":0.9789029536,
323
+ "r":0.9935760171,
324
+ "f":0.9861849097
325
+ },
326
+ "acl":{
327
+ "p":0.7417295415,
328
+ "r":0.6972176759,
329
+ "f":0.7187851519
330
+ },
331
+ "agent":{
332
+ "p":0.8994889267,
333
+ "r":0.9462365591,
334
+ "f":0.9222707424
335
+ },
336
+ "dative":{
337
+ "p":0.7669172932,
338
+ "r":0.7018348624,
339
+ "f":0.7329341317
340
+ },
341
+ "acomp":{
342
+ "p":0.9132441163,
343
+ "r":0.8975056689,
344
+ "f":0.9053064959
345
+ },
346
+ "dep":{
347
+ "p":0.3686006826,
348
+ "r":0.1753246753,
349
+ "f":0.2376237624
350
+ },
351
+ "csubj":{
352
+ "p":0.7039106145,
353
+ "r":0.7455621302,
354
+ "f":0.724137931
355
+ },
356
+ "quantmod":{
357
+ "p":0.8625336927,
358
+ "r":0.7798537774,
359
+ "f":0.819112628
360
+ },
361
+ "nmod":{
362
+ "p":0.752886836,
363
+ "r":0.5959780622,
364
+ "f":0.6653061224
365
+ },
366
+ "appos":{
367
+ "p":0.6866606983,
368
+ "r":0.6655097614,
369
+ "f":0.6759198061
370
+ },
371
+ "predet":{
372
+ "p":0.8406374502,
373
+ "r":0.9055793991,
374
+ "f":0.8719008264
375
+ },
376
+ "preconj":{
377
+ "p":0.5591397849,
378
+ "r":0.6046511628,
379
+ "f":0.5810055866
380
+ },
381
+ "oprd":{
382
+ "p":0.8287671233,
383
+ "r":0.7223880597,
384
+ "f":0.7719298246
385
+ },
386
+ "parataxis":{
387
+ "p":0.5860215054,
388
+ "r":0.4728850325,
389
+ "f":0.5234093637
390
+ },
391
+ "meta":{
392
+ "p":0.8,
393
+ "r":0.4615384615,
394
+ "f":0.5853658537
395
+ },
396
+ "csubjpass":{
397
+ "p":0.625,
398
+ "r":0.8333333333,
399
+ "f":0.7142857143
400
+ }
401
+ },
402
+ "ents_p":0.8429743795,
403
+ "ents_r":0.8436498397,
404
+ "ents_f":0.8433119744,
405
+ "ents_per_type":{
406
+ "DATE":{
407
+ "p":0.8531038722,
408
+ "r":0.8812698413,
409
+ "f":0.8669581512
410
+ },
411
+ "GPE":{
412
+ "p":0.9142205757,
413
+ "r":0.8948396095,
414
+ "f":0.9044262757
415
+ },
416
+ "ORDINAL":{
417
+ "p":0.7741046832,
418
+ "r":0.8726708075,
419
+ "f":0.8204379562
420
+ },
421
+ "ORG":{
422
+ "p":0.7904834996,
423
+ "r":0.8191940615,
424
+ "f":0.8045827366
425
+ },
426
+ "CARDINAL":{
427
+ "p":0.8149386845,
428
+ "r":0.8692033294,
429
+ "f":0.8411967779
430
+ },
431
+ "FAC":{
432
+ "p":0.3904761905,
433
+ "r":0.3153846154,
434
+ "f":0.3489361702
435
+ },
436
+ "PERSON":{
437
+ "p":0.8574969021,
438
+ "r":0.9033942559,
439
+ "f":0.8798474253
440
+ },
441
+ "NORP":{
442
+ "p":0.903122498,
443
+ "r":0.9024,
444
+ "f":0.9027611044
445
+ },
446
+ "TIME":{
447
+ "p":0.7454545455,
448
+ "r":0.7192982456,
449
+ "f":0.7321428571
450
+ },
451
+ "LOC":{
452
+ "p":0.7356321839,
453
+ "r":0.6114649682,
454
+ "f":0.667826087
455
+ },
456
+ "MONEY":{
457
+ "p":0.915274463,
458
+ "r":0.9055489965,
459
+ "f":0.9103857567
460
+ },
461
+ "QUANTITY":{
462
+ "p":0.8153846154,
463
+ "r":0.5824175824,
464
+ "f":0.6794871795
465
+ },
466
+ "WORK_OF_ART":{
467
+ "p":0.4744525547,
468
+ "r":0.3350515464,
469
+ "f":0.3927492447
470
+ },
471
+ "EVENT":{
472
+ "p":0.6341463415,
473
+ "r":0.2988505747,
474
+ "f":0.40625
475
+ },
476
+ "LAW":{
477
+ "p":0.4464285714,
478
+ "r":0.390625,
479
+ "f":0.4166666667
480
+ },
481
+ "PERCENT":{
482
+ "p":0.9153354633,
483
+ "r":0.8774885145,
484
+ "f":0.8960125098
485
+ },
486
+ "LANGUAGE":{
487
+ "p":0.7692307692,
488
+ "r":0.625,
489
+ "f":0.6896551724
490
+ },
491
+ "PRODUCT":{
492
+ "p":0.5287356322,
493
+ "r":0.2180094787,
494
+ "f":0.3087248322
495
+ }
496
+ },
497
+ "speed":9426.1029865937
498
+ },
499
+ "sources":[
500
+ {
501
+ "name":"OntoNotes 5",
502
+ "url":"https://catalog.ldc.upenn.edu/LDC2013T19",
503
+ "license":"commercial (licensed by Explosion)",
504
+ "author":"Ralph Weischedel, Martha Palmer, Mitchell Marcus, Eduard Hovy, Sameer Pradhan, Lance Ramshaw, Nianwen Xue, Ann Taylor, Jeff Kaufman, Michelle Franchini, Mohammed El-Bachouti, Robert Belvin, Ann Houston"
505
+ },
506
+ {
507
+ "name":"ClearNLP Constituent-to-Dependency Conversion",
508
+ "url":"https://github.com/clir/clearnlp-guidelines/blob/master/md/components/dependency_conversion.md",
509
+ "license":"Citation provided for reference, no code packaged with model",
510
+ "author":"Emory University"
511
+ },
512
+ {
513
+ "name":"WordNet 3.0",
514
+ "url":"https://wordnet.princeton.edu/",
515
+ "author":"Princeton University",
516
+ "license":"WordNet 3.0 License"
517
+ }
518
+ ],
519
+ "requirements":[
520
+
521
+ ]
522
+ }