Update spaCy pipeline
Browse files
- .gitattributes +2 -0
- README.md +11 -11
- config.cfg +5 -5
- en_Spacy_Custom_ner2-any-py3-none-any.whl +2 -2
- meta.json +28 -22
- ner/model +0 -0
- ner/moves +1 -1
- tok2vec/model +2 -2
- vocab/key2row +3 -1
- vocab/strings.json +0 -0
- vocab/vectors +0 -0
.gitattributes
CHANGED
@@ -34,3 +34,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
34 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
35 |
en_Spacy_Custom_ner2-any-py3-none-any.whl filter=lfs diff=lfs merge=lfs -text
|
36 |
tok2vec/model filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
34 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
35 |
en_Spacy_Custom_ner2-any-py3-none-any.whl filter=lfs diff=lfs merge=lfs -text
|
36 |
tok2vec/model filter=lfs diff=lfs merge=lfs -text
|
37 |
+
vocab/key2row filter=lfs diff=lfs merge=lfs -text
|
38 |
+
vocab/vectors filter=lfs diff=lfs merge=lfs -text
|
README.md
CHANGED
@@ -13,13 +13,13 @@ model-index:
|
|
13 |
metrics:
|
14 |
- name: NER Precision
|
15 |
type: precision
|
16 |
-
value: 0.
|
17 |
- name: NER Recall
|
18 |
type: recall
|
19 |
-
value: 0.
|
20 |
- name: NER F Score
|
21 |
type: f_score
|
22 |
-
value: 0.
|
23 |
---
|
24 |
| Feature | Description |
|
25 |
| --- | --- |
|
@@ -28,7 +28,7 @@ model-index:
|
|
28 |
| **spaCy** | `>=3.5.3,<3.6.0` |
|
29 |
| **Default Pipeline** | `tok2vec`, `ner` |
|
30 |
| **Components** | `tok2vec`, `ner` |
|
31 |
-
| **Vectors** |
|
32 |
| **Sources** | n/a |
|
33 |
| **License** | n/a |
|
34 |
| **Author** | [n/a]() |
|
@@ -37,11 +37,11 @@ model-index:
|
|
37 |
|
38 |
<details>
|
39 |
|
40 |
-
<summary>View label scheme (
|
41 |
|
42 |
| Component | Labels |
|
43 |
| --- | --- |
|
44 |
-
| **`ner`** | `AGENT_FALLBACK`, `BOOK`, `COMODITY`, `CONTAINER COUNT`, `CONTAINER SIZE`, `CONTAINER SIZE-COUNT`, `DESTINATION`, `ENQUIRY`, `HELP`, `INCOTERM`, `KYC`, `ORIGIN`, `SEARCH RATES`, `SHIP`, `SHIPMENT TYPE` |
|
45 |
|
46 |
</details>
|
47 |
|
@@ -49,8 +49,8 @@ model-index:
|
|
49 |
|
50 |
| Type | Score |
|
51 |
| --- | --- |
|
52 |
-
| `ENTS_F` | 99.
|
53 |
-
| `ENTS_P` | 99.
|
54 |
-
| `ENTS_R` | 99.
|
55 |
-
| `TOK2VEC_LOSS` |
|
56 |
-
| `NER_LOSS` |
|
|
|
13 |
metrics:
|
14 |
- name: NER Precision
|
15 |
type: precision
|
16 |
+
value: 0.9918793503
|
17 |
- name: NER Recall
|
18 |
type: recall
|
19 |
+
value: 0.9965034965
|
20 |
- name: NER F Score
|
21 |
type: f_score
|
22 |
+
value: 0.9941860465
|
23 |
---
|
24 |
| Feature | Description |
|
25 |
| --- | --- |
|
|
|
28 |
| **spaCy** | `>=3.5.3,<3.6.0` |
|
29 |
| **Default Pipeline** | `tok2vec`, `ner` |
|
30 |
| **Components** | `tok2vec`, `ner` |
|
31 |
+
| **Vectors** | 514157 keys, 514157 unique vectors (300 dimensions) |
|
32 |
| **Sources** | n/a |
|
33 |
| **License** | n/a |
|
34 |
| **Author** | [n/a]() |
|
|
|
37 |
|
38 |
<details>
|
39 |
|
40 |
+
<summary>View label scheme (16 labels for 1 components)</summary>
|
41 |
|
42 |
| Component | Labels |
|
43 |
| --- | --- |
|
44 |
+
| **`ner`** | `AGENT_FALLBACK`, `BOOK`, `COMODITY`, `CONTAINER COUNT`, `CONTAINER SIZE`, `CONTAINER SIZE-COUNT`, `DESTINATION`, `ENQUIRY`, `HELP`, `INCOTERM`, `KYC`, `ORIGIN`, `SEARCH RATES`, `SHIP`, `SHIPMENT TYPE`, `WELCOME_MSG` |
|
45 |
|
46 |
</details>
|
47 |
|
|
|
49 |
|
50 |
| Type | Score |
|
51 |
| --- | --- |
|
52 |
+
| `ENTS_F` | 99.42 |
|
53 |
+
| `ENTS_P` | 99.19 |
|
54 |
+
| `ENTS_R` | 99.65 |
|
55 |
+
| `TOK2VEC_LOSS` | 1794.25 |
|
56 |
+
| `NER_LOSS` | 53209.43 |
|
config.cfg
CHANGED
@@ -1,7 +1,7 @@
|
|
1 |
[paths]
|
2 |
train = "./training_data.spacy"
|
3 |
dev = "./training_data.spacy"
|
4 |
-
vectors =
|
5 |
init_tok2vec = null
|
6 |
|
7 |
[system]
|
@@ -11,7 +11,7 @@ seed = 0
|
|
11 |
[nlp]
|
12 |
lang = "en"
|
13 |
pipeline = ["tok2vec","ner"]
|
14 |
-
batch_size =
|
15 |
disabled = []
|
16 |
before_creation = null
|
17 |
after_creation = null
|
@@ -52,12 +52,12 @@ factory = "tok2vec"
|
|
52 |
width = ${components.tok2vec.model.encode.width}
|
53 |
attrs = ["NORM","PREFIX","SUFFIX","SHAPE"]
|
54 |
rows = [5000,1000,2500,2500]
|
55 |
-
include_static_vectors =
|
56 |
|
57 |
[components.tok2vec.model.encode]
|
58 |
@architectures = "spacy.MaxoutWindowEncoder.v2"
|
59 |
-
width =
|
60 |
-
depth =
|
61 |
window_size = 1
|
62 |
maxout_pieces = 3
|
63 |
|
|
|
1 |
[paths]
|
2 |
train = "./training_data.spacy"
|
3 |
dev = "./training_data.spacy"
|
4 |
+
vectors = "en_core_web_lg"
|
5 |
init_tok2vec = null
|
6 |
|
7 |
[system]
|
|
|
11 |
[nlp]
|
12 |
lang = "en"
|
13 |
pipeline = ["tok2vec","ner"]
|
14 |
+
batch_size = 100
|
15 |
disabled = []
|
16 |
before_creation = null
|
17 |
after_creation = null
|
|
|
52 |
width = ${components.tok2vec.model.encode.width}
|
53 |
attrs = ["NORM","PREFIX","SUFFIX","SHAPE"]
|
54 |
rows = [5000,1000,2500,2500]
|
55 |
+
include_static_vectors = true
|
56 |
|
57 |
[components.tok2vec.model.encode]
|
58 |
@architectures = "spacy.MaxoutWindowEncoder.v2"
|
59 |
+
width = 256
|
60 |
+
depth = 8
|
61 |
window_size = 1
|
62 |
maxout_pieces = 3
|
63 |
|
en_Spacy_Custom_ner2-any-py3-none-any.whl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cdf71ff55f457d482bbdb22b28d2290167f5d9e468d01bf27dba4cd9b365bd5e
|
3 |
+
size 606745646
|
meta.json
CHANGED
@@ -10,10 +10,10 @@
|
|
10 |
"spacy_version":">=3.5.3,<3.6.0",
|
11 |
"spacy_git_version":"Unknown",
|
12 |
"vectors":{
|
13 |
-
"width":
|
14 |
-
"vectors":
|
15 |
-
"keys":
|
16 |
-
"name":
|
17 |
},
|
18 |
"labels":{
|
19 |
"tok2vec":[
|
@@ -34,7 +34,8 @@
|
|
34 |
"ORIGIN",
|
35 |
"SEARCH RATES",
|
36 |
"SHIP",
|
37 |
-
"SHIPMENT TYPE"
|
|
|
38 |
]
|
39 |
},
|
40 |
"pipeline":[
|
@@ -49,9 +50,9 @@
|
|
49 |
|
50 |
],
|
51 |
"performance":{
|
52 |
-
"ents_f":0.
|
53 |
-
"ents_p":0.
|
54 |
-
"ents_r":0.
|
55 |
"ents_per_type":{
|
56 |
"SEARCH RATES":{
|
57 |
"p":1.0,
|
@@ -64,9 +65,9 @@
|
|
64 |
"f":1.0
|
65 |
},
|
66 |
"DESTINATION":{
|
67 |
-
"p":0.
|
68 |
-
"r":0
|
69 |
-
"f":0.
|
70 |
},
|
71 |
"BOOK":{
|
72 |
"p":1.0,
|
@@ -79,9 +80,9 @@
|
|
79 |
"f":0.9938650307
|
80 |
},
|
81 |
"CONTAINER SIZE":{
|
82 |
-
"p":
|
83 |
-
"r":0.
|
84 |
-
"f":0.
|
85 |
},
|
86 |
"SHIPMENT TYPE":{
|
87 |
"p":1.0,
|
@@ -109,9 +110,9 @@
|
|
109 |
"f":1.0
|
110 |
},
|
111 |
"COMODITY":{
|
112 |
-
"p":0.
|
113 |
-
"r":
|
114 |
-
"f":0.
|
115 |
},
|
116 |
"CONTAINER COUNT":{
|
117 |
"p":1.0,
|
@@ -119,18 +120,23 @@
|
|
119 |
"f":1.0
|
120 |
},
|
121 |
"CONTAINER SIZE-COUNT":{
|
122 |
-
"p":0
|
123 |
-
"r":
|
124 |
-
"f":0.
|
125 |
},
|
126 |
"AGENT_FALLBACK":{
|
127 |
"p":1.0,
|
128 |
"r":1.0,
|
129 |
"f":1.0
|
|
|
|
|
|
|
|
|
|
|
130 |
}
|
131 |
},
|
132 |
-
"tok2vec_loss":
|
133 |
-
"ner_loss":
|
134 |
},
|
135 |
"requirements":[
|
136 |
|
|
|
10 |
"spacy_version":">=3.5.3,<3.6.0",
|
11 |
"spacy_git_version":"Unknown",
|
12 |
"vectors":{
|
13 |
+
"width":300,
|
14 |
+
"vectors":514157,
|
15 |
+
"keys":514157,
|
16 |
+
"name":"en_vectors"
|
17 |
},
|
18 |
"labels":{
|
19 |
"tok2vec":[
|
|
|
34 |
"ORIGIN",
|
35 |
"SEARCH RATES",
|
36 |
"SHIP",
|
37 |
+
"SHIPMENT TYPE",
|
38 |
+
"WELCOME_MSG"
|
39 |
]
|
40 |
},
|
41 |
"pipeline":[
|
|
|
50 |
|
51 |
],
|
52 |
"performance":{
|
53 |
+
"ents_f":0.9941860465,
|
54 |
+
"ents_p":0.9918793503,
|
55 |
+
"ents_r":0.9965034965,
|
56 |
"ents_per_type":{
|
57 |
"SEARCH RATES":{
|
58 |
"p":1.0,
|
|
|
65 |
"f":1.0
|
66 |
},
|
67 |
"DESTINATION":{
|
68 |
+
"p":0.9903846154,
|
69 |
+
"r":1.0,
|
70 |
+
"f":0.9951690821
|
71 |
},
|
72 |
"BOOK":{
|
73 |
"p":1.0,
|
|
|
80 |
"f":0.9938650307
|
81 |
},
|
82 |
"CONTAINER SIZE":{
|
83 |
+
"p":0.9905660377,
|
84 |
+
"r":0.9905660377,
|
85 |
+
"f":0.9905660377
|
86 |
},
|
87 |
"SHIPMENT TYPE":{
|
88 |
"p":1.0,
|
|
|
110 |
"f":1.0
|
111 |
},
|
112 |
"COMODITY":{
|
113 |
+
"p":0.9523809524,
|
114 |
+
"r":0.9523809524,
|
115 |
+
"f":0.9523809524
|
116 |
},
|
117 |
"CONTAINER COUNT":{
|
118 |
"p":1.0,
|
|
|
120 |
"f":1.0
|
121 |
},
|
122 |
"CONTAINER SIZE-COUNT":{
|
123 |
+
"p":1.0,
|
124 |
+
"r":0.9615384615,
|
125 |
+
"f":0.9803921569
|
126 |
},
|
127 |
"AGENT_FALLBACK":{
|
128 |
"p":1.0,
|
129 |
"r":1.0,
|
130 |
"f":1.0
|
131 |
+
},
|
132 |
+
"WELCOME_MSG":{
|
133 |
+
"p":1.0,
|
134 |
+
"r":1.0,
|
135 |
+
"f":1.0
|
136 |
}
|
137 |
},
|
138 |
+
"tok2vec_loss":17.9424619099,
|
139 |
+
"ner_loss":532.0943451776
|
140 |
},
|
141 |
"requirements":[
|
142 |
|
ner/model
CHANGED
Binary files a/ner/model and b/ner/model differ
|
|
ner/moves
CHANGED
@@ -1 +1 @@
|
|
1 |
-
��moves
|
|
|
1 |
+
��moves�{"0":{},"1":{"DESTINATION":321,"ORIGIN":303,"CONTAINER SIZE":188,"WELCOME_MSG":178,"SHIP":81,"AGENT_FALLBACK":79,"SHIPMENT TYPE":58,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":18,"SEARCH RATES":14,"CONTAINER COUNT":10,"INCOTERM":9,"HELP":8,"KYC":2},"2":{"DESTINATION":321,"ORIGIN":303,"CONTAINER SIZE":188,"WELCOME_MSG":178,"SHIP":81,"AGENT_FALLBACK":79,"SHIPMENT TYPE":58,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":18,"SEARCH RATES":14,"CONTAINER COUNT":10,"INCOTERM":9,"HELP":8,"KYC":2},"3":{"DESTINATION":321,"ORIGIN":303,"CONTAINER SIZE":188,"WELCOME_MSG":178,"SHIP":81,"AGENT_FALLBACK":79,"SHIPMENT TYPE":58,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":18,"SEARCH RATES":14,"CONTAINER COUNT":10,"INCOTERM":9,"HELP":8,"KYC":2},"4":{"DESTINATION":321,"ORIGIN":303,"CONTAINER SIZE":188,"WELCOME_MSG":178,"SHIP":81,"AGENT_FALLBACK":79,"SHIPMENT TYPE":58,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":18,"SEARCH RATES":14,"CONTAINER COUNT":10,"INCOTERM":9,"HELP":8,"KYC":2,"":1},"5":{"":1}}�cfg��neg_key�
|
tok2vec/model
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e2f3e2fab9f568a5c3e23cbe9aa9f9e7e51da3c44d61ed32c617696964b45eb
|
3 |
+
size 34434008
|
vocab/key2row
CHANGED
@@ -1 +1,3 @@
|
|
1 |
-
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:31566ae010da3d399eb1d930ae142757afd2601034a4be3bdb00d18881c8c06a
|
3 |
+
size 7066303
|
vocab/strings.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
vocab/vectors
CHANGED
Binary files a/vocab/vectors and b/vocab/vectors differ
|
|