Ybhav14 committed on
Commit
11dd3ea
·
1 Parent(s): 0014b42

Update spaCy pipeline

Browse files
.gitattributes CHANGED
@@ -34,3 +34,5 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
  en_Spacy_Custom_ner2-any-py3-none-any.whl filter=lfs diff=lfs merge=lfs -text
36
  tok2vec/model filter=lfs diff=lfs merge=lfs -text
 
 
 
34
  *tfevents* filter=lfs diff=lfs merge=lfs -text
35
  en_Spacy_Custom_ner2-any-py3-none-any.whl filter=lfs diff=lfs merge=lfs -text
36
  tok2vec/model filter=lfs diff=lfs merge=lfs -text
37
+ vocab/key2row filter=lfs diff=lfs merge=lfs -text
38
+ vocab/vectors filter=lfs diff=lfs merge=lfs -text
README.md CHANGED
@@ -13,13 +13,13 @@ model-index:
13
  metrics:
14
  - name: NER Precision
15
  type: precision
16
- value: 0.9914634146
17
  - name: NER Recall
18
  type: recall
19
- value: 0.9963235294
20
  - name: NER F Score
21
  type: f_score
22
- value: 0.9938875306
23
  ---
24
  | Feature | Description |
25
  | --- | --- |
@@ -28,7 +28,7 @@ model-index:
28
  | **spaCy** | `>=3.5.3,<3.6.0` |
29
  | **Default Pipeline** | `tok2vec`, `ner` |
30
  | **Components** | `tok2vec`, `ner` |
31
- | **Vectors** | 0 keys, 0 unique vectors (0 dimensions) |
32
  | **Sources** | n/a |
33
  | **License** | n/a |
34
  | **Author** | [n/a]() |
@@ -37,11 +37,11 @@ model-index:
37
 
38
  <details>
39
 
40
- <summary>View label scheme (15 labels for 1 components)</summary>
41
 
42
  | Component | Labels |
43
  | --- | --- |
44
- | **`ner`** | `AGENT_FALLBACK`, `BOOK`, `COMODITY`, `CONTAINER COUNT`, `CONTAINER SIZE`, `CONTAINER SIZE-COUNT`, `DESTINATION`, `ENQUIRY`, `HELP`, `INCOTERM`, `KYC`, `ORIGIN`, `SEARCH RATES`, `SHIP`, `SHIPMENT TYPE` |
45
 
46
  </details>
47
 
@@ -49,8 +49,8 @@ model-index:
49
 
50
  | Type | Score |
51
  | --- | --- |
52
- | `ENTS_F` | 99.39 |
53
- | `ENTS_P` | 99.15 |
54
- | `ENTS_R` | 99.63 |
55
- | `TOK2VEC_LOSS` | 11705.89 |
56
- | `NER_LOSS` | 73604.05 |
 
13
  metrics:
14
  - name: NER Precision
15
  type: precision
16
+ value: 0.9918793503
17
  - name: NER Recall
18
  type: recall
19
+ value: 0.9965034965
20
  - name: NER F Score
21
  type: f_score
22
+ value: 0.9941860465
23
  ---
24
  | Feature | Description |
25
  | --- | --- |
 
28
  | **spaCy** | `>=3.5.3,<3.6.0` |
29
  | **Default Pipeline** | `tok2vec`, `ner` |
30
  | **Components** | `tok2vec`, `ner` |
31
+ | **Vectors** | 514157 keys, 514157 unique vectors (300 dimensions) |
32
  | **Sources** | n/a |
33
  | **License** | n/a |
34
  | **Author** | [n/a]() |
 
37
 
38
  <details>
39
 
40
+ <summary>View label scheme (16 labels for 1 components)</summary>
41
 
42
  | Component | Labels |
43
  | --- | --- |
44
+ | **`ner`** | `AGENT_FALLBACK`, `BOOK`, `COMODITY`, `CONTAINER COUNT`, `CONTAINER SIZE`, `CONTAINER SIZE-COUNT`, `DESTINATION`, `ENQUIRY`, `HELP`, `INCOTERM`, `KYC`, `ORIGIN`, `SEARCH RATES`, `SHIP`, `SHIPMENT TYPE`, `WELCOME_MSG` |
45
 
46
  </details>
47
 
 
49
 
50
  | Type | Score |
51
  | --- | --- |
52
+ | `ENTS_F` | 99.42 |
53
+ | `ENTS_P` | 99.19 |
54
+ | `ENTS_R` | 99.65 |
55
+ | `TOK2VEC_LOSS` | 1794.25 |
56
+ | `NER_LOSS` | 53209.43 |
config.cfg CHANGED
@@ -1,7 +1,7 @@
1
  [paths]
2
  train = "./training_data.spacy"
3
  dev = "./training_data.spacy"
4
- vectors = null
5
  init_tok2vec = null
6
 
7
  [system]
@@ -11,7 +11,7 @@ seed = 0
11
  [nlp]
12
  lang = "en"
13
  pipeline = ["tok2vec","ner"]
14
- batch_size = 1000
15
  disabled = []
16
  before_creation = null
17
  after_creation = null
@@ -52,12 +52,12 @@ factory = "tok2vec"
52
  width = ${components.tok2vec.model.encode.width}
53
  attrs = ["NORM","PREFIX","SUFFIX","SHAPE"]
54
  rows = [5000,1000,2500,2500]
55
- include_static_vectors = false
56
 
57
  [components.tok2vec.model.encode]
58
  @architectures = "spacy.MaxoutWindowEncoder.v2"
59
- width = 96
60
- depth = 4
61
  window_size = 1
62
  maxout_pieces = 3
63
 
 
1
  [paths]
2
  train = "./training_data.spacy"
3
  dev = "./training_data.spacy"
4
+ vectors = "en_core_web_lg"
5
  init_tok2vec = null
6
 
7
  [system]
 
11
  [nlp]
12
  lang = "en"
13
  pipeline = ["tok2vec","ner"]
14
+ batch_size = 100
15
  disabled = []
16
  before_creation = null
17
  after_creation = null
 
52
  width = ${components.tok2vec.model.encode.width}
53
  attrs = ["NORM","PREFIX","SUFFIX","SHAPE"]
54
  rows = [5000,1000,2500,2500]
55
+ include_static_vectors = true
56
 
57
  [components.tok2vec.model.encode]
58
  @architectures = "spacy.MaxoutWindowEncoder.v2"
59
+ width = 256
60
+ depth = 8
61
  window_size = 1
62
  maxout_pieces = 3
63
 
en_Spacy_Custom_ner2-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d7743b2f22633d673034a38e534ced88e1d2de091f27e11c5f5d8155691a4556
3
- size 5685862
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cdf71ff55f457d482bbdb22b28d2290167f5d9e468d01bf27dba4cd9b365bd5e
3
+ size 606745646
meta.json CHANGED
@@ -10,10 +10,10 @@
10
  "spacy_version":">=3.5.3,<3.6.0",
11
  "spacy_git_version":"Unknown",
12
  "vectors":{
13
- "width":0,
14
- "vectors":0,
15
- "keys":0,
16
- "name":null
17
  },
18
  "labels":{
19
  "tok2vec":[
@@ -34,7 +34,8 @@
34
  "ORIGIN",
35
  "SEARCH RATES",
36
  "SHIP",
37
- "SHIPMENT TYPE"
 
38
  ]
39
  },
40
  "pipeline":[
@@ -49,9 +50,9 @@
49
 
50
  ],
51
  "performance":{
52
- "ents_f":0.9938875306,
53
- "ents_p":0.9914634146,
54
- "ents_r":0.9963235294,
55
  "ents_per_type":{
56
  "SEARCH RATES":{
57
  "p":1.0,
@@ -64,9 +65,9 @@
64
  "f":1.0
65
  },
66
  "DESTINATION":{
67
- "p":0.9951456311,
68
- "r":0.9951456311,
69
- "f":0.9951456311
70
  },
71
  "BOOK":{
72
  "p":1.0,
@@ -79,9 +80,9 @@
79
  "f":0.9938650307
80
  },
81
  "CONTAINER SIZE":{
82
- "p":1.0,
83
- "r":0.9811320755,
84
- "f":0.9904761905
85
  },
86
  "SHIPMENT TYPE":{
87
  "p":1.0,
@@ -109,9 +110,9 @@
109
  "f":1.0
110
  },
111
  "COMODITY":{
112
- "p":0.9130434783,
113
- "r":1.0,
114
- "f":0.9545454545
115
  },
116
  "CONTAINER COUNT":{
117
  "p":1.0,
@@ -119,18 +120,23 @@
119
  "f":1.0
120
  },
121
  "CONTAINER SIZE-COUNT":{
122
- "p":0.962962963,
123
- "r":1.0,
124
- "f":0.9811320755
125
  },
126
  "AGENT_FALLBACK":{
127
  "p":1.0,
128
  "r":1.0,
129
  "f":1.0
 
 
 
 
 
130
  }
131
  },
132
- "tok2vec_loss":117.0588980803,
133
- "ner_loss":736.0405311402
134
  },
135
  "requirements":[
136
 
 
10
  "spacy_version":">=3.5.3,<3.6.0",
11
  "spacy_git_version":"Unknown",
12
  "vectors":{
13
+ "width":300,
14
+ "vectors":514157,
15
+ "keys":514157,
16
+ "name":"en_vectors"
17
  },
18
  "labels":{
19
  "tok2vec":[
 
34
  "ORIGIN",
35
  "SEARCH RATES",
36
  "SHIP",
37
+ "SHIPMENT TYPE",
38
+ "WELCOME_MSG"
39
  ]
40
  },
41
  "pipeline":[
 
50
 
51
  ],
52
  "performance":{
53
+ "ents_f":0.9941860465,
54
+ "ents_p":0.9918793503,
55
+ "ents_r":0.9965034965,
56
  "ents_per_type":{
57
  "SEARCH RATES":{
58
  "p":1.0,
 
65
  "f":1.0
66
  },
67
  "DESTINATION":{
68
+ "p":0.9903846154,
69
+ "r":1.0,
70
+ "f":0.9951690821
71
  },
72
  "BOOK":{
73
  "p":1.0,
 
80
  "f":0.9938650307
81
  },
82
  "CONTAINER SIZE":{
83
+ "p":0.9905660377,
84
+ "r":0.9905660377,
85
+ "f":0.9905660377
86
  },
87
  "SHIPMENT TYPE":{
88
  "p":1.0,
 
110
  "f":1.0
111
  },
112
  "COMODITY":{
113
+ "p":0.9523809524,
114
+ "r":0.9523809524,
115
+ "f":0.9523809524
116
  },
117
  "CONTAINER COUNT":{
118
  "p":1.0,
 
120
  "f":1.0
121
  },
122
  "CONTAINER SIZE-COUNT":{
123
+ "p":1.0,
124
+ "r":0.9615384615,
125
+ "f":0.9803921569
126
  },
127
  "AGENT_FALLBACK":{
128
  "p":1.0,
129
  "r":1.0,
130
  "f":1.0
131
+ },
132
+ "WELCOME_MSG":{
133
+ "p":1.0,
134
+ "r":1.0,
135
+ "f":1.0
136
  }
137
  },
138
+ "tok2vec_loss":17.9424619099,
139
+ "ner_loss":532.0943451776
140
  },
141
  "requirements":[
142
 
ner/model CHANGED
Binary files a/ner/model and b/ner/model differ
 
ner/moves CHANGED
@@ -1 +1 @@
1
- ��moves��{"0":{},"1":{"DESTINATION":321,"ORIGIN":303,"CONTAINER SIZE":188,"SHIP":81,"AGENT_FALLBACK":79,"SHIPMENT TYPE":58,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":18,"SEARCH RATES":14,"CONTAINER COUNT":10,"INCOTERM":9,"HELP":8,"KYC":2},"2":{"DESTINATION":321,"ORIGIN":303,"CONTAINER SIZE":188,"SHIP":81,"AGENT_FALLBACK":79,"SHIPMENT TYPE":58,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":18,"SEARCH RATES":14,"CONTAINER COUNT":10,"INCOTERM":9,"HELP":8,"KYC":2},"3":{"DESTINATION":321,"ORIGIN":303,"CONTAINER SIZE":188,"SHIP":81,"AGENT_FALLBACK":79,"SHIPMENT TYPE":58,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":18,"SEARCH RATES":14,"CONTAINER COUNT":10,"INCOTERM":9,"HELP":8,"KYC":2},"4":{"DESTINATION":321,"ORIGIN":303,"CONTAINER SIZE":188,"SHIP":81,"AGENT_FALLBACK":79,"SHIPMENT TYPE":58,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":18,"SEARCH RATES":14,"CONTAINER COUNT":10,"INCOTERM":9,"HELP":8,"KYC":2,"":1},"5":{"":1}}�cfg��neg_key�
 
1
+ ��moves�{"0":{},"1":{"DESTINATION":321,"ORIGIN":303,"CONTAINER SIZE":188,"WELCOME_MSG":178,"SHIP":81,"AGENT_FALLBACK":79,"SHIPMENT TYPE":58,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":18,"SEARCH RATES":14,"CONTAINER COUNT":10,"INCOTERM":9,"HELP":8,"KYC":2},"2":{"DESTINATION":321,"ORIGIN":303,"CONTAINER SIZE":188,"WELCOME_MSG":178,"SHIP":81,"AGENT_FALLBACK":79,"SHIPMENT TYPE":58,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":18,"SEARCH RATES":14,"CONTAINER COUNT":10,"INCOTERM":9,"HELP":8,"KYC":2},"3":{"DESTINATION":321,"ORIGIN":303,"CONTAINER SIZE":188,"WELCOME_MSG":178,"SHIP":81,"AGENT_FALLBACK":79,"SHIPMENT TYPE":58,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":18,"SEARCH RATES":14,"CONTAINER COUNT":10,"INCOTERM":9,"HELP":8,"KYC":2},"4":{"DESTINATION":321,"ORIGIN":303,"CONTAINER SIZE":188,"WELCOME_MSG":178,"SHIP":81,"AGENT_FALLBACK":79,"SHIPMENT TYPE":58,"CONTAINER SIZE-COUNT":39,"COMODITY":31,"BOOK":28,"ENQUIRY":18,"SEARCH RATES":14,"CONTAINER COUNT":10,"INCOTERM":9,"HELP":8,"KYC":2,"":1},"5":{"":1}}�cfg��neg_key�
tok2vec/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:822be8a54a09b5c9df436b15ca1de414fca5830de7fe6ed9226c094e7718bf3f
3
- size 6009091
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e2f3e2fab9f568a5c3e23cbe9aa9f9e7e51da3c44d61ed32c617696964b45eb
3
+ size 34434008
vocab/key2row CHANGED
@@ -1 +1,3 @@
1
-
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31566ae010da3d399eb1d930ae142757afd2601034a4be3bdb00d18881c8c06a
3
+ size 7066303
vocab/strings.json CHANGED
The diff for this file is too large to render. See raw diff
 
vocab/vectors CHANGED
Binary files a/vocab/vectors and b/vocab/vectors differ