teo-sanchez committed on
Commit
1b6ed6e
1 Parent(s): 162009f

Update spaCy pipeline

Browse files
Files changed (8) hide show
  1. README.md +13 -18
  2. config.cfg +19 -19
  3. en_ner_prompting-any-py3-none-any.whl +2 -2
  4. meta.json +12 -109
  5. ner/model +0 -0
  6. ner/moves +1 -1
  7. tok2vec/model +1 -1
  8. vocab/strings.json +0 -0
README.md CHANGED
@@ -13,40 +13,35 @@ model-index:
13
  metrics:
14
  - name: NER Precision
15
  type: precision
16
- value: 0.7636566332
17
  - name: NER Recall
18
  type: recall
19
- value: 0.6975560081
20
  - name: NER F Score
21
  type: f_score
22
- value: 0.7291112294
23
- widget:
24
- - text: Golden statue of a victorious warrior raising his sword to the sky, heroic, glorious, in the style of artgerm, gerald brom, atey ghailan and mike mignola, vibrant colors and hard shadows and strong rim light, plain background, comic cover art, trending on artstation
25
- - text: Italian renaissance dragon statue castle gallery highly detailed artstation concept art sharp focus illustration briclot rutkowski mucha
26
- - text: Quetzalcoatl in an epic battle with garuda, fantasy, stained glass, d & d, intricate, elegant, highly detailed, digital painting, artstation, concept art, matte, sharp focus, illustration, art by john collier and albert aublet and krenz cushart and artem demura and alphonse mucha
27
- license: mit
28
  ---
29
  | Feature | Description |
30
  | --- | --- |
31
  | **Name** | `en_ner_prompting` |
32
- | **Version** | `0.0.1` |
33
  | **spaCy** | `>=3.4.3,<3.5.0` |
34
  | **Default Pipeline** | `tok2vec`, `ner` |
35
  | **Components** | `tok2vec`, `ner` |
36
  | **Vectors** | 514157 keys, 514157 unique vectors (300 dimensions) |
37
  | **Sources** | n/a |
38
- | **License** | MIT |
39
- | **Author** | [Selas](https://www.selas.ai/) |
40
 
41
  ### Label Scheme
42
 
43
  <details>
44
 
45
- <summary>View label scheme (18 labels for 1 components)</summary>
46
 
47
  | Component | Labels |
48
  | --- | --- |
49
- | **`ner`** | `color`, `composition/scale`, `composition/view`, `context/emotion`, `context/era`, `context/weather`, `detail`, `influence/artist`, `influence/artwork`, `influence/genre`, `influence/repository`, `light`, `medium/illustration`, `medium/painting`, `medium/photography`, `medium/rendering`, `other`, `subject` |
50
 
51
  </details>
52
 
@@ -54,8 +49,8 @@ license: mit
54
 
55
  | Type | Score |
56
  | --- | --- |
57
- | `ENTS_F` | 72.91 |
58
- | `ENTS_P` | 76.37 |
59
- | `ENTS_R` | 69.76 |
60
- | `TOK2VEC_LOSS` | 25220.55 |
61
- | `NER_LOSS` | 221026.23 |
 
13
  metrics:
14
  - name: NER Precision
15
  type: precision
16
+ value: 0.7375565611
17
  - name: NER Recall
18
  type: recall
19
+ value: 0.6848739496
20
  - name: NER F Score
21
  type: f_score
22
+ value: 0.7102396514
 
 
 
 
 
23
  ---
24
  | Feature | Description |
25
  | --- | --- |
26
  | **Name** | `en_ner_prompting` |
27
+ | **Version** | `0.0.2` |
28
  | **spaCy** | `>=3.4.3,<3.5.0` |
29
  | **Default Pipeline** | `tok2vec`, `ner` |
30
  | **Components** | `tok2vec`, `ner` |
31
  | **Vectors** | 514157 keys, 514157 unique vectors (300 dimensions) |
32
  | **Sources** | n/a |
33
+ | **License** | n/a |
34
+ | **Author** | [n/a]() |
35
 
36
  ### Label Scheme
37
 
38
  <details>
39
 
40
+ <summary>View label scheme (1 labels for 1 components)</summary>
41
 
42
  | Component | Labels |
43
  | --- | --- |
44
+ | **`ner`** | `FASHION_BRAND` |
45
 
46
  </details>
47
 
 
49
 
50
  | Type | Score |
51
  | --- | --- |
52
+ | `ENTS_F` | 71.02 |
53
+ | `ENTS_P` | 73.76 |
54
+ | `ENTS_R` | 68.49 |
55
+ | `TOK2VEC_LOSS` | 2670.31 |
56
+ | `NER_LOSS` | 913.14 |
config.cfg CHANGED
@@ -1,8 +1,8 @@
1
  [paths]
2
- train = null
3
- dev = null
4
  vectors = "en_core_web_lg"
5
- init_tok2vec = "/root/prompting-practices/models/ner_model/ner_training/pretrained_model/model50.bin"
6
 
7
  [system]
8
  gpu_allocator = "pytorch"
@@ -62,22 +62,22 @@ window_size = 1
62
  maxout_pieces = 3
63
 
64
  [corpora]
65
- @readers = "prodigy.MergedCorpus.v1"
66
- eval_split = 0.2
67
- sample_size = 1.0
68
- textcat = null
69
- textcat_multilabel = null
70
- parser = null
71
- tagger = null
72
- senter = null
73
- spancat = null
74
-
75
- [corpora.ner]
76
- @readers = "prodigy.NERCorpus.v1"
77
- datasets = ["prompt_ner_data"]
78
- eval_datasets = []
79
- default_fill = "outside"
80
- incorrect_key = "incorrect_spans"
81
 
82
  [training]
83
  dev_corpus = "corpora.dev"
 
1
  [paths]
2
+ train = "corpus/ner_prompting_training.spacy"
3
+ dev = "corpus/ner_prompting_eval.spacy"
4
  vectors = "en_core_web_lg"
5
+ init_tok2vec = "training/pretrain_embedding/model50.bin"
6
 
7
  [system]
8
  gpu_allocator = "pytorch"
 
62
  maxout_pieces = 3
63
 
64
  [corpora]
65
+
66
+ [corpora.dev]
67
+ @readers = "spacy.Corpus.v1"
68
+ path = ${paths.dev}
69
+ max_length = 0
70
+ gold_preproc = false
71
+ limit = 0
72
+ augmenter = null
73
+
74
+ [corpora.train]
75
+ @readers = "spacy.Corpus.v1"
76
+ path = ${paths.train}
77
+ max_length = 0
78
+ gold_preproc = false
79
+ limit = 0
80
+ augmenter = null
81
 
82
  [training]
83
  dev_corpus = "corpora.dev"
en_ner_prompting-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6d479d911d44a0822a5671d929f1da02aaea7ba33736c632dde194a5caa237d3
3
- size 606719222
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d0ba1229d80c28417ea0769fbb97a5e08d3e82084ec1946f16a203c88d8ebb6
3
+ size 606771499
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"en",
3
  "name":"ner_prompting",
4
- "version":"0.0.1",
5
  "description":"",
6
  "author":"",
7
  "email":"",
8
  "url":"",
9
  "license":"",
10
  "spacy_version":">=3.4.3,<3.5.0",
11
- "spacy_git_version":"Unknown",
12
  "vectors":{
13
  "width":300,
14
  "vectors":514157,
@@ -20,24 +20,7 @@
20
 
21
  ],
22
  "ner":[
23
- "color",
24
- "composition/scale",
25
- "composition/view",
26
- "context/emotion",
27
- "context/era",
28
- "context/weather",
29
- "detail",
30
- "influence/artist",
31
- "influence/artwork",
32
- "influence/genre",
33
- "influence/repository",
34
- "light",
35
- "medium/illustration",
36
- "medium/painting",
37
- "medium/photography",
38
- "medium/rendering",
39
- "other",
40
- "subject"
41
  ]
42
  },
43
  "pipeline":[
@@ -52,98 +35,18 @@
52
 
53
  ],
54
  "performance":{
55
- "ents_f":0.7291112294,
56
- "ents_p":0.7636566332,
57
- "ents_r":0.6975560081,
58
  "ents_per_type":{
59
- "context/emotion":{
60
- "p":0.8620689655,
61
- "r":0.7246376812,
62
- "f":0.7874015748
63
- },
64
- "detail":{
65
- "p":0.9142857143,
66
- "r":0.9056603774,
67
- "f":0.9099526066
68
- },
69
- "medium/illustration":{
70
- "p":0.8813559322,
71
- "r":0.8387096774,
72
- "f":0.8595041322
73
- },
74
- "influence/genre":{
75
- "p":0.8070175439,
76
- "r":0.6764705882,
77
- "f":0.736
78
- },
79
- "subject":{
80
- "p":0.5555555556,
81
- "r":0.5043859649,
82
- "f":0.5287356322
83
- },
84
- "influence/artist":{
85
- "p":0.8217054264,
86
- "r":0.8091603053,
87
- "f":0.8153846154
88
- },
89
- "influence/artwork":{
90
- "p":0.64,
91
- "r":0.4705882353,
92
- "f":0.5423728814
93
- },
94
- "influence/repository":{
95
- "p":0.9090909091,
96
- "r":0.8888888889,
97
- "f":0.8988764045
98
- },
99
- "medium/photography":{
100
- "p":0.7215189873,
101
- "r":0.7808219178,
102
- "f":0.75
103
- },
104
- "color":{
105
- "p":0.7941176471,
106
- "r":0.7941176471,
107
- "f":0.7941176471
108
- },
109
- "context/era":{
110
- "p":0.6666666667,
111
- "r":0.5454545455,
112
- "f":0.6
113
- },
114
- "composition/view":{
115
- "p":0.8947368421,
116
- "r":0.5862068966,
117
- "f":0.7083333333
118
- },
119
- "medium/rendering":{
120
- "p":0.9230769231,
121
- "r":0.5,
122
- "f":0.6486486486
123
- },
124
- "context/weather":{
125
- "p":0.5,
126
- "r":0.7272727273,
127
- "f":0.5925925926
128
- },
129
- "light":{
130
- "p":0.8636363636,
131
- "r":0.7916666667,
132
- "f":0.8260869565
133
- },
134
- "medium/painting":{
135
- "p":0.8235294118,
136
- "r":0.56,
137
- "f":0.6666666667
138
- },
139
- "composition/scale":{
140
- "p":1.0,
141
- "r":0.5,
142
- "f":0.6666666667
143
  }
144
  },
145
- "tok2vec_loss":252.2055473672,
146
- "ner_loss":2210.2623216551
147
  },
148
  "requirements":[
149
 
 
1
  {
2
  "lang":"en",
3
  "name":"ner_prompting",
4
+ "version":"0.0.2",
5
  "description":"",
6
  "author":"",
7
  "email":"",
8
  "url":"",
9
  "license":"",
10
  "spacy_version":">=3.4.3,<3.5.0",
11
+ "spacy_git_version":"63673a792",
12
  "vectors":{
13
  "width":300,
14
  "vectors":514157,
 
20
 
21
  ],
22
  "ner":[
23
+ "FASHION_BRAND"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
24
  ]
25
  },
26
  "pipeline":[
 
35
 
36
  ],
37
  "performance":{
38
+ "ents_f":0.7102396514,
39
+ "ents_p":0.7375565611,
40
+ "ents_r":0.6848739496,
41
  "ents_per_type":{
42
+ "FASHION_BRAND":{
43
+ "p":0.7375565611,
44
+ "r":0.6848739496,
45
+ "f":0.7102396514
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
46
  }
47
  },
48
+ "tok2vec_loss":26.7030918702,
49
+ "ner_loss":9.1313796143
50
  },
51
  "requirements":[
52
 
ner/model CHANGED
Binary files a/ner/model and b/ner/model differ
 
ner/moves CHANGED
@@ -1 +1 @@
1
- ��moves��{"0":{},"1":{"subject":3019,"influence/artist":1104,"detail":796,"medium/photography":530,"light":348,"medium/illustration":342,"influence/genre":308,"influence/repository":282,"color":252,"composition/view":228,"context/emotion":222,"medium/rendering":192,"influence/artwork":187,"medium/painting":155,"context/era":109,"context/weather":91,"composition/scale":20,"other":4},"2":{"subject":3019,"influence/artist":1104,"detail":796,"medium/photography":530,"light":348,"medium/illustration":342,"influence/genre":308,"influence/repository":282,"color":252,"composition/view":228,"context/emotion":222,"medium/rendering":192,"influence/artwork":187,"medium/painting":155,"context/era":109,"context/weather":91,"composition/scale":20,"other":4},"3":{"subject":3019,"influence/artist":1104,"detail":796,"medium/photography":530,"light":348,"medium/illustration":342,"influence/genre":308,"influence/repository":282,"color":252,"composition/view":228,"context/emotion":222,"medium/rendering":192,"influence/artwork":187,"medium/painting":155,"context/era":109,"context/weather":91,"composition/scale":20,"other":4},"4":{"subject":3019,"influence/artist":1104,"detail":796,"medium/photography":530,"light":348,"medium/illustration":342,"influence/genre":308,"influence/repository":282,"color":252,"composition/view":228,"context/emotion":222,"medium/rendering":192,"influence/artwork":187,"medium/painting":155,"context/era":109,"context/weather":91,"composition/scale":20,"other":4,"":1},"5":{"":1}}�cfg��neg_key�
 
1
+ ��movesـ{"0":{},"1":{"FASHION_BRAND":728},"2":{"FASHION_BRAND":728},"3":{"FASHION_BRAND":728},"4":{"FASHION_BRAND":728,"":1},"5":{"":1}}�cfg��neg_key�
tok2vec/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b66007c82528f758a500a10a3004866650950e0822706ba5c5a3ab1c8b037e29
3
  size 34434008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b6a9d1faa8f46d9dd9240faeae4c879ed3d33823052c45a48bdd63d9a72a1f4
3
  size 34434008
vocab/strings.json CHANGED
The diff for this file is too large to render. See raw diff