Commit
·
cc5b640
1
Parent(s):
54fe850
xx_lat_sigtyp_trf-0.1.0: Update SIGTYP pipeline
Browse files
- .gitattributes +1 -0
- README.md +0 -0
- config.cfg +26 -5
- meta.json +0 -0
- morphologizer/cfg +0 -0
- morphologizer/model +3 -0
- parser/model +1 -1
- tagger/model +1 -1
- trainable_lemmatizer/model +1 -1
- transformer/model +1 -1
- vocab/strings.json +0 -0
- xx_lat_sigtyp_trf-any-py3-none-any.whl +2 -2
.gitattributes
CHANGED
@@ -38,3 +38,4 @@ tagger/model filter=lfs diff=lfs merge=lfs -text
|
|
38 |
trainable_lemmatizer/model filter=lfs diff=lfs merge=lfs -text
|
39 |
transformer/model filter=lfs diff=lfs merge=lfs -text
|
40 |
xx_lat_sigtyp_trf-any-py3-none-any.whl filter=lfs diff=lfs merge=lfs -text
|
|
|
|
38 |
trainable_lemmatizer/model filter=lfs diff=lfs merge=lfs -text
|
39 |
transformer/model filter=lfs diff=lfs merge=lfs -text
|
40 |
xx_lat_sigtyp_trf-any-py3-none-any.whl filter=lfs diff=lfs merge=lfs -text
|
41 |
+
morphologizer/model filter=lfs diff=lfs merge=lfs -text
|
README.md
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
config.cfg
CHANGED
@@ -10,7 +10,7 @@ seed = 42
|
|
10 |
|
11 |
[nlp]
|
12 |
lang = "xx"
|
13 |
-
pipeline = ["transformer","parser","trainable_lemmatizer","tagger"]
|
14 |
batch_size = 128
|
15 |
disabled = []
|
16 |
before_creation = null
|
@@ -20,6 +20,24 @@ tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
|
|
20 |
|
21 |
[components]
|
22 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
23 |
[components.parser]
|
24 |
factory = "parser"
|
25 |
learn_tokens = false
|
@@ -166,14 +184,17 @@ total_steps = 20000
|
|
166 |
initial_rate = 0.00005
|
167 |
|
168 |
[training.score_weights]
|
169 |
-
dep_uas = 0.
|
170 |
-
dep_las = 0.
|
171 |
dep_las_per_type = null
|
172 |
sents_p = null
|
173 |
sents_r = null
|
174 |
sents_f = 0.0
|
175 |
-
lemma_acc = 0.
|
176 |
-
tag_acc = 0.
|
|
|
|
|
|
|
177 |
|
178 |
[pretraining]
|
179 |
|
|
|
10 |
|
11 |
[nlp]
|
12 |
lang = "xx"
|
13 |
+
pipeline = ["transformer","parser","trainable_lemmatizer","tagger","morphologizer"]
|
14 |
batch_size = 128
|
15 |
disabled = []
|
16 |
before_creation = null
|
|
|
20 |
|
21 |
[components]
|
22 |
|
23 |
+
[components.morphologizer]
|
24 |
+
factory = "morphologizer"
|
25 |
+
extend = false
|
26 |
+
label_smoothing = 0.0
|
27 |
+
overwrite = true
|
28 |
+
scorer = {"@scorers":"spacy.morphologizer_scorer.v1"}
|
29 |
+
|
30 |
+
[components.morphologizer.model]
|
31 |
+
@architectures = "spacy.Tagger.v2"
|
32 |
+
nO = null
|
33 |
+
normalize = false
|
34 |
+
|
35 |
+
[components.morphologizer.model.tok2vec]
|
36 |
+
@architectures = "spacy-transformers.TransformerListener.v1"
|
37 |
+
grad_factor = 1.0
|
38 |
+
pooling = {"@layers":"reduce_mean.v1"}
|
39 |
+
upstream = "*"
|
40 |
+
|
41 |
[components.parser]
|
42 |
factory = "parser"
|
43 |
learn_tokens = false
|
|
|
184 |
initial_rate = 0.00005
|
185 |
|
186 |
[training.score_weights]
|
187 |
+
dep_uas = 0.09
|
188 |
+
dep_las = 0.09
|
189 |
dep_las_per_type = null
|
190 |
sents_p = null
|
191 |
sents_r = null
|
192 |
sents_f = 0.0
|
193 |
+
lemma_acc = 0.17
|
194 |
+
tag_acc = 0.17
|
195 |
+
pos_acc = 0.25
|
196 |
+
morph_acc = 0.25
|
197 |
+
morph_per_feat = null
|
198 |
|
199 |
[pretraining]
|
200 |
|
meta.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
morphologizer/cfg
ADDED
The diff for this file is too large to render.
See raw diff
|
|
morphologizer/model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e17232f72d41fdff156322d38848fad7948d5f736edaeb27ca30c4105d6dbef2
|
3 |
+
size 5116041
|
parser/model
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 2154847
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f21f9493a033fd19f752a78a88d818a78106c0b62d5435cb6b300c95527583f
|
3 |
size 2154847
|
tagger/model
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6118817
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fb204326ce7026eb93ade2c6cbf518a1fd60ace6cea1eb4de4016e7f2f1815a
|
3 |
size 6118817
|
trainable_lemmatizer/model
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6198793
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9387a348c02480592fc7a9e22b9c0e0b0db95c24d613e0f856f113f331a7341f
|
3 |
size 6198793
|
transformer/model
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 509231398
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:becd68d4f609e09647aaed12231187830a70bbfe54dbcb2a279fc3327740711a
|
3 |
size 509231398
|
vocab/strings.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
xx_lat_sigtyp_trf-any-py3-none-any.whl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c7cc2a3c07822a503dccbd42c0ec077f071da03fda6b0e69c9879d7a16e2def
|
3 |
+
size 484531034
|