Commit
·
9603349
1
Parent(s):
390dd19
xx_chu_sigtyp_trf-0.1.0: Update SIGTYP pipeline
Browse files- .gitattributes +1 -0
- README.md +0 -0
- config.cfg +26 -5
- meta.json +0 -0
- morphologizer/cfg +0 -0
- morphologizer/model +3 -0
- parser/model +1 -1
- tagger/model +1 -1
- trainable_lemmatizer/model +1 -1
- transformer/model +1 -1
- vocab/strings.json +0 -0
- xx_chu_sigtyp_trf-any-py3-none-any.whl +2 -2
.gitattributes
CHANGED
@@ -39,3 +39,4 @@ trainable_lemmatizer/model filter=lfs diff=lfs merge=lfs -text
|
|
39 |
trainable_lemmatizer/trees filter=lfs diff=lfs merge=lfs -text
|
40 |
transformer/model filter=lfs diff=lfs merge=lfs -text
|
41 |
xx_chu_sigtyp_trf-any-py3-none-any.whl filter=lfs diff=lfs merge=lfs -text
|
|
|
|
39 |
trainable_lemmatizer/trees filter=lfs diff=lfs merge=lfs -text
|
40 |
transformer/model filter=lfs diff=lfs merge=lfs -text
|
41 |
xx_chu_sigtyp_trf-any-py3-none-any.whl filter=lfs diff=lfs merge=lfs -text
|
42 |
+
morphologizer/model filter=lfs diff=lfs merge=lfs -text
|
README.md
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
config.cfg
CHANGED
@@ -10,7 +10,7 @@ seed = 42
|
|
10 |
|
11 |
[nlp]
|
12 |
lang = "xx"
|
13 |
-
pipeline = ["transformer","parser","trainable_lemmatizer","tagger"]
|
14 |
batch_size = 128
|
15 |
disabled = []
|
16 |
before_creation = null
|
@@ -20,6 +20,24 @@ tokenizer = {"@tokenizers":"spacy.Tokenizer.v1"}
|
|
20 |
|
21 |
[components]
|
22 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
23 |
[components.parser]
|
24 |
factory = "parser"
|
25 |
learn_tokens = false
|
@@ -166,14 +184,17 @@ total_steps = 20000
|
|
166 |
initial_rate = 0.00005
|
167 |
|
168 |
[training.score_weights]
|
169 |
-
dep_uas = 0.
|
170 |
-
dep_las = 0.
|
171 |
dep_las_per_type = null
|
172 |
sents_p = null
|
173 |
sents_r = null
|
174 |
sents_f = 0.0
|
175 |
-
lemma_acc = 0.
|
176 |
-
tag_acc = 0.
|
|
|
|
|
|
|
177 |
|
178 |
[pretraining]
|
179 |
|
|
|
10 |
|
11 |
[nlp]
|
12 |
lang = "xx"
|
13 |
+
pipeline = ["transformer","parser","trainable_lemmatizer","tagger","morphologizer"]
|
14 |
batch_size = 128
|
15 |
disabled = []
|
16 |
before_creation = null
|
|
|
20 |
|
21 |
[components]
|
22 |
|
23 |
+
[components.morphologizer]
|
24 |
+
factory = "morphologizer"
|
25 |
+
extend = false
|
26 |
+
label_smoothing = 0.0
|
27 |
+
overwrite = true
|
28 |
+
scorer = {"@scorers":"spacy.morphologizer_scorer.v1"}
|
29 |
+
|
30 |
+
[components.morphologizer.model]
|
31 |
+
@architectures = "spacy.Tagger.v2"
|
32 |
+
nO = null
|
33 |
+
normalize = false
|
34 |
+
|
35 |
+
[components.morphologizer.model.tok2vec]
|
36 |
+
@architectures = "spacy-transformers.TransformerListener.v1"
|
37 |
+
grad_factor = 1.0
|
38 |
+
pooling = {"@layers":"reduce_mean.v1"}
|
39 |
+
upstream = "*"
|
40 |
+
|
41 |
[components.parser]
|
42 |
factory = "parser"
|
43 |
learn_tokens = false
|
|
|
184 |
initial_rate = 0.00005
|
185 |
|
186 |
[training.score_weights]
|
187 |
+
dep_uas = 0.09
|
188 |
+
dep_las = 0.09
|
189 |
dep_las_per_type = null
|
190 |
sents_p = null
|
191 |
sents_r = null
|
192 |
sents_f = 0.0
|
193 |
+
lemma_acc = 0.17
|
194 |
+
tag_acc = 0.17
|
195 |
+
pos_acc = 0.25
|
196 |
+
morph_acc = 0.25
|
197 |
+
morph_per_feat = null
|
198 |
|
199 |
[pretraining]
|
200 |
|
meta.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
morphologizer/cfg
ADDED
The diff for this file is too large to render.
See raw diff
|
|
morphologizer/model
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee18d9e2fee857cbcb3646853ac3e612c081eb47f5162220b0e06cd8f18c2e44
|
3 |
+
size 4863809
|
parser/model
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1671399
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:746cdd1ebc50893d15755216f2f3b29c8e51bfeca1af9fa69ec463995e653485
|
3 |
size 1671399
|
tagger/model
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4371649
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:73797d3ec2cdc3e15679d0648bfdd84b4bf9cb0601bca705587c3dfa4f5135c9
|
3 |
size 4371649
|
trainable_lemmatizer/model
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14165633
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0586b97d9c4cf54dbf303e606846465c93717e8093224a25b79e7a6c4739aecb
|
3 |
size 14165633
|
transformer/model
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 509231398
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dfdbc753160505ac9498b68655f666df4c225aaba0e6786b91f3f45a3433d809
|
3 |
size 509231398
|
vocab/strings.json
CHANGED
The diff for this file is too large to render.
See raw diff
|
|
xx_chu_sigtyp_trf-any-py3-none-any.whl
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5adf07c03fad400227f49547260c81222a70035e6fdd3d5dfe675025cbda7552
|
3 |
+
size 490013884
|