LM filter with better support for Cyrillic
Browse files
- lm.en +2 -2
- lm.hbs +2 -2
- metadata.yaml +4 -4
lm.en
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a5cb9a347085a461ecd67bb4c6ac6c4dc5a8423a5b6854dac29d72b7faed6a1
|
3 |
+
size 90786329
|
lm.hbs
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e045c50716156ed186865db8874df3a2144e03f55b48fa89343efc47df68678
|
3 |
+
size 343857442
|
metadata.yaml
CHANGED
@@ -10,10 +10,10 @@ porn_removal_side: sl
|
|
10 |
source_lm: lm.en
|
11 |
target_lm: lm.hbs
|
12 |
lm_type: CHARACTER
|
13 |
-
clean_mean_perp: -1.
|
14 |
-
clean_stddev_perp: 0.
|
15 |
-
noisy_mean_perp: -4.
|
16 |
-
noisy_stddev_perp: 0.
|
17 |
classifier_type: xlmr
|
18 |
classifier_settings:
|
19 |
activation: relu
|
|
|
10 |
source_lm: lm.en
|
11 |
target_lm: lm.hbs
|
12 |
lm_type: CHARACTER
|
13 |
+
clean_mean_perp: -1.116365617208272
|
14 |
+
clean_stddev_perp: 0.1687608181840407
|
15 |
+
noisy_mean_perp: -4.013399029709761
|
16 |
+
noisy_stddev_perp: 0.15687448432446158
|
17 |
classifier_type: xlmr
|
18 |
classifier_settings:
|
19 |
activation: relu
|