Update README.md
Browse files
README.md
CHANGED
@@ -3,10 +3,10 @@ language:
|
|
3 |
- ca
|
4 |
- es
|
5 |
- en
|
|
|
6 |
tags:
|
7 |
-
|
8 |
---
|
9 |
-
|
10 |
### Preprocessing
|
11 |
1. Normalisation and tokenisation with moses scripts
|
12 |
2. truecased with model docgWP.tcmodel.[LAN] and moses scripts
|
@@ -23,6 +23,52 @@ tags:
|
|
23 |
- Finetuned with 1.5M real parallel data (without backtranslations)
|
24 |
|
25 |
### Model
|
26 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
27 |
|
28 |
-
## Benchmark
|
|
|
3 |
- ca
|
4 |
- es
|
5 |
- en
|
6 |
+
|
7 |
tags:
|
8 |
+
- translation
|
9 |
---
|
|
|
10 |
### Preprocessing
|
11 |
1. Normalisation and tokenisation with moses scripts
|
12 |
2. truecased with model docgWP.tcmodel.[LAN] and moses scripts
|
|
|
23 |
- Finetuned with 1.5M real parallel data (without backtranslations)
|
24 |
|
25 |
### Model
|
26 |
+
Transformer big with guided alignments. Relevant parameters:
|
27 |
+
|
28 |
+
--beam-size 6
|
29 |
+
|
30 |
+
--normalize 0.6
|
31 |
+
|
32 |
+
--enc-depth 6 --dec-depth 6 --transformer-heads 8
|
33 |
+
|
34 |
+
--transformer-preprocess n --transformer-postprocess da
|
35 |
+
|
36 |
+
--transformer-dropout 0.1
|
37 |
+
|
38 |
+
--label-smoothing 0.1
|
39 |
+
|
40 |
+
--dim-emb 1024 --transformer-dim-ffn 4096
|
41 |
+
|
42 |
+
--transformer-dropout-attention 0.1
|
43 |
+
|
44 |
+
--transformer-dropout-ffn 0.1
|
45 |
+
|
46 |
+
--learn-rate 0.00015 --lr-warmup 8000 --lr-decay-inv-sqrt 8000
|
47 |
+
|
48 |
+
--optimizer-params 0.9 0.998 1e-09
|
49 |
+
|
50 |
+
--clip-norm 5
|
51 |
+
|
52 |
+
--tied-embeddings
|
53 |
+
|
54 |
+
--exponential-smoothing
|
55 |
+
|
56 |
+
--transformer-guided-alignment-layer 1 --guided-alignment-cost mse --guided-alignment-weight 0.1
|
57 |
+
|
58 |
+
|
59 |
+
## Evaluation
|
60 |
+
|
61 |
+
### Test set
|
62 |
+
|
63 |
+
https://github.com/PLXIV/Gebiotoolkit/tree/master/gebiocorpus_v2
|
64 |
+
|
65 |
+
### ca2en
|
66 |
+
BLEU|#:1|bs:1000|rs:12345|c:mixed|e:no|tok:13a|s:exp|v:2.0.0 = 47.8 (μ = 47.8 ± 0.9)
|
67 |
+
|
68 |
+
chrF2|#:1|bs:1000|rs:12345|c:mixed|e:yes|nc:6|nw:0|s:no|v:2.0.0 = 69.9 (μ = 69.9 ± 0.7)
|
69 |
+
|
70 |
+
### es2ca
|
71 |
+
BLEU|#:1|bs:1000|rs:12345|c:mixed|e:no|tok:13a|s:exp|v:2.0.0 = 48.9 (μ = 48.9 ± 0.9)
|
72 |
+
|
73 |
+
chrF2|#:1|bs:1000|rs:12345|c:mixed|e:yes|nc:6|nw:0|s:no|v:2.0.0 = 70.5 (μ = 70.5 ± 0.7)
|
74 |
|
|