Upload modelcfg.yaml
Browse files- modelcfg.yaml +5 -27
modelcfg.yaml
CHANGED
@@ -20,41 +20,21 @@ model:
|
|
20 |
- 9
|
21 |
- 1
|
22 |
dropout: 0.2
|
|
|
23 |
n_head: 2
|
24 |
n_layers: 6
|
25 |
scln: true
|
26 |
emb_dim: 512
|
27 |
emb_reduction: 1
|
28 |
encoder:
|
29 |
-
depth: 2
|
30 |
-
expansion: 2
|
31 |
fs2_dropout: 0.2
|
32 |
fs2_head: 2
|
33 |
fs2_layer: 4
|
34 |
-
kernel_size: 5
|
35 |
-
kind: fastspeech2
|
36 |
-
n_heads: 2
|
37 |
-
ve_energy_quantization: linear
|
38 |
ve_n_bins: 256
|
39 |
-
ve_pitch_quantization: linear
|
40 |
vp_dropout: 0.5
|
41 |
vp_filter_size: 256
|
42 |
vp_kernel_size: 3
|
43 |
-
gst:
|
44 |
-
n_heads: 8
|
45 |
-
n_style_tokens: 2000
|
46 |
-
ref_enc_filters:
|
47 |
-
- 32
|
48 |
-
- 32
|
49 |
-
- 64
|
50 |
-
- 64
|
51 |
-
- 128
|
52 |
-
- 128
|
53 |
max_seq_len: 1500
|
54 |
-
postnet:
|
55 |
-
postnet_embedding_dim: 0
|
56 |
-
postnet_kernel_size: 5
|
57 |
-
postnet_n_convolutions: 5
|
58 |
punct_emb_dim: 16
|
59 |
resnet:
|
60 |
encoder_type: ASP
|
@@ -68,10 +48,8 @@ model:
|
|
68 |
- 64
|
69 |
- 128
|
70 |
- 256
|
71 |
-
spkemb:
|
72 |
-
kind: ResNetSE34V2
|
73 |
stats:
|
74 |
-
energy_max:
|
75 |
-
energy_min: -2.
|
76 |
-
pitch_max:
|
77 |
-
pitch_min:
|
|
|
20 |
- 9
|
21 |
- 1
|
22 |
dropout: 0.2
|
23 |
+
kind: styletts
|
24 |
n_head: 2
|
25 |
n_layers: 6
|
26 |
scln: true
|
27 |
emb_dim: 512
|
28 |
emb_reduction: 1
|
29 |
encoder:
|
|
|
|
|
30 |
fs2_dropout: 0.2
|
31 |
fs2_head: 2
|
32 |
fs2_layer: 4
|
|
|
|
|
|
|
|
|
33 |
ve_n_bins: 256
|
|
|
34 |
vp_dropout: 0.5
|
35 |
vp_filter_size: 256
|
36 |
vp_kernel_size: 3
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
37 |
max_seq_len: 1500
|
|
|
|
|
|
|
|
|
38 |
punct_emb_dim: 16
|
39 |
resnet:
|
40 |
encoder_type: ASP
|
|
|
48 |
- 64
|
49 |
- 128
|
50 |
- 256
|
|
|
|
|
51 |
stats:
|
52 |
+
energy_max: 493.5418701171875
|
53 |
+
energy_min: -2.139316514718655
|
54 |
+
pitch_max: 883.609245028834
|
55 |
+
pitch_min: 57.520125416548694
|