Commit
·
205ca43
1
Parent(s):
138e6cc
Upload 2 files
Browse files
- config.json +21 -10
- config.yml +31 -10
config.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"train": {
|
3 |
-
"log_interval":
|
4 |
-
"eval_interval":
|
5 |
"seed": 42,
|
6 |
-
"epochs":
|
7 |
"learning_rate": 0.0001,
|
8 |
"betas": [
|
9 |
0.8,
|
@@ -11,14 +11,19 @@
|
|
11 |
],
|
12 |
"eps": 1e-09,
|
13 |
"batch_size": 8,
|
14 |
-
"
|
15 |
"lr_decay": 0.99995,
|
16 |
"segment_size": 16384,
|
17 |
"init_lr_ratio": 1,
|
18 |
"warmup_epochs": 0,
|
19 |
"c_mel": 45,
|
20 |
"c_kl": 1.0,
|
21 |
-
"
|
|
|
|
|
|
|
|
|
|
|
22 |
},
|
23 |
"data": {
|
24 |
"training_files": "Data/glut/filelists/train.list",
|
@@ -32,14 +37,13 @@
|
|
32 |
"mel_fmin": 0.0,
|
33 |
"mel_fmax": null,
|
34 |
"add_blank": true,
|
35 |
-
"n_speakers":
|
36 |
"cleaned_text": true,
|
37 |
"spk2id": {
|
38 |
"16": 0,
|
39 |
"G": 1,
|
40 |
"M": 2,
|
41 |
-
"
|
42 |
-
"Y": 4
|
43 |
}
|
44 |
},
|
45 |
"model": {
|
@@ -94,7 +98,14 @@
|
|
94 |
],
|
95 |
"n_layers_q": 3,
|
96 |
"use_spectral_norm": false,
|
97 |
-
"gin_channels":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
98 |
},
|
99 |
-
"version": "2.
|
100 |
}
|
|
|
1 |
{
|
2 |
"train": {
|
3 |
+
"log_interval": 1000,
|
4 |
+
"eval_interval": 1000,
|
5 |
"seed": 42,
|
6 |
+
"epochs": 10000,
|
7 |
"learning_rate": 0.0001,
|
8 |
"betas": [
|
9 |
0.8,
|
|
|
11 |
],
|
12 |
"eps": 1e-09,
|
13 |
"batch_size": 8,
|
14 |
+
"bf16_run": false,
|
15 |
"lr_decay": 0.99995,
|
16 |
"segment_size": 16384,
|
17 |
"init_lr_ratio": 1,
|
18 |
"warmup_epochs": 0,
|
19 |
"c_mel": 45,
|
20 |
"c_kl": 1.0,
|
21 |
+
"c_commit": 100,
|
22 |
+
"skip_optimizer": true,
|
23 |
+
"freeze_ZH_bert": false,
|
24 |
+
"freeze_JP_bert": false,
|
25 |
+
"freeze_EN_bert": false,
|
26 |
+
"freeze_emo": false
|
27 |
},
|
28 |
"data": {
|
29 |
"training_files": "Data/glut/filelists/train.list",
|
|
|
37 |
"mel_fmin": 0.0,
|
38 |
"mel_fmax": null,
|
39 |
"add_blank": true,
|
40 |
+
"n_speakers": 4,
|
41 |
"cleaned_text": true,
|
42 |
"spk2id": {
|
43 |
"16": 0,
|
44 |
"G": 1,
|
45 |
"M": 2,
|
46 |
+
"Y": 3
|
|
|
47 |
}
|
48 |
},
|
49 |
"model": {
|
|
|
98 |
],
|
99 |
"n_layers_q": 3,
|
100 |
"use_spectral_norm": false,
|
101 |
+
"gin_channels": 512,
|
102 |
+
"slm": {
|
103 |
+
"model": "./slm/wavlm-base-plus",
|
104 |
+
"sr": 16000,
|
105 |
+
"hidden": 768,
|
106 |
+
"nlayers": 13,
|
107 |
+
"initial_channel": 64
|
108 |
+
}
|
109 |
},
|
110 |
+
"version": "2.3"
|
111 |
}
|
config.yml
CHANGED
@@ -3,11 +3,12 @@ bert_gen:
|
|
3 |
device: cuda
|
4 |
num_processes: 2
|
5 |
use_multi_device: false
|
6 |
-
dataset_path: Data
|
7 |
emo_gen:
|
8 |
config_path: config.json
|
9 |
device: cuda
|
10 |
num_processes: 2
|
|
|
11 |
mirror: ''
|
12 |
openi_token: ''
|
13 |
preprocess_text:
|
@@ -18,23 +19,43 @@ preprocess_text:
|
|
18 |
train_path: filelists/train.list
|
19 |
transcription_path: filelists/short_character_anno.list
|
20 |
val_path: filelists/val.list
|
21 |
-
|
22 |
resample:
|
23 |
-
in_dir:
|
24 |
-
out_dir:
|
25 |
sampling_rate: 44100
|
26 |
server:
|
27 |
device: cuda
|
28 |
models:
|
29 |
-
- config:
|
30 |
device: cuda
|
31 |
language: ZH
|
32 |
-
model:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
33 |
speakers: []
|
34 |
port: 5000
|
35 |
train_ms:
|
36 |
base:
|
37 |
-
model_image: "Bert-VITS2_2.
|
38 |
repo_id: Stardust_minus/Bert-VITS2
|
39 |
use_base_model: false
|
40 |
config_path: config.json
|
@@ -46,16 +67,16 @@ train_ms:
|
|
46 |
WORLD_SIZE: 1
|
47 |
keep_ckpts: 10
|
48 |
model: models
|
49 |
-
num_workers:
|
50 |
spec_cache: true
|
51 |
translate:
|
52 |
app_key: ''
|
53 |
secret_key: ''
|
54 |
webui:
|
55 |
-
config_path:
|
56 |
debug: false
|
57 |
device: cuda
|
58 |
language_identification_library: langid
|
59 |
-
model:
|
60 |
port: 7860
|
61 |
share: false
|
|
|
3 |
device: cuda
|
4 |
num_processes: 2
|
5 |
use_multi_device: false
|
6 |
+
dataset_path: Data\glut
|
7 |
emo_gen:
|
8 |
config_path: config.json
|
9 |
device: cuda
|
10 |
num_processes: 2
|
11 |
+
use_multi_device: false
|
12 |
mirror: ''
|
13 |
openi_token: ''
|
14 |
preprocess_text:
|
|
|
19 |
train_path: filelists/train.list
|
20 |
transcription_path: filelists/short_character_anno.list
|
21 |
val_path: filelists/val.list
|
22 |
+
val_per_lang: 4
|
23 |
resample:
|
24 |
+
in_dir: raw
|
25 |
+
out_dir: wavs
|
26 |
sampling_rate: 44100
|
27 |
server:
|
28 |
device: cuda
|
29 |
models:
|
30 |
+
- config: ''
|
31 |
device: cuda
|
32 |
language: ZH
|
33 |
+
model: ''
|
34 |
+
speakers:
|
35 |
+
- length_scale: 1
|
36 |
+
noise_scale: 0.6
|
37 |
+
noise_scale_w: 0.8
|
38 |
+
sdp_ratio: 0.2
|
39 |
+
speaker: "\u79D1\u6BD4"
|
40 |
+
- length_scale: 0.5
|
41 |
+
noise_scale: 0.7
|
42 |
+
noise_scale_w: 0.8
|
43 |
+
sdp_ratio: 0.3
|
44 |
+
speaker: "\u4E94\u6761\u609F"
|
45 |
+
- length_scale: 1.2
|
46 |
+
noise_scale: 0.6
|
47 |
+
noise_scale_w: 0.8
|
48 |
+
sdp_ratio: 0.2
|
49 |
+
speaker: "\u5B89\u500D\u664B\u4E09"
|
50 |
+
- config: ''
|
51 |
+
device: cpu
|
52 |
+
language: JP
|
53 |
+
model: ''
|
54 |
speakers: []
|
55 |
port: 5000
|
56 |
train_ms:
|
57 |
base:
|
58 |
+
model_image: "Bert-VITS2_2.3\u5E95\u6A21"
|
59 |
repo_id: Stardust_minus/Bert-VITS2
|
60 |
use_base_model: false
|
61 |
config_path: config.json
|
|
|
67 |
WORLD_SIZE: 1
|
68 |
keep_ckpts: 10
|
69 |
model: models
|
70 |
+
num_workers: 2
|
71 |
spec_cache: true
|
72 |
translate:
|
73 |
app_key: ''
|
74 |
secret_key: ''
|
75 |
webui:
|
76 |
+
config_path: config.json
|
77 |
debug: false
|
78 |
device: cuda
|
79 |
language_identification_library: langid
|
80 |
+
model: models/G_8000.pth
|
81 |
port: 7860
|
82 |
share: false
|