Spaces:
Running
Running
update
Browse files
- examples/dfnet2/run.sh +4 -0
- examples/dtln/run.sh +6 -0
- examples/dtln/yaml/config-1024.yaml +29 -0
- examples/frcrn/run.sh +5 -0
- examples/frcrn/yaml/config-10.yaml +1 -1
- main.py +18 -6
examples/dfnet2/run.sh
CHANGED
@@ -10,6 +10,10 @@ sh run.sh --stage 2 --stop_stage 2 --system_version centos --file_folder_name fi
|
|
10 |
--noise_dir "/data/tianxing/HuggingDatasets/nx_noise/data/noise" \
|
11 |
--speech_dir "/data/tianxing/HuggingDatasets/nx_noise/data/speech/dns3-speech"
|
12 |
|
|
|
|
|
|
|
|
|
13 |
|
14 |
END
|
15 |
|
|
|
10 |
--noise_dir "/data/tianxing/HuggingDatasets/nx_noise/data/noise" \
|
11 |
--speech_dir "/data/tianxing/HuggingDatasets/nx_noise/data/speech/dns3-speech"
|
12 |
|
13 |
+
sh run.sh --stage 1 --stop_stage 2 --system_version centos --file_folder_name file_dir --final_model_name dfnet2-nx-devoice \
|
14 |
+
--noise_dir "/data/tianxing/HuggingDatasets/nx_noise/data/speech/nx-speech" \
|
15 |
+
--speech_dir "/data/tianxing/HuggingDatasets/nx_noise/data/noise/nx-noise"
|
16 |
+
|
17 |
|
18 |
END
|
19 |
|
examples/dtln/run.sh
CHANGED
@@ -13,6 +13,12 @@ sh run.sh --stage 1 --stop_stage 2 --system_version centos --file_folder_name fi
|
|
13 |
--speech_dir "/data/tianxing/HuggingDatasets/nx_noise/data/speech/dns3-speech"
|
14 |
|
15 |
|
|
|
|
|
|
|
|
|
|
|
|
|
16 |
END
|
17 |
|
18 |
|
|
|
13 |
--speech_dir "/data/tianxing/HuggingDatasets/nx_noise/data/speech/dns3-speech"
|
14 |
|
15 |
|
16 |
+
sh run.sh --stage 1 --stop_stage 2 --system_version centos --file_folder_name file_dir-1024 --final_model_name dtln-1024-nx \
|
17 |
+
--config_file "yaml/config-1024.yaml" \
|
18 |
+
--noise_dir "/data/tianxing/HuggingDatasets/nx_noise/data/noise/nx-noise" \
|
19 |
+
--speech_dir "/data/tianxing/HuggingDatasets/nx_noise/data/speech/nx-speech"
|
20 |
+
|
21 |
+
|
22 |
END
|
23 |
|
24 |
|
examples/dtln/yaml/config-1024.yaml
ADDED
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
model_name: "DTLN"
|
2 |
+
|
3 |
+
# spec
|
4 |
+
sample_rate: 8000
|
5 |
+
fft_size: 512
|
6 |
+
hop_size: 128
|
7 |
+
win_type: hann
|
8 |
+
|
9 |
+
# data
|
10 |
+
max_snr_db: 20
|
11 |
+
min_snr_db: -10
|
12 |
+
|
13 |
+
# model
|
14 |
+
encoder_size: 1024
|
15 |
+
|
16 |
+
# train
|
17 |
+
lr: 0.001
|
18 |
+
lr_scheduler: "CosineAnnealingLR"
|
19 |
+
lr_scheduler_kwargs:
|
20 |
+
T_max: 250000
|
21 |
+
eta_min: 0.0001
|
22 |
+
|
23 |
+
max_epochs: 100
|
24 |
+
clip_grad_norm: 10.0
|
25 |
+
seed: 1234
|
26 |
+
|
27 |
+
num_workers: 4
|
28 |
+
batch_size: 64
|
29 |
+
eval_steps: 15000
|
examples/frcrn/run.sh
CHANGED
@@ -9,6 +9,11 @@ sh run.sh --stage 1 --stop_stage 2 --system_version centos --file_folder_name fi
|
|
9 |
--speech_dir "/data/tianxing/HuggingDatasets/nx_noise/data/speech"
|
10 |
|
11 |
|
|
|
|
|
|
|
|
|
|
|
12 |
END
|
13 |
|
14 |
|
|
|
9 |
--speech_dir "/data/tianxing/HuggingDatasets/nx_noise/data/speech"
|
10 |
|
11 |
|
12 |
+
sh run.sh --stage 1 --stop_stage 2 --system_version centos --file_folder_name file_dir --final_model_name frcrn-10-nx-devoice \
|
13 |
+
--config_file "yaml/config-10.yaml" \
|
14 |
+
--noise_dir "/data/tianxing/HuggingDatasets/nx_noise/data/speech/nx-speech" \
|
15 |
+
--speech_dir "/data/tianxing/HuggingDatasets/nx_noise/data/noise/nx-noise"
|
16 |
+
|
17 |
END
|
18 |
|
19 |
|
examples/frcrn/yaml/config-10.yaml
CHANGED
@@ -16,7 +16,7 @@ max_snr_db: 20
|
|
16 |
|
17 |
num_workers: 8
|
18 |
batch_size: 32
|
19 |
-
eval_steps:
|
20 |
|
21 |
lr: 0.001
|
22 |
lr_scheduler: "CosineAnnealingLR"
|
|
|
16 |
|
17 |
num_workers: 8
|
18 |
batch_size: 32
|
19 |
+
eval_steps: 20000
|
20 |
|
21 |
lr: 0.001
|
22 |
lr_scheduler: "CosineAnnealingLR"
|
main.py
CHANGED
@@ -102,16 +102,28 @@ denoise_engines = {
|
|
102 |
"pretrained_model_path_or_zip_file": (project_path / "trained_models/dfnet2-nx-dns3.zip").as_posix()
|
103 |
}
|
104 |
},
|
105 |
-
"frcrn-dns3": {
|
106 |
"infer_cls": InferenceFRCRN,
|
107 |
"kwargs": {
|
108 |
-
"pretrained_model_path_or_zip_file": (project_path / "trained_models/frcrn-dns3.zip").as_posix()
|
109 |
}
|
110 |
},
|
111 |
-
"mpnet-nx
|
112 |
"infer_cls": InferenceMPNet,
|
113 |
"kwargs": {
|
114 |
-
"pretrained_model_path_or_zip_file": (project_path / "trained_models/mpnet-nx
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
115 |
}
|
116 |
},
|
117 |
}
|
@@ -277,8 +289,8 @@ def main():
|
|
277 |
# http://127.0.0.1:7865/
|
278 |
# http://10.75.27.247:7865/
|
279 |
blocks.queue().launch(
|
280 |
-
|
281 |
-
share=False if platform.system() == "Windows" else False,
|
282 |
server_name="127.0.0.1" if platform.system() == "Windows" else "0.0.0.0",
|
283 |
server_port=args.server_port
|
284 |
)
|
|
|
102 |
"pretrained_model_path_or_zip_file": (project_path / "trained_models/dfnet2-nx-dns3.zip").as_posix()
|
103 |
}
|
104 |
},
|
105 |
+
"frcrn-10-dns3": {
|
106 |
"infer_cls": InferenceFRCRN,
|
107 |
"kwargs": {
|
108 |
+
"pretrained_model_path_or_zip_file": (project_path / "trained_models/frcrn-10-dns3.zip").as_posix()
|
109 |
}
|
110 |
},
|
111 |
+
"mpnet-nx": {
|
112 |
"infer_cls": InferenceMPNet,
|
113 |
"kwargs": {
|
114 |
+
"pretrained_model_path_or_zip_file": (project_path / "trained_models/mpnet-nx.zip").as_posix()
|
115 |
+
}
|
116 |
+
},
|
117 |
+
"dfnet2-nx-devoice": {
|
118 |
+
"infer_cls": InferenceDfNet2,
|
119 |
+
"kwargs": {
|
120 |
+
"pretrained_model_path_or_zip_file": (project_path / "trained_models/dfnet2-nx-devoice.zip").as_posix()
|
121 |
+
}
|
122 |
+
},
|
123 |
+
"frcrn-10-nx-devoice": {
|
124 |
+
"infer_cls": InferenceFRCRN,
|
125 |
+
"kwargs": {
|
126 |
+
"pretrained_model_path_or_zip_file": (project_path / "trained_models/frcrn-10-nx-devoice.zip").as_posix()
|
127 |
}
|
128 |
},
|
129 |
}
|
|
|
289 |
# http://127.0.0.1:7865/
|
290 |
# http://10.75.27.247:7865/
|
291 |
blocks.queue().launch(
|
292 |
+
share=True,
|
293 |
+
# share=False if platform.system() == "Windows" else False,
|
294 |
server_name="127.0.0.1" if platform.system() == "Windows" else "0.0.0.0",
|
295 |
server_port=args.server_port
|
296 |
)
|