HoneyTian committed on
Commit
c37a8f9
·
1 Parent(s): deadd6d
examples/nx_clean_unet/run.sh CHANGED
@@ -12,10 +12,10 @@ sh run.sh --stage 3 --stop_stage 3 --system_version centos --file_folder_name fi
12
  --noise_dir "/data/tianxing/HuggingDatasets/nx_noise/data/noise" \
13
  --speech_dir "/data/tianxing/HuggingDatasets/aishell/data_aishell/wav/train"
14
 
15
- sh run.sh --stage 2 --stop_stage 2 --system_version centos --file_folder_name file_dir --final_model_name mpnet-aishell-20250224 \
16
  --noise_dir "/data/tianxing/HuggingDatasets/nx_noise/data/noise" \
17
  --speech_dir "/data/tianxing/HuggingDatasets/aishell/data_aishell/wav/train" \
18
- --max_epochs 100 --max_count 10000
19
 
20
 
21
  sh run.sh --stage 1 --stop_stage 2 --system_version centos --file_folder_name file_dir --final_model_name mpnet-nx-speech-20250224 \
 
12
  --noise_dir "/data/tianxing/HuggingDatasets/nx_noise/data/noise" \
13
  --speech_dir "/data/tianxing/HuggingDatasets/aishell/data_aishell/wav/train"
14
 
15
+ sh run.sh --stage 1 --stop_stage 2 --system_version centos --file_folder_name file_dir --final_model_name nx-clean-unet-aishell-20250228 \
16
  --noise_dir "/data/tianxing/HuggingDatasets/nx_noise/data/noise" \
17
  --speech_dir "/data/tianxing/HuggingDatasets/aishell/data_aishell/wav/train" \
18
+ --max_epochs 100
19
 
20
 
21
  sh run.sh --stage 1 --stop_stage 2 --system_version centos --file_folder_name file_dir --final_model_name mpnet-nx-speech-20250224 \
examples/nx_clean_unet/yaml/config.yaml CHANGED
@@ -6,14 +6,14 @@ n_fft: 512
6
  win_size: 200
7
  hop_size: 80
8
 
9
- down_sampling_num_layers: 5
10
  down_sampling_in_channels: 1
11
  down_sampling_hidden_channels: 64
12
  down_sampling_kernel_size: 4
13
  down_sampling_stride: 2
14
 
15
- tsfm_hidden_size: 512
16
- tsfm_attention_heads: 8
17
  tsfm_num_blocks: 6
18
  tsfm_dropout_rate: 0.1
19
  tsfm_max_length: 1024
 
6
  win_size: 200
7
  hop_size: 80
8
 
9
+ down_sampling_num_layers: 6
10
  down_sampling_in_channels: 1
11
  down_sampling_hidden_channels: 64
12
  down_sampling_kernel_size: 4
13
  down_sampling_stride: 2
14
 
15
+ tsfm_hidden_size: 2048
16
+ tsfm_attention_heads: 12
17
  tsfm_num_blocks: 6
18
  tsfm_dropout_rate: 0.1
19
  tsfm_max_length: 1024
toolbox/torchaudio/models/nx_clean_unet/modeling_nx_clean_unet.py CHANGED
@@ -329,4 +329,4 @@ def main():
329
 
330
 
331
  if __name__ == "__main__":
332
- main()
 
329
 
330
 
331
  if __name__ == "__main__":
332
+ main2()