HoneyTian committed on
Commit
e38e642
·
1 Parent(s): 25ec0f4
examples/spectrum_dfnet_aishell/run.sh CHANGED
@@ -8,7 +8,7 @@ sh run.sh --stage 2 --stop_stage 2 --system_version windows --file_folder_name f
8
  --speech_dir "E:/programmer/asr_datasets/aishell/data_aishell/wav/train"
9
 
10
 
11
- sh run.sh --stage 1 --stop_stage 3 --system_version centos --file_folder_name file_dir \
12
  --noise_dir "/data/tianxing/HuggingDatasets/nx_noise/data/noise" \
13
  --speech_dir "/data/tianxing/HuggingDatasets/aishell/data_aishell/wav/train"
14
 
 
8
  --speech_dir "E:/programmer/asr_datasets/aishell/data_aishell/wav/train"
9
 
10
 
11
+ sh run.sh --stage 1 --stop_stage 2 --system_version centos --file_folder_name file_dir \
12
  --noise_dir "/data/tianxing/HuggingDatasets/nx_noise/data/noise" \
13
  --speech_dir "/data/tianxing/HuggingDatasets/aishell/data_aishell/wav/train"
14
 
examples/spectrum_dfnet_aishell/step_2_train_model.py CHANGED
@@ -320,7 +320,7 @@ def main():
320
  if torch.any(torch.isnan(lsnr_prediction)) or torch.any(torch.isinf(lsnr_prediction)):
321
  raise AssertionError("nan or inf in lsnr_prediction")
322
 
323
- speech_loss = speech_mse_loss.forward(speech_spec_prediction, speech_complex_spec)
324
  irm_loss = irm_mse_loss.forward(speech_irm_prediction, speech_irm_target)
325
 
326
  lsnr_prediction = (lsnr_prediction - config.lsnr_min) / (config.lsnr_max - config.lsnr_min)
@@ -375,7 +375,7 @@ def main():
375
  if torch.any(torch.isnan(lsnr_prediction)) or torch.any(torch.isinf(lsnr_prediction)):
376
  raise AssertionError("nan or inf in lsnr_prediction")
377
 
378
- speech_loss = speech_mse_loss.forward(speech_spec_prediction, speech_complex_spec)
379
  irm_loss = irm_mse_loss.forward(speech_irm_prediction, speech_irm_target)
380
 
381
  lsnr_prediction = (lsnr_prediction - config.lsnr_min) / (config.lsnr_max - config.lsnr_min)
 
320
  if torch.any(torch.isnan(lsnr_prediction)) or torch.any(torch.isinf(lsnr_prediction)):
321
  raise AssertionError("nan or inf in lsnr_prediction")
322
 
323
+ speech_loss = speech_mse_loss.forward(speech_spec_prediction, torch.view_as_real(speech_complex_spec))
324
  irm_loss = irm_mse_loss.forward(speech_irm_prediction, speech_irm_target)
325
 
326
  lsnr_prediction = (lsnr_prediction - config.lsnr_min) / (config.lsnr_max - config.lsnr_min)
 
375
  if torch.any(torch.isnan(lsnr_prediction)) or torch.any(torch.isinf(lsnr_prediction)):
376
  raise AssertionError("nan or inf in lsnr_prediction")
377
 
378
+ speech_loss = speech_mse_loss.forward(speech_spec_prediction, torch.view_as_real(speech_complex_spec))
379
  irm_loss = irm_mse_loss.forward(speech_irm_prediction, speech_irm_target)
380
 
381
  lsnr_prediction = (lsnr_prediction - config.lsnr_min) / (config.lsnr_max - config.lsnr_min)