kevinwang676 committed on
Commit
dc3921c
·
verified ·
1 Parent(s): 3fba2c5

Update GPT_SoVITS/TTS_infer_pack/TTS.py

Browse files
Files changed (1) hide show
  1. GPT_SoVITS/TTS_infer_pack/TTS.py +4 -4
GPT_SoVITS/TTS_infer_pack/TTS.py CHANGED
@@ -287,7 +287,7 @@ class TTS_Config:
287
  configs: dict = self._load_configs(self.configs_path)
288
 
289
  assert isinstance(configs, dict)
290
- version = configs.get("version", "v2").lower()
291
  assert version in ["v1", "v2", "v3", "v4"]
292
  self.default_configs[version] = configs.get(version, self.default_configs[version])
293
  self.configs: dict = configs.get("custom", deepcopy(self.default_configs[version]))
@@ -369,7 +369,7 @@ class TTS_Config:
369
  return self.config
370
 
371
  def update_version(self, version: str) -> None:
372
- self.version = version
373
  self.languages = self.v1_languages if self.version == "v1" else self.v2_languages
374
 
375
  def __str__(self):
@@ -747,8 +747,8 @@ class TTS:
747
  )
748
  with torch.no_grad():
749
  wav16k, sr = librosa.load(ref_wav_path, sr=16000)
750
- if wav16k.shape[0] > 160000 or wav16k.shape[0] < 48000:
751
- raise OSError(i18n("参考音频在3~10秒范围外,请更换!"))
752
  wav16k = torch.from_numpy(wav16k)
753
  zero_wav_torch = torch.from_numpy(zero_wav)
754
  wav16k = wav16k.to(self.configs.device)
 
287
  configs: dict = self._load_configs(self.configs_path)
288
 
289
  assert isinstance(configs, dict)
290
+ version = "v2" #configs.get("version", "v4").lower() # 使用 v4
291
  assert version in ["v1", "v2", "v3", "v4"]
292
  self.default_configs[version] = configs.get(version, self.default_configs[version])
293
  self.configs: dict = configs.get("custom", deepcopy(self.default_configs[version]))
 
369
  return self.config
370
 
371
  def update_version(self, version: str) -> None:
372
+ self.version = "v2"#version
373
  self.languages = self.v1_languages if self.version == "v1" else self.v2_languages
374
 
375
  def __str__(self):
 
747
  )
748
  with torch.no_grad():
749
  wav16k, sr = librosa.load(ref_wav_path, sr=16000)
750
+ if wav16k.shape[0] > 240000 or wav16k.shape[0] < 48000:
751
+ raise OSError(i18n("参考音频在3~15秒范围外,请更换!"))
752
  wav16k = torch.from_numpy(wav16k)
753
  zero_wav_torch = torch.from_numpy(zero_wav)
754
  wav16k = wav16k.to(self.configs.device)