Xin Zhang committed on
Commit
70b1d55
·
1 Parent(s): 38a440e

[fix]: opt parameter.

Browse files
transcribe/helpers/funasr.py CHANGED
@@ -24,7 +24,7 @@ class FunASR:
24
  def warmup(self, warmup_steps=1):
25
  warmup_soundfile = f"{config.ASSERT_DIR}/jfk.flac"
26
  for _ in range(warmup_steps):
27
- self.model.generate(input=warmup_soundfile)
28
 
29
  def transcribe(self, audio_buffer: bytes, language):
30
  audio_frames = np.frombuffer(audio_buffer, dtype=np.float32)
 
24
  def warmup(self, warmup_steps=1):
25
  warmup_soundfile = f"{config.ASSERT_DIR}/jfk.flac"
26
  for _ in range(warmup_steps):
27
+ self.model.generate(input=warmup_soundfile, disable_pbar=True)
28
 
29
  def transcribe(self, audio_buffer: bytes, language):
30
  audio_frames = np.frombuffer(audio_buffer, dtype=np.float32)
transcribe/pipelines/pipe_vad.py CHANGED
@@ -33,12 +33,12 @@ class VadPipe(BasePipe):
33
  def init(cls):
34
  if cls.vac is None:
35
  cls.vac = FixedVADIterator(
36
- threshold=0.5,
37
  sampling_rate=cls.sample_rate,
38
  # speech_pad_ms=10
39
- min_silence_duration_ms = 100,
40
  # speech_pad_ms = 30,
41
- max_speech_duration_s=20.0,
42
  )
43
  cls.vac.reset_states()
44
 
 
33
  def init(cls):
34
  if cls.vac is None:
35
  cls.vac = FixedVADIterator(
36
+ threshold=0.6,
37
  sampling_rate=cls.sample_rate,
38
  # speech_pad_ms=10
39
+ min_silence_duration_ms = 80,
40
  # speech_pad_ms = 30,
41
+ max_speech_duration_s=25.0,
42
  )
43
  cls.vac.reset_states()
44