Xin Zhang
committed on
Commit
·
70b1d55
1
Parent(s):
38a440e
[fix]: opt parameter.
Browse files
transcribe/helpers/funasr.py
CHANGED
@@ -24,7 +24,7 @@ class FunASR:
|
|
24 |
def warmup(self, warmup_steps=1):
|
25 |
warmup_soundfile = f"{config.ASSERT_DIR}/jfk.flac"
|
26 |
for _ in range(warmup_steps):
|
27 |
-
self.model.generate(input=warmup_soundfile)
|
28 |
|
29 |
def transcribe(self, audio_buffer: bytes, language):
|
30 |
audio_frames = np.frombuffer(audio_buffer, dtype=np.float32)
|
|
|
24 |
def warmup(self, warmup_steps=1):
|
25 |
warmup_soundfile = f"{config.ASSERT_DIR}/jfk.flac"
|
26 |
for _ in range(warmup_steps):
|
27 |
+
self.model.generate(input=warmup_soundfile, disable_pbar=True)
|
28 |
|
29 |
def transcribe(self, audio_buffer: bytes, language):
|
30 |
audio_frames = np.frombuffer(audio_buffer, dtype=np.float32)
|
transcribe/pipelines/pipe_vad.py
CHANGED
@@ -33,12 +33,12 @@ class VadPipe(BasePipe):
|
|
33 |
def init(cls):
|
34 |
if cls.vac is None:
|
35 |
cls.vac = FixedVADIterator(
|
36 |
-
threshold=0.
|
37 |
sampling_rate=cls.sample_rate,
|
38 |
# speech_pad_ms=10
|
39 |
-
min_silence_duration_ms =
|
40 |
# speech_pad_ms = 30,
|
41 |
-
max_speech_duration_s=
|
42 |
)
|
43 |
cls.vac.reset_states()
|
44 |
|
|
|
33 |
def init(cls):
|
34 |
if cls.vac is None:
|
35 |
cls.vac = FixedVADIterator(
|
36 |
+
threshold=0.6,
|
37 |
sampling_rate=cls.sample_rate,
|
38 |
# speech_pad_ms=10
|
39 |
+
min_silence_duration_ms = 80,
|
40 |
# speech_pad_ms = 30,
|
41 |
+
max_speech_duration_s=25.0,
|
42 |
)
|
43 |
cls.vac.reset_states()
|
44 |
|