Fix the 'transcrible' naming error: rename every occurrence to 'transcribe'

Files changed (4)

api_model.py CHANGED Viewed

@@ -18,9 +18,9 @@ class TransResult(BaseModel):
 class DebugResult(BaseModel):
     # trans_pattern: str
     seg_id: int
-    transcrible_time: float
     translate_time:float
-    context: str = Field(alias="transcribleContent")
     from_: str = Field(alias="from")
     to: str
     tran_content: str = Field(alias="translateContent")

 class DebugResult(BaseModel):
     # trans_pattern: str
     seg_id: int
+    transcribe_time: float
     translate_time:float
+    context: str = Field(alias="transcribeContent")
     from_: str = Field(alias="from")
     to: str
     tran_content: str = Field(alias="translateContent")

transcribe/translatepipes.py CHANGED Viewed

@@ -47,7 +47,7 @@ class TranslatePipes:
             return self._funasr_pipe
         return self._whisper_pipe_en
-    def transcrible(self, audio_buffer: bytes, src_lang: str) -> MetaItem:
         transcription_model = self.get_transcription_model(src_lang)
         item = MetaItem(audio=audio_buffer, source_language=src_lang)
         transcription_model.input_queue.put(item)
@@ -65,6 +65,6 @@ if __name__ == "__main__":
     tp = TranslatePipes()
     # result = tp.translate("你好，今天天气怎么样?", src_lang="zh", dst_lang="en")
     mel, _, = soundfile.read("assets/jfk.flac")
-    # result = tp.transcrible(mel, 'en')
     result = tp.voice_detect(mel)
     print(result)

             return self._funasr_pipe
         return self._whisper_pipe_en
+    def transcribe(self, audio_buffer: bytes, src_lang: str) -> MetaItem:
         transcription_model = self.get_transcription_model(src_lang)
         item = MetaItem(audio=audio_buffer, source_language=src_lang)
         transcription_model.input_queue.put(item)
     tp = TranslatePipes()
     # result = tp.translate("你好，今天天气怎么样?", src_lang="zh", dst_lang="en")
     mel, _, = soundfile.read("assets/jfk.flac")
+    # result = tp.transcribe(mel, 'en')
     result = tp.voice_detect(mel)
     print(result)

transcribe/utils.py CHANGED Viewed

@@ -157,8 +157,8 @@ class TestDataWriter:
     def __init__(self, file_path='test_data.csv'):
         self.file_path = file_path
         self.fieldnames = [
-            'seg_id', 'transcrible_time', 'translate_time',
-            'transcribleContent', 'from', 'to', 'translateContent', 'partial'
         ]
         self._ensure_file_has_header()

     def __init__(self, file_path='test_data.csv'):
         self.file_path = file_path
         self.fieldnames = [
+            'seg_id', 'transcribe_time', 'translate_time',
+            'transcribeContent', 'from', 'to', 'translateContent', 'partial'
         ]
         self._ensure_file_has_header()

transcribe/whisper_llm_serve.py CHANGED Viewed

@@ -56,7 +56,6 @@ class WhisperTranscriptionService:
         # 文本分隔符，根据语言设置
         self.text_separator = _get_text_separator(language)
         self.loop = asyncio.get_event_loop()
-        # 发送就绪状态
         #  原始音频队列
         self._frame_queue = queue.Queue()
         #  音频队列缓冲区
@@ -72,7 +71,7 @@ class WhisperTranscriptionService:
         self.frame_processing_thread = _start_thread(self._frame_processing_loop)
         self.row_number = 0
         # for test
-        self._transcrible_time_cost = 0.
         self._translate_time_cost = 0.
         if config.SAVE_DATA_SAVE:
@@ -187,13 +186,13 @@ class WhisperTranscriptionService:
         log_block("Audio buffer length", f"{audio_buffer.shape[0]/self.sample_rate:.2f}", "s")
         start_time = time.perf_counter()
-        result = self._translate_pipe.transcrible(audio_buffer.tobytes(), self.source_language)
         segments = result.segments
         time_diff = (time.perf_counter() - start_time)
-        logger.debug(f"📝 Transcrible Segments: {segments} ")
-        log_block("📝 Transcrible output", f"{self.text_separator.join(seg.text for seg in segments)}", "")
-        log_block("📝 Transcrible time", f"{time_diff:.3f}", "s")
-        self._transcrible_time_cost = round(time_diff, 3)
         return result
     def _translate_text(self, text: str) -> str:

         # 文本分隔符，根据语言设置
         self.text_separator = _get_text_separator(language)
         self.loop = asyncio.get_event_loop()
         #  原始音频队列
         self._frame_queue = queue.Queue()
         #  音频队列缓冲区
         self.frame_processing_thread = _start_thread(self._frame_processing_loop)
         self.row_number = 0
         # for test
+        self._transcribe_time_cost = 0.
         self._translate_time_cost = 0.
         if config.SAVE_DATA_SAVE:
         log_block("Audio buffer length", f"{audio_buffer.shape[0]/self.sample_rate:.2f}", "s")
         start_time = time.perf_counter()
+        result = self._translate_pipe.transcribe(audio_buffer.tobytes(), self.source_language)
         segments = result.segments
         time_diff = (time.perf_counter() - start_time)
+        logger.debug(f"📝 transcribe Segments: {segments} ")
+        log_block("📝 transcribe output", f"{self.text_separator.join(seg.text for seg in segments)}", "")
+        log_block("📝 transcribe time", f"{time_diff:.3f}", "s")
+        self._transcribe_time_cost = round(time_diff, 3)
         return result
     def _translate_text(self, text: str) -> str: