Commit
·
645fa36
1
Parent(s):
24f7854
Add full language name for whisper
Browse files
- backend/audio_to_tgt.py +4 -2
- requirements.txt +2 -1
backend/audio_to_tgt.py
CHANGED
@@ -1,6 +1,7 @@
|
|
1 |
import whisper
|
2 |
import numpy as np
|
3 |
from pydub import AudioSegment
|
|
|
4 |
from deep_translator import GoogleTranslator
|
5 |
|
6 |
def audio_to_numpy(audio_file_input):
|
@@ -16,7 +17,8 @@ def src_audio_to_eng_translator(audio_file_input, model_size = "turbo"):
|
|
16 |
model = whisper.load_model(model_size)
|
17 |
result = model.transcribe(audio_data)
|
18 |
input_text = result["text"]
|
19 |
-
|
|
|
20 |
translated_text = GoogleTranslator(source='auto', target='en').translate(input_text)
|
21 |
-
return input_text, translated_text,
|
22 |
# return result['text']
|
|
|
1 |
import whisper
|
2 |
import numpy as np
|
3 |
from pydub import AudioSegment
|
4 |
+
import langcodes
|
5 |
from deep_translator import GoogleTranslator
|
6 |
|
7 |
def audio_to_numpy(audio_file_input):
|
|
|
17 |
model = whisper.load_model(model_size)
|
18 |
result = model.transcribe(audio_data)
|
19 |
input_text = result["text"]
|
20 |
+
language_code = result["language"]
|
21 |
+
language_name = langcodes.get(language_code).language_name()
|
22 |
translated_text = GoogleTranslator(source='auto', target='en').translate(input_text)
|
23 |
+
return input_text, translated_text, language_name
|
24 |
# return result['text']
|
requirements.txt
CHANGED
@@ -3,4 +3,5 @@ gradio==5.6.0
|
|
3 |
pillow==11.0.0
|
4 |
pytesseract==0.3.13
|
5 |
openai-whisper==20240930
|
6 |
-
pydub==0.25.1
|
|
|
|
3 |
pillow==11.0.0
|
4 |
pytesseract==0.3.13
|
5 |
openai-whisper==20240930
|
6 |
+
pydub==0.25.1
|
7 |
+
langcodes==3.5.0
|