DebasishDhal99 committed on
Commit
a8be1b1
·
1 Parent(s): 2d18120

Remove the API dependency for language detection by switching to the langdetect library

Browse files
backend/audio_to_tgt.py CHANGED
@@ -2,6 +2,7 @@ import whisper
2
  import numpy as np
3
  from pydub import AudioSegment
4
  from deep_translator import GoogleTranslator, detection
 
5
  import os
6
 
7
  available_languages = GoogleTranslator().get_supported_languages(as_dict=True)
@@ -24,7 +25,8 @@ def src_audio_to_eng_translator(audio_file_input, model_size = "turbo", target_l
24
  result = model.transcribe(audio_data)
25
  input_text = result["text"]
26
 
27
- src_lang_code = detection.single_detection(input_text, api_key = lang_detect_key)
 
28
  src_lang = formatted_codes.get(src_lang_code, 'Source language not detected')
29
  target_lang_code = formatted_languages.get(target_lang, 'en')
30
  translated_text = GoogleTranslator(source='auto', target=target_lang_code).translate(input_text)
 
2
  import numpy as np
3
  from pydub import AudioSegment
4
  from deep_translator import GoogleTranslator, detection
5
+ from langdetect import detect
6
  import os
7
 
8
  available_languages = GoogleTranslator().get_supported_languages(as_dict=True)
 
25
  result = model.transcribe(audio_data)
26
  input_text = result["text"]
27
 
28
+ # src_lang_code = detection.single_detection(input_text, api_key = lang_detect_key)
29
+ src_lang_code = detect(input_text)
30
  src_lang = formatted_codes.get(src_lang_code, 'Source language not detected')
31
  target_lang_code = formatted_languages.get(target_lang, 'en')
32
  translated_text = GoogleTranslator(source='auto', target=target_lang_code).translate(input_text)
backend/text_to_tgt.py CHANGED
@@ -1,4 +1,5 @@
1
  from deep_translator import GoogleTranslator, detection
 
2
  import os
3
 
4
  available_languages = GoogleTranslator().get_supported_languages(as_dict=True)
@@ -9,7 +10,8 @@ lang_detect_key = os.getenv("detect_language_api_key")
9
 
10
  def src_txt_to_eng_translator(input_text, target_lang = 'English'):
11
  target_lang_code = formatted_languages.get(target_lang, 'en')
12
- src_lang_code = detection.single_detection(input_text, api_key = lang_detect_key)
 
13
  src_lang = formatted_codes.get(src_lang_code, 'Source language not detected')
14
  translated = GoogleTranslator(source='auto', target=target_lang_code).translate(input_text)
15
  return translated, src_lang
 
1
  from deep_translator import GoogleTranslator, detection
2
+ from langdetect import detect
3
  import os
4
 
5
  available_languages = GoogleTranslator().get_supported_languages(as_dict=True)
 
10
 
11
  def src_txt_to_eng_translator(input_text, target_lang = 'English'):
12
  target_lang_code = formatted_languages.get(target_lang, 'en')
13
+ # src_lang_code = detection.single_detection(input_text, api_key = lang_detect_key)
14
+ src_lang_code = detect(input_text)
15
  src_lang = formatted_codes.get(src_lang_code, 'Source language not detected')
16
  translated = GoogleTranslator(source='auto', target=target_lang_code).translate(input_text)
17
  return translated, src_lang
requirements.txt CHANGED
@@ -4,4 +4,5 @@ pillow==11.0.0
4
  pytesseract==0.3.13
5
  openai-whisper==20240930
6
  pydub==0.25.1
7
- langcodes==3.5.0
 
 
4
  pytesseract==0.3.13
5
  openai-whisper==20240930
6
  pydub==0.25.1
7
+ langcodes==3.5.0
8
+ langdetect==1.0.9