frogcho123 committed on
Commit
ae8d075
·
1 Parent(s): fa154e4

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -0
app.py CHANGED
@@ -12,6 +12,8 @@ tokenizer = AutoTokenizer.from_pretrained("alirezamsh/small100")
12
  model = AutoModelForSeq2SeqLM.from_pretrained("alirezamsh/small100")
13
 
14
  def translate_speech(audio, target_lang):
 
 
15
  audio = audio.astype("float32") # Convert audio to float32
16
  audio = whisper.pad_or_trim(audio, whisper_model.audio_config.sample_rate)
17
  mel = whisper.log_mel_spectrogram(audio).to(whisper_model.device)
@@ -34,6 +36,7 @@ def translate_speech(audio, target_lang):
34
  return audio_path
35
 
36
 
 
37
  def translate_speech_interface(audio, target_lang):
38
  translated_audio = translate_speech(audio, target_lang)
39
  translated_audio_bytes = open(translated_audio, "rb").read()
 
12
  model = AutoModelForSeq2SeqLM.from_pretrained("alirezamsh/small100")
13
 
14
  def translate_speech(audio, target_lang):
15
+ if isinstance(audio, tuple):
16
+ audio = audio[0]
17
  audio = audio.astype("float32") # Convert audio to float32
18
  audio = whisper.pad_or_trim(audio, whisper_model.audio_config.sample_rate)
19
  mel = whisper.log_mel_spectrogram(audio).to(whisper_model.device)
 
36
  return audio_path
37
 
38
 
39
+
40
  def translate_speech_interface(audio, target_lang):
41
  translated_audio = translate_speech(audio, target_lang)
42
  translated_audio_bytes = open(translated_audio, "rb").read()