Spaces:

frogcho123
/

s2s

Build error

frogcho123 committed on Jun 6, 2023

Commit

b480da2

1 Parent(s): 34bfd6c

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -8,13 +8,14 @@ from tempfile import NamedTemporaryFile
 # Define translation function
 def translate_audio(input_file, target_language):
     # Save uploaded audio file to a temporary file
-    with NamedTemporaryFile(suffix=".mp3") as temp_audio:
         temp_audio.write(input_file.read())
         temp_audio.seek(0)
     # Audio to text (STT)
     model = whisper.load_model("base")
-    audio = whisper.load_audio(temp_audio.name)
     audio = whisper.pad_or_trim(audio)
     mel = whisper.log_mel_spectrogram(audio).to(model.device)
     _, probs = model.detect_language(mel)
@@ -40,15 +41,15 @@ def translate_audio(input_file, target_language):
 # Define Gradio interface
 inputs = [
- gr.File(label="Upload Audio File"),
- gr.Dropdown(choices=['en', 'es', 'fr', 'de', 'ru'], label="Target Language")
 ]
 outputs = [
- gr.File(label="Translated Audio")
 ]
 title = "Audio Translation"
 description = "Upload an audio file, translate the speech to a target language, and download the translated audio."
-gr.Interface(fn=translate_audio, inputs=inputs, outputs=outputs, title=title, description=description).launch()

 # Define translation function
 def translate_audio(input_file, target_language):
     # Save uploaded audio file to a temporary file
+    with NamedTemporaryFile(suffix=".mp3", dir=".", delete=False) as temp_audio:
         temp_audio.write(input_file.read())
         temp_audio.seek(0)
+        temp_audio_path = temp_audio.name
     # Audio to text (STT)
     model = whisper.load_model("base")
+    audio = whisper.load_audio(temp_audio_path)
     audio = whisper.pad_or_trim(audio)
     mel = whisper.log_mel_spectrogram(audio).to(model.device)
     _, probs = model.detect_language(mel)
 # Define Gradio interface
 inputs = [
+ gr.inputs.File(label="Upload Audio File"),
+ gr.inputs.Dropdown(choices=['en', 'es', 'fr', 'de', 'ru'], label="Target Language")
 ]
 outputs = [
+ gr.outputs.File(label="Translated Audio")
 ]
 title = "Audio Translation"
 description = "Upload an audio file, translate the speech to a target language, and download the translated audio."
+gr.Interface(fn=translate_audio, inputs=inputs, outputs=outputs, title=title, description=description).launch()