frogcho123 committed on
Commit
c13c4df
·
1 Parent(s): 45b71c9

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -1
app.py CHANGED
@@ -9,9 +9,13 @@ import numpy as np
9
 
10
  def translate_speech_to_speech(input_audio):
11
 
 
 
 
 
12
  # Save the input audio to a temporary file
13
  input_file = "input_audio.wav"
14
- sf.write(input_file, input_audio, 44100)
15
 
16
  # Language detection and translation code from the first code snippet
17
  model = whisper.load_model("base")
 
9
 
10
  def translate_speech_to_speech(input_audio):
11
 
12
+ # Convert stereo to mono and convert float to int16
13
+ mono_audio = np.mean(input_audio, axis=1)
14
+ int_audio = np.int16(mono_audio * 32767)
15
+
16
  # Save the input audio to a temporary file
17
  input_file = "input_audio.wav"
18
+ sf.write(input_file, int_audio, 16000)
19
 
20
  # Language detection and translation code from the first code snippet
21
  model = whisper.load_model("base")