Spaces:

GoodML
/

dishDecode

Running

App Files Community

GoodML committed on Dec 10, 2024

Commit

482cb98

verified ·

1 Parent(s): 0db5687

removed the wav converter

Browse files

Files changed (1) hide show

app.py +17 -38

app.py CHANGED Viewed

@@ -88,27 +88,16 @@ def health_check():
 #             os.remove(temp_audio_path)
 #             print(f"Temporary WAV file deleted: {temp_audio_path}")
-def download_video(url, temp_video_path):
-    """Download video from the given URL and save it to temp_video_path."""
     response = requests.get(url, stream=True)
     if response.status_code == 200:
-        with open(temp_video_path, 'wb') as f:
             for chunk in response.iter_content(chunk_size=1024):
                 f.write(chunk)
-        print(f"Video downloaded successfully to {temp_video_path}")
     else:
-        raise Exception(f"Failed to download video, status code: {response.status_code}")
-def convert_to_wav(video_path, wav_path):
-    """Convert video file to WAV format using FFmpeg."""
-    try:
-        ffmpeg_command = [
-            "ffmpeg", "-i", video_path, "-q:a", "0", "-map", "a", wav_path
-        ]
-        subprocess.run(ffmpeg_command, check=True)
-        print(f"Video converted to WAV successfully: {wav_path}")
-    except subprocess.CalledProcessError as e:
-        raise Exception(f"FFmpeg conversion failed: {e}")
 @app.route('/process-audio', methods=['POST'])
 def process_audio():
@@ -116,26 +105,21 @@ def process_audio():
         return jsonify({"error": "No audio URL provided"}), 400
     audio_url = request.json['audioUrl']
-    temp_video_path = None
-    temp_wav_path = None
     try:
-        # Step 1: Download the video file from the Cloudinary URL
-        with tempfile.NamedTemporaryFile(delete=False, suffix=".mp4") as temp_video_file:
-            temp_video_path = temp_video_file.name
-            download_video(audio_url, temp_video_path)
-        # Step 2: Convert the downloaded video to WAV format
-        temp_wav_path = temp_video_path.replace(".mp4", ".wav")
-        convert_to_wav(temp_video_path, temp_wav_path)
-        # Step 3: Transcribe the audio file synchronously
-        transcription = transcribe_audio(temp_wav_path)
         if not transcription:
             return jsonify({"error": "Audio transcription failed"}), 500
-        # Step 4: Generate structured recipe information using Gemini API synchronously
         structured_data = query_gemini_api(transcription)
         return jsonify(structured_data)
@@ -144,15 +128,10 @@ def process_audio():
         return jsonify({"error": str(e)}), 500
     finally:
-        # Clean up temporary files
-        if temp_video_path and os.path.exists(temp_video_path):
-            os.remove(temp_video_path)
-            print(f"Temporary video file deleted: {temp_video_path}")
-        if temp_wav_path and os.path.exists(temp_wav_path):
-            os.remove(temp_wav_path)
-            print(f"Temporary WAV file deleted: {temp_wav_path}")

 #             os.remove(temp_audio_path)
 #             print(f"Temporary WAV file deleted: {temp_audio_path}")
+def download_audio(url, temp_audio_path):
+    """Download audio (WAV format) from the given URL and save it to temp_audio_path."""
     response = requests.get(url, stream=True)
     if response.status_code == 200:
+        with open(temp_audio_path, 'wb') as f:
             for chunk in response.iter_content(chunk_size=1024):
                 f.write(chunk)
+        print(f"Audio downloaded successfully to {temp_audio_path}")
     else:
+        raise Exception(f"Failed to download audio, status code: {response.status_code}")
 @app.route('/process-audio', methods=['POST'])
 def process_audio():
         return jsonify({"error": "No audio URL provided"}), 400
     audio_url = request.json['audioUrl']
+    temp_audio_path = None
     try:
+        # Step 1: Download the WAV file from the provided URL
+        with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as temp_audio_file:
+            temp_audio_path = temp_audio_file.name
+            download_audio(audio_url, temp_audio_path)
+        # Step 2: Transcribe the downloaded WAV file synchronously
+        transcription = transcribe_audio(temp_audio_path)
         if not transcription:
             return jsonify({"error": "Audio transcription failed"}), 500
+        # Step 3: Generate structured recipe information using Gemini API synchronously
         structured_data = query_gemini_api(transcription)
         return jsonify(structured_data)
         return jsonify({"error": str(e)}), 500
     finally:
+        # Clean up temporary audio file
+        if temp_audio_path and os.path.exists(temp_audio_path):
+            os.remove(temp_audio_path)
+            print(f"Temporary audio file deleted: {temp_audio_path}")