Spaces:

hprasath
/

image-processing

Sleeping

App Files Community

hprasath committed on Apr 8, 2024

Commit

8756640

verified ·

1 Parent(s): dc2d233

Update app.py

Browse files

Files changed (1) hide show

app.py +23 -16

app.py CHANGED Viewed

@@ -49,7 +49,7 @@ def get_face_locations(binary_data):
     print(3)
     return face_locations
-def seperate_image_text_from_pdf(pdf_url):
     # List to store page information
     pages_info = []
@@ -57,13 +57,18 @@ def seperate_image_text_from_pdf(pdf_url):
     response = requests.get(pdf_url)
     if response.status_code == 200:
-        # Create a temporary file to save the PDF data
-        with tempfile.NamedTemporaryFile(delete=False) as tmp_file:
             tmp_file.write(response.content)
-            tmp_file_path = tmp_file.name
         # Open the PDF
-        pdf = fitz.open(tmp_file_path)
         # Iterate through each page
         for page_num in range(len(pdf)):
@@ -96,9 +101,9 @@ def seperate_image_text_from_pdf(pdf_url):
         # Close the PDF
         pdf.close()
-        # Clean up the temporary file
-        import os
-        os.unlink(tmp_file_path)
     else:
         print("Failed to fetch the PDF from the URL.")
@@ -148,16 +153,18 @@ def separate_audio_from_video(video_url):
         # Extract audio
         audio = video.audio
-        # Create a temporary file to write the audio data
-        with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as temp_audio_file:
-            temp_audio_filename = temp_audio_file.name
-            # Write the audio data to the temporary file
-            audio.write_audiofile(temp_audio_filename)
-            # Read the audio data from the temporary file as bytes
-            with open(temp_audio_filename, "rb") as f:
-                audio_bytes = f.read()
         return audio_bytes

     print(3)
     return face_locations
+def separate_image_text_from_pdf(pdf_url):
     # List to store page information
     pages_info = []
     response = requests.get(pdf_url)
     if response.status_code == 200:
+        # Create a temporary directory to store the PDF data
+        temp_dir = tempfile.mkdtemp()
+        # Define the temporary file path for the PDF
+        temp_pdf_path = os.path.join(temp_dir, "temp.pdf")
+        # Write the PDF data to the temporary file
+        with open(temp_pdf_path, "wb") as tmp_file:
             tmp_file.write(response.content)
         # Open the PDF
+        pdf = fitz.open(temp_pdf_path)
         # Iterate through each page
         for page_num in range(len(pdf)):
         # Close the PDF
         pdf.close()
+        # Clean up the temporary files
+        os.unlink(temp_pdf_path)
+        os.rmdir(temp_dir)
     else:
         print("Failed to fetch the PDF from the URL.")
         # Extract audio
         audio = video.audio
+        # Create a temporary directory to store temporary files
+        temp_dir = tempfile.mkdtemp()
+        # Define the temporary file path for the audio
+        temp_audio_filename = os.path.join(temp_dir, "audio.wav")
+        # Write the audio data to the temporary file
+        audio.write_audiofile(temp_audio_filename)
+        # Read the audio data from the temporary file as bytes
+        with open(temp_audio_filename, "rb") as f:
+            audio_bytes = f.read()
         return audio_bytes