Spaces:

udayl
/

NotebookLM-Kokoro_TTS_App

Running

App Files Files Community

udayl committed 21 days ago

Commit

cea6d8c

1 Parent(s): 61caafb

fix: using /tmp instead of /app

Browse files

Files changed (1) hide show

gradio_app.py +19 -37

gradio_app.py CHANGED Viewed

@@ -89,70 +89,52 @@ def generate_audio_from_script_with_voices(script, speaker1_voice, speaker2_voic
 def process_pdf(pdf_file, speaker1_voice, speaker2_voice, provider, api_key, openrouter_base=None):
     """Process the uploaded PDF file and generate audio"""
     try:
         # Set API configuration based on provider
         if provider == "openai":
-            os.environ["OPENAI_API_KEY"] = api_key
             os.environ["OPENROUTER_API_BASE"] = "https://api.openai.com/v1"
         else:
-            os.environ["OPENAI_API_KEY"] = api_key
             os.environ["OPENROUTER_API_BASE"] = openrouter_base or "https://openrouter.ai/api/v1"
-        # Check if we received a valid file
         if pdf_file is None:
             return "No file uploaded", None
-        # Create a temporary file with .pdf extension
-        with tempfile.NamedTemporaryFile(delete=False, suffix=".pdf") as tmp:
-            # For Gradio uploads, we need to copy the file
-            shutil.copy2(pdf_file.name, tmp.name)
-            tmp_path = tmp.name
-        print(f"Uploaded PDF saved at {tmp_path}")
-        # Generate transcript using your existing function
         transcript, transcript_path = generate_podcast_script(tmp_path, provider=provider)
         if transcript is None:
             return "Error generating transcript", None
-        # Define an output file path for the generated audio
         audio_output_path = os.path.join(
-            os.path.dirname(tmp_path),
-            f"audio_{os.path.basename(tmp_path).replace('.pdf', '.wav')}"
         )
-        # result = generate_audio_from_script_with_voices(
-        #     transcript,
-        #     speaker1_voice,
-        #     speaker2_voice,
-        #     output_file=audio_output_path
-        # )
-        # Use ProcessPoolExecutor with explicit number of workers
         with concurrent.futures.ProcessPoolExecutor(max_workers=NUM_WORKERS) as executor:
-            print(f"Processing with {NUM_WORKERS} CPU cores")
-            # Submit audio generation task to the executor
             future = executor.submit(
                 generate_audio_from_script_with_voices,
                 transcript, speaker1_voice, speaker2_voice, audio_output_path
             )
             result = future.result()
-            if result is None:
-                return "Error generating audio", None
-            return "Process complete!", result
-    except Exception as e:
-        print(f"Error in process_pdf: {str(e)}")
-        return f"Error processing file: {str(e)}", None
         if result is None:
             return "Error generating audio", None
         return "Process complete!", result
     except Exception as e:
-        print(f"Error in process_pdf: {str(e)}")
         return f"Error processing file: {str(e)}", None

 def process_pdf(pdf_file, speaker1_voice, speaker2_voice, provider, api_key, openrouter_base=None):
     """Process the uploaded PDF file and generate audio"""
     try:
         # Set API configuration based on provider
+        os.environ["OPENAI_API_KEY"] = api_key
         if provider == "openai":
             os.environ["OPENROUTER_API_BASE"] = "https://api.openai.com/v1"
         else:
             os.environ["OPENROUTER_API_BASE"] = openrouter_base or "https://openrouter.ai/api/v1"
         if pdf_file is None:
             return "No file uploaded", None
+        # Use /tmp or current directory for temp file creation
+        base_dir = "/tmp" if os.path.exists("/tmp") else os.getcwd()
+        # Create a temp copy of the uploaded PDF
+        pdf_filename = os.path.basename(pdf_file.name)
+        tmp_path = os.path.join(base_dir, f"uploaded_{pdf_filename}")
+        shutil.copy2(pdf_file.name, tmp_path)
+        print(f"[INFO] Uploaded PDF saved at {tmp_path}")
+        # Generate the podcast script
         transcript, transcript_path = generate_podcast_script(tmp_path, provider=provider)
         if transcript is None:
             return "Error generating transcript", None
+        # Define audio output path in the same temp dir
         audio_output_path = os.path.join(
+            base_dir,
+            f"audio_{os.path.splitext(pdf_filename)[0]}.wav"
         )
+        # Process audio generation using parallel CPU workers
         with concurrent.futures.ProcessPoolExecutor(max_workers=NUM_WORKERS) as executor:
+            print(f"[INFO] Processing with {NUM_WORKERS} CPU cores")
             future = executor.submit(
                 generate_audio_from_script_with_voices,
                 transcript, speaker1_voice, speaker2_voice, audio_output_path
             )
             result = future.result()
         if result is None:
             return "Error generating audio", None
         return "Process complete!", result
     except Exception as e:
+        print(f"[ERROR] process_pdf failed: {str(e)}")
         return f"Error processing file: {str(e)}", None