Spaces:

Nasma
/

voicecloneapi

Sleeping

App Files Community

Nasma committed on Jan 15

Commit

fb89804

verified ·

1 Parent(s): d26a5fd

Update main.py

Browse files

Files changed (1) hide show

main.py +25 -25

main.py CHANGED Viewed

@@ -1,5 +1,6 @@
 from fastapi import FastAPI, Query, HTTPException
 from fastapi.responses import StreamingResponse
 from TTS.api import TTS
 import os
 from io import BytesIO
@@ -27,32 +28,31 @@ def split_text(text: str, words_per_chunk: int = 20):
 @app.post("/generate-audio/")
 async def generate_audio(
     text: str = Query(..., description="The input text to convert to speech."),
-    language: str = Query("en", description="Language code for TTS (e.g., 'en' for English).")
-):
-    if not os.path.exists(FIXED_SPEAKER_WAV):
-        raise HTTPException(status_code=400, detail="Fixed speaker WAV file not found.")
-    # StreamingResponse to stream audio chunks
-    def audio_stream():
-            if tts.is_multi_lingual and not language:
-                raise ValueError("Language must be specified for multi-lingual models.")
-            text_chunks = split_text(text, 20)
-            for idx, chunk in enumerate(text_chunks):
-                # Generate audio for each chunk and yield as bytes
-                output_file = f"out_{idx}.wav"
-                tts.tts_to_file(
-                    text=chunk,
                     file_path=output_file,
                     speaker_wav=FIXED_SPEAKER_WAV,
                     language=language
-                )
-                print(output_file)
-                # Read the file content and yield as binary
-                with open(output_file, "rb") as audio_file:
-                    yield audio_file.read()
-                # Optionally delete the file after streaming
-                os.remove(output_file)
-    return StreamingResponse(audio_stream(), media_type="audio/wav")

 from fastapi import FastAPI, Query, HTTPException
 from fastapi.responses import StreamingResponse
+from fastapi.responses import FileResponse
 from TTS.api import TTS
 import os
 from io import BytesIO
 @app.post("/generate-audio/")
 async def generate_audio(
     text: str = Query(..., description="The input text to convert to speech."),
+    language: str = Query("en", description="Language code for TTS (e.g., 'en' for English).")):
+        if not os.path.exists(FIXED_SPEAKER_WAV):
+            raise HTTPException(status_code=400, detail="Fixed speaker WAV file not found.")
+        if tts.is_multi_lingual and not language:
+            raise ValueError("Language must be specified for multi-lingual models.")
+            # Generate audio for each chunk and yield as bytes
+        output_file = f"out.wav"
+        try:
+            tts.tts_to_file(
+                    text=text,
                     file_path=output_file,
                     speaker_wav=FIXED_SPEAKER_WAV,
                     language=language
+            )
+            print(output_file)
+            # Return the generated audio file as a response
+            return FileResponse(output_file, media_type="audio/wav")
+        except Exception as e:
+            raise HTTPException(status_code=500, detail=f"Error generating audio: {str(e)}")
+        # finally:
+        #     # Clean up the generated file after the response is sent
+        #     if os.path.exists(output_file):
+        #         os.remove(output_file)