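# NOTE(review): the six lines below look like repository web-viewer residue
# (author / commit message / commit hash / viewer links / file size), not code:
#   sachin
#   add-user
#   38a081b
#   raw
#   history blame
#   2.03 kB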
import gradio as gr
import requests
def text_to_speech(text):
    """Send *text* to the speech endpoint and return the path of the MP3 result.

    The API base URL is read from the ``DWANI_AI_API_BASE_URL`` environment
    variable. The request is a POST to ``/v1/audio/speech`` with the text and
    ``response_format=mp3`` passed as query parameters and an empty body.

    Args:
        text: Plain text to convert to speech.

    Returns:
        Path of a newly created temporary ``.mp3`` file containing the
        response body.

    Raises:
        ValueError: If ``DWANI_AI_API_BASE_URL`` is not set or is empty.
        gr.Error: If the HTTP request fails (connection problem, timeout, or
            a non-2xx status), so the UI shows the message instead of trying
            to load an error string as an audio file path.
    """
    # Function-scope imports, as in the original, so the block stays
    # self-contained regardless of the file's top-level imports.
    import os
    import tempfile

    # Get the base URL (IP or domain) from the environment.
    base_url = os.getenv("DWANI_AI_API_BASE_URL")
    if not base_url:
        raise ValueError("DWANI_AI_API_BASE_URL environment variable is not set")

    url = f"{base_url.rstrip('/')}/v1/audio/speech"
    # Let requests build the query string: interpolating the raw text into
    # the URL breaks as soon as the input contains '&', '#', '+' or '%'.
    params = {"input": text, "response_format": "mp3"}
    headers = {"accept": "application/json"}

    try:
        response = requests.post(
            url,
            params=params,
            headers=headers,
            data="",
            # (connect, read) seconds; without a timeout a stalled server
            # would block this worker indefinitely.
            timeout=(10, 120),
        )
        response.raise_for_status()
    except requests.exceptions.RequestException as e:
        raise gr.Error(f"Error: {e}") from e

    # A unique file per call, so concurrent requests cannot overwrite each
    # other's audio. delete=False because the caller reads the file after
    # this function returns; the file is therefore not removed here.
    with tempfile.NamedTemporaryFile(suffix=".mp3", delete=False) as f:
        f.write(response.content)
    return f.name
# Build the Gradio UI: a two-column row with the text input and trigger
# button on one side and the audio player on the other.
with gr.Blocks(title="Text to Speech API Interface") as demo:
    gr.Markdown("# Text to Speech API Interface")

    with gr.Row():
        # Input side: text box pre-filled with a sample sentence, plus the
        # button that starts the conversion.
        with gr.Column():
            text_input = gr.Textbox(
                value="ಕರ್ನಾಟಕದ ರಾಜಧಾನಿ ಬೆಂಗಳೂರು.",  # sample text (noted in the original as taken from a curl example)
                placeholder="Enter text to convert to speech",
                label="Text",
            )
            submit_btn = gr.Button("Generate Speech")

        # Output side: read-only player fed with the file path returned by
        # the handler.
        with gr.Column():
            audio_output = gr.Audio(type="filepath", label="Generated Speech", interactive=False)

    # Clicking the button passes the textbox value to text_to_speech and
    # routes its return value to the audio player.
    submit_btn.click(text_to_speech, inputs=[text_input], outputs=audio_output)

# Start serving the interface.
demo.launch()