File size: 1,463 Bytes
914c7b4
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
import os
from dotenv import load_dotenv
import gradio as gr
import requests
import pathlib


load_dotenv()
KEY_ELEVENLABS = os.getenv('ELEVENLABS_KEY')
print(KEY_ELEVENLABS)


def generate_audio(text_input: str, creator: str) -> str:
    CHUNK_SIZE = 1024

    headers = {
        "Accept": "application/json",
        "xi-api-key": KEY_ELEVENLABS
    }

    voice_id = ''

    match creator:
        case 'Roomie':
            voice_id = '2Onew6n5JwT9uEbmTSrO'
        case 'Xavy':
            voice_id = 'cYBsY94mzMC7VpGoVMgr'
        case 'Bella':
            voice_id = 'X9j5sAaRD6aEgBblOUOG'

    url = f"https://api.elevenlabs.io/v1/text-to-speech/{voice_id}/stream"

    payload = {
        "text": text_input,
        "model_id": "eleven_monolingual_v1",
        "voice_settings": {
            "stability": 0.5,
            "similarity_boost": 0.8,
            "style": 0.0,
            "use_speaker_boost": False
        }
    }

    response = requests.post(url, headers=headers, json=payload, stream=True)
    print(response)
    with open('output.wav', 'wb') as f:
        for chunk in response.iter_content(chunk_size=CHUNK_SIZE):
            if chunk:
                f.write(chunk)

    return f'{pathlib.Path().resolve()}\output.mp3'


app = gr.Interface(
    fn=generate_audio,
    inputs=[gr.Textbox(label='Text to Speach'), gr.Dropdown(
        ['Roomie', 'Xavy', 'Bella'], label="Coice your creator")],
    outputs=['audio']
)

app.launch()