Spaces:

hamzaherry
/

voice-chat

Sleeping

App Files Files Community

hamzaherry committed on Dec 16, 2024

Commit

94dd3ca

verified ·

1 Parent(s): 2514512

Create app.py

Browse files

Files changed (1) hide show

app.py +62 -0

app.py ADDED Viewed

	@@ -0,0 +1,62 @@

+import os
+import whisper
+from groq import Groq
+from gtts import gTTS
+import tempfile
+import IPython.display as ipd
+import gradio as gr
+# Step 1: Set up Whisper for transcription
+model = whisper.load_model("base")
+# Function to transcribe audio using Whisper
+def transcribe_audio(audio_file):
+    result = model.transcribe(audio_file)
+    return result["text"]
+GROOQ_API_KEY = "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"
+Client = Grooq(api_key=GROOQ_API_KEY)
+# Function to get a response from the Groq LLM (Llama 3)
+def get_groq_response(text):
+    chat_completion = client.chat.completions.create(
+        messages=[{"role": "user", "content": text}],
+        model="llama3-8b-8192",  # Use any other model if you prefer
+        stream=False
+    )
+    return chat_completion.choices[0].message.content
+# Step 3: Convert text response from LLM to speech using GTTS
+def text_to_speech(text):
+    tts = gTTS(text)
+    # Save the audio to a temporary file
+    temp_file = tempfile.NamedTemporaryFile(delete=False)
+    tts.save(temp_file.name)
+    # Play the audio in Colab (testing)
+    ipd.Audio(temp_file.name)
+    return temp_file.name  # Return file path for further use
+# Step 4: Integrate everything into a Gradio interface
+def voice_chatbot(audio_input):
+    # Step 1: Transcribe the audio using Whisper
+    transcription = transcribe_audio(audio_input)
+    # Step 2: Get response from Groq API using the transcription
+    response = get_groq_response(transcription)
+    # Step 3: Convert the response text to speech using GTTS
+    audio_response = text_to_speech(response)
+    # Return the audio response (Gradio will play it)
+    return audio_response
+# Step 5: Create the Gradio interface (microphone input and audio output)
+iface = gr.Interface(fn=voice_chatbot,
+                     inputs=gr.Audio(type="filepath"),  # No source="microphone" argument
+                     outputs=gr.Audio(),
+                     live=True)
+# Launch the Gradio interface
+iface.launch()