Spaces:

prasanth345
/

voicechatin

Sleeping

App Files Files Community

prasanth345 commited on Jan 7

Commit

39ef4ac

verified ·

1 Parent(s): 5eea1c8

Upload 2 files

Browse files

Files changed (2) hide show

app.py +52 -0
requirements.txt +5 -0

app.py ADDED Viewed

	@@ -0,0 +1,52 @@

+# Import libraries
+import whisper
+import os
+from gtts import gTTS
+import gradio as gr
+from groq import Groq
+# Load Whisper model for transcription
+model = whisper.load_model("base")
+Groq_api_key = "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"
+client = Groq(api_key=Groq_api_key)
+# Function to get the LLM response from Groq
+def get_llm_response(user_input):
+    chat_completion = client.chat.completions.create(
+        messages=[{"role": "user", "content": user_input}],
+        model="llama3-8b-8192",  # Replace with your desired model
+    )
+    return chat_completion.choices[0].message.content
+# Function to convert text to speech using gTTS
+def text_to_speech(text, output_audio="output_audio.mp3"):
+    tts = gTTS(text)
+    tts.save(output_audio)
+    return output_audio
+# Main chatbot function to handle audio input and output
+def chatbot(audio):
+    # Step 1: Transcribe the audio using Whisper
+    result = model.transcribe(audio)
+    user_text = result["text"]
+    # Step 2: Get LLM response from Groq
+    response_text = get_llm_response(user_text)
+    # Step 3: Convert the response text to speech
+    output_audio = text_to_speech(response_text)
+    return response_text, output_audio
+# Gradio interface for real-time interaction
+iface = gr.Interface(
+    fn=chatbot,
+    inputs=gr.Audio(type="filepath"),  # Input from mic or file
+    outputs=[gr.Textbox(), gr.Audio(type="filepath")],  # Output: response text and audio
+    live=True
+)
+# Launch the Gradio app
+iface.launch()

requirements.txt ADDED Viewed

	@@ -0,0 +1,5 @@

+openai-whisper
+groq
+gtts
+gradio
+pydub