Spaces:

Somnath3570
/

Voice_Assistant

Runtime error

App Files Community

Somnath3570 committed on Feb 17

Commit

c336d2f

verified ·

1 Parent(s): b3ce7b4

Create app.py

Browse files

Files changed (1) hide show

app.py +116 -0

app.py ADDED Viewed

	@@ -0,0 +1,116 @@

+# app.py
+import gradio as gr
+import torch
+import transformers
+import librosa
+import numpy as np
+import os
+class UltravoxInterface:
+    def __init__(self):
+        """Initialize the Ultravox model and settings"""
+        print("Loading Ultravox model... This may take a few minutes...")
+        self.pipe = transformers.pipeline(
+            model='fixie-ai/ultravox-v0_4',
+            trust_remote_code=True,
+            device=0 if torch.cuda.is_available() else -1
+        )
+        print("Model loaded successfully!")
+        # Default system prompt
+        self.default_prompt = "You are a friendly and helpful character. You love to answer questions for people."
+    def process_audio(self, audio_path, custom_prompt=None):
+        """Process audio input and return model response"""
+        try:
+            # Load and preprocess audio
+            audio, sr = librosa.load(audio_path, sr=16000)
+            # Prepare conversation turns
+            turns = [
+                {
+                    "role": "system",
+                    "content": custom_prompt if custom_prompt else self.default_prompt
+                }
+            ]
+            # Get model response
+            result = self.pipe(
+                {
+                    'audio': audio,
+                    'turns': turns,
+                    'sampling_rate': sr
+                },
+                max_new_tokens=30
+            )
+            # Handle different response formats
+            if isinstance(result, str):
+                return result
+            elif isinstance(result, list):
+                return result[0] if result else "No response generated"
+            elif isinstance(result, dict):
+                return result.get('generated_text', "No response generated")
+            else:
+                return str(result)
+        except Exception as e:
+            return f"Error processing audio: {str(e)}"
+    def create_interface(self):
+        """Create and configure the Gradio interface"""
+        with gr.Blocks(title="Ultravox Voice Assistant", theme=gr.themes.Soft(
+            primary_hue="orange",
+            secondary_hue="gray",
+        )) as interface:
+            gr.Markdown("# 🎙️ Ultravox Voice Assistant")
+            gr.Markdown("Speak into the microphone and get AI-generated responses!")
+            with gr.Row():
+                with gr.Column():
+                    audio_input = gr.Audio(
+                        label="Speak here",
+                        sources=["microphone"],
+                        type="filepath"
+                    )
+                    system_prompt = gr.Textbox(
+                        label="System Prompt (Optional)",
+                        placeholder="Enter custom system prompt or leave empty for default",
+                        value=self.default_prompt
+                    )
+                    submit_btn = gr.Button(
+                        "Process Audio",
+                        variant="primary"
+                    )
+                with gr.Column():
+                    output_text = gr.Textbox(
+                        label="AI Response",
+                        lines=5,
+                        placeholder="AI response will appear here..."
+                    )
+            submit_btn.click(
+                fn=self.process_audio,
+                inputs=[audio_input, system_prompt],
+                outputs=output_text
+            )
+            gr.Markdown("""
+            ## How to use:
+            1. Click the microphone icon and allow browser access
+            2. Speak your question or prompt
+            3. Click 'Stop' when finished
+            4. Click 'Process Audio' to get the AI response
+            ## Note:
+            First-time loading may take a few minutes as the model is downloaded.
+            """)
+        return interface
+# Module-level setup: constructing UltravoxInterface loads the model pipeline,
+# then create_interface() assembles the Gradio Blocks UI.
+# NOTE(review): no launch() call is visible in this view — confirm that
+# `interface` is launched further down the file.
+app = UltravoxInterface()
+interface = app.create_interface()