Somnath3570 committed
Commit 04cf931 · verified · 1 Parent(s): 3e435ed

Update app.py

Files changed (1): app.py (+30, -48)
app.py CHANGED
@@ -10,13 +10,13 @@ class UltravoxInterface:
         """Initialize with smaller model footprint"""
         print("Initializing voice interface...")
 
-        # Use smaller whisper model instead of full Ultravox
+        # Use smaller whisper model
         self.model_name = "openai/whisper-small"
         self.pipe = transformers.pipeline(
             "automatic-speech-recognition",
             model=self.model_name,
-            torch_dtype=torch.float16,  # Use half precision
-            device=0 if torch.cuda.is_available() else -1
+            torch_dtype=torch.float16,
+            device="cpu"  # Explicitly set to CPU
         )
 
         print("Model loaded successfully!")
@@ -50,51 +50,33 @@ class UltravoxInterface:
     def create_interface(self):
         """Create and configure the Gradio interface"""
 
-        with gr.Blocks(title="Voice Assistant", theme=gr.themes.Soft(
-            primary_hue="orange",
-            secondary_hue="gray",
-        )) as interface:
-            gr.Markdown("# 🎙️ Voice Assistant")
-            gr.Markdown("Speak into the microphone and get text transcription!")
-
-            with gr.Row():
-                with gr.Column():
-                    audio_input = gr.Audio(
-                        label="Speak here",
-                        sources=["microphone"],
-                        type="filepath"
-                    )
-
-                    submit_btn = gr.Button(
-                        "Process Audio",
-                        variant="primary"
-                    )
-
-                with gr.Column():
-                    output_text = gr.Textbox(
-                        label="Transcription",
-                        lines=5,
-                        placeholder="Transcription will appear here..."
-                    )
-
-            submit_btn.click(
-                fn=self.process_audio,
-                inputs=[audio_input],
-                outputs=output_text
-            )
-
-            gr.Markdown("""
-            ## How to use:
-            1. Click the microphone icon and allow browser access
-            2. Speak your message
-            3. Click 'Stop' when finished
-            4. Click 'Process Audio' to get the transcription
-
-            ## Note:
-            Optimized for short audio clips (up to 30 seconds).
-            """)
-
+        interface = gr.Interface(
+            fn=self.process_audio,
+            inputs=[
+                gr.Audio(
+                    label="Speak here",
+                    sources=["microphone"],
+                    type="filepath"
+                )
+            ],
+            outputs=[
+                gr.Textbox(
+                    label="Transcription",
+                    lines=5,
+                    placeholder="Transcription will appear here..."
+                )
+            ],
+            title="Voice Assistant",
+            description="Speak into the microphone and get text transcription!",
+            theme=gr.themes.Soft(primary_hue="orange"),
+            examples=[[None]],
+        )
+
         return interface
 
+# Create the interface
 app = UltravoxInterface()
-interface = app.create_interface()
+interface = app.create_interface()
+
+# Launch the interface - this is crucial for Hugging Face Spaces
+interface.launch()
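
For reference, a minimal sketch of the pipeline setup this commit converges on, runnable outside the Space (the sample filename is a placeholder; everything else mirrors the diff):

import torch
import transformers

# Mirrors the post-commit configuration: whisper-small, half precision, CPU.
pipe = transformers.pipeline(
    "automatic-speech-recognition",
    model="openai/whisper-small",
    torch_dtype=torch.float16,
    device="cpu",
)

# The Gradio component hands the callback a filepath, so the pipeline
# is invoked the same way here.
result = pipe("recording.wav")  # placeholder path, not from the commit
print(result["text"])

One caveat on the design choice: PyTorch's float16 kernel coverage on CPU is limited, so combining torch_dtype=torch.float16 with device="cpu" can raise dtype errors or run slowly for some models; if that happens, torch.float32 is the safer CPU default.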
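
The interface wires its callback to self.process_audio, which this diff does not show. A hypothetical body consistent with the type="filepath" audio input might look like the following (the method name and signature come from the diff; the implementation is an assumption, not the committed code):

    def process_audio(self, audio_path):
        """Transcribe a recorded clip. Hypothetical body, not part of this commit."""
        if audio_path is None:
            return "No audio received. Please record something first."
        # gr.Audio(type="filepath") passes the callback a path to a temporary
        # audio file, which the ASR pipeline accepts directly.
        result = self.pipe(audio_path)
        return result["text"]

As the committed comment notes, the trailing interface.launch() is what actually starts the Gradio server when Hugging Face Spaces runs app.py; constructing the Interface alone does not serve anything.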