Spaces:

pratham0011
/

ConversAI_AI-Voice-Chat-Assistant

Sleeping

App Files Files Community

pratham0011 committed on Jan 11

Commit

ffe3553

verified ·

1 Parent(s): 2995035

Delete whisper.py

Browse files

Files changed (1) hide show

whisper.py +0 -68

whisper.py DELETED Viewed

@@ -1,68 +0,0 @@
-import os
-import tempfile
-import logging
-import requests
-from typing import Optional
-import edge_tts
-from config.config import VOICE, FALLBACK_VOICES, token
-# Module-level logger named after this module.
-logger = logging.getLogger(__name__)
-# Hugging Face Inference API endpoint for the openai/whisper-tiny model,
-# used for speech-to-text.
-API_URL = "https://api-inference.huggingface.co/models/openai/whisper-tiny"
-# Bearer-token authorization header built from `token` (imported from
-# config.config); sent with the transcription request.
-headers = {"Authorization": f"Bearer {token}"}
-# Voice selection handling
-async def get_valid_voice() -> str:
-    available_voices = await edge_tts.list_voices()
-    voice_names = [VOICE] + FALLBACK_VOICES
-    available_voice_names = {v["ShortName"] for v in available_voices}
-    for voice in voice_names:
-        if voice in available_voice_names:
-            return voice
-    raise RuntimeError("No valid voice found")
-# Text-to-speech conversion using Edge TTS
-async def generate_speech(text: str) -> Optional[str]:
-    if not text or not isinstance(text, str):
-        raise ValueError("Invalid text input")
-    voice = await get_valid_voice()
-    logger.info(f"Using voice: {voice}")
-    with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as tmp_file:
-        tmp_path = tmp_file.name
-    communicate = edge_tts.Communicate(text, voice)
-    await communicate.save(tmp_path)
-    if not os.path.exists(tmp_path) or os.path.getsize(tmp_path) == 0:
-        raise RuntimeError("Speech file empty or not created")
-    logger.info(f"Speech generated successfully: {tmp_path}")
-    return tmp_path
-# Speech-to-text using Whisper
-async def transcribe(audio_file: str) -> str:
-    try:
-        with open(audio_file, "rb") as f:
-            data = f.read()
-        response = requests.post(API_URL, headers=headers, data=data)
-        result = response.json()
-        if "text" in result:
-            transcription = result["text"].strip()
-            logger.info(f"Transcribed text: {transcription}")
-            return transcription
-        else:
-            raise ValueError("No transcription in response")
-    except Exception as e:
-        logger.error(f"Transcription error: {str(e)}")
-        raise RuntimeError(f"Failed to transcribe audio: {str(e)}")