sqlbot / setup.py
edithram23's picture
initial commit
f103f44 verified
raw
history blame contribute delete
885 Bytes
import os
import io
from groq import Groq
import soundfile as sf
from deepgram import DeepgramClient, SpeakOptions
from langchain_groq import ChatGroq
from dotenv import load_dotenv
load_dotenv('.env')
# Text to Speech and Speech to Text
class Speech_Text():
def __init__(self):
self.client = Groq(api_key=os.getenv("GROQ_API_KEY"))
# Function to get transcript from audio
def get_transcript(self,audio):
audio_buffer = io.BytesIO()
sf.write(audio_buffer, audio[1], samplerate=audio[0], format="MP3")
audio_buffer.seek(0)
translation = self.client.audio.transcriptions.create(
file=("audio.mp3", audio_buffer.read()),
model="distil-whisper-large-v3-en",
response_format="json",
temperature=0.0,
)
return translation.text