DEBO-V1 / vocal_app.py
Unggi's picture
change whisper model to whisper api
c688a3b
raw
history blame
731 Bytes
import whisper
import gradio as gr
from dotenv import dotenv_values
import openai
import os
"""
apt-get update
apt-get install ffmpeg
"""
config = dotenv_values(".env")
openai.organization = config.get('OPENAI_ORGANIZATION')
openai.api_key = config.get('OPENAI_API_KEY')
def transcribe(audio):
os.rename(audio, audio + '.wav')
file = open(audio + '.wav', "rb")
result = openai.Audio.transcribe("whisper-1", file).text
return result
gr.Interface(
title = 'Whisper Audio to Text with Speaker Recognition',
fn=transcribe,
inputs=[
gr.inputs.Audio(source="microphone", type="filepath"),
#gr.inputs.Number(default=2, label="Number of Speakers")
],
outputs="text"
).launch()