WhisperX-V2 / app.py
StevenChen16's picture
Update app.py
8392829 verified
raw
history blame
724 Bytes
import torch
import whisperx
# 检测设备类型
device = "cuda" if torch.cuda.is_available() else "cpu"
# 设置计算类型
compute_type = "float16" if device == "cuda" else "int8"
# 加载 WhisperX 模型
model = whisperx.load_model("large-v3", device=device, compute_type=compute_type)
def transcribe(audio_path):
# 使用WhisperX进行转录
result = model.transcribe(audio_path)
return result['text']
# 创建Gradio接口
iface = gr.Interface(
fn=transcribe,
inputs=gr.Audio(source="upload", type="filepath"),
outputs="text",
title="WhisperX 语音转文字",
description="上传音频文件,使用WhisperX模型进行转录。"
)
if __name__ == "__main__":
iface.launch()