File size: 751 Bytes
ddbafc6
 
d4e93ec
ddbafc6
d4e93ec
 
 
 
 
 
 
 
 
 
 
ddbafc6
 
 
 
 
 
 
56a58c1
ddbafc6
 
 
 
 
d4e93ec
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
from transformers import pipeline
import gradio as gr
import torch

def detect_gpu():
    """Abort startup unless a CUDA device is available, then report it.

    Prints the number of visible CUDA devices and the name of device 0.

    Raises:
        SystemExit: With exit status 1 when ``torch.cuda.is_available()``
            is false, so the process reports failure to whatever started it.
    """
    if not torch.cuda.is_available():
        print("No GPU device found")
        # The bare ``exit()`` helper is injected by the ``site`` module (it is
        # missing under ``python -S``) and exits with status 0. Raise
        # SystemExit directly with a non-zero status instead.
        raise SystemExit(1)

    print(f"Found {torch.cuda.device_count()} GPU device(s)")
    print(f"Using {torch.cuda.get_device_name(0)}")
    
# Check for CUDA before loading the model; the pipeline below is pinned to
# device index 0.
detect_gpu()

# Build the speech-recognition pipeline once at startup so every request
# reuses the same loaded model.
MODEL_ID = "pierrelf/whisper-small-sv"
GPU_INDEX = 0
pipe = pipeline(model=MODEL_ID, device=GPU_INDEX)

def transcribe(audio):
    """Transcribe an uploaded or recorded audio clip to text.

    Args:
        audio: Path to the audio file, as supplied by the ``gr.Audio``
            input (``type="filepath"``). Gradio passes ``None`` when the
            form is submitted without a recording or upload.

    Returns:
        The ``"text"`` field of the pipeline result, or an empty string
        when no audio was provided.
    """
    # Submitting with no audio would otherwise hand None to the pipeline
    # and surface an opaque error in the UI.
    if not audio:
        return ""
    return pipe(audio)["text"]

# Audio may come from a file upload or the microphone; the handler receives
# it as a path on disk.
audio_input = gr.Audio(sources=["upload", "microphone"], type="filepath")

# Wire the transcription function into an audio-in, text-out web UI.
iface = gr.Interface(
    fn=transcribe,
    inputs=audio_input,
    outputs="text",
    title="Whisper Swedish",
    description="Realtime demo for Swedish speech recognition using a fine-tuned Whisper small model.",
)

# Bind to all network interfaces rather than only localhost.
iface.launch(server_name="0.0.0.0")