Spaces:
Sleeping
Sleeping
from llmlib.whisper import Whisper | |
import pytest | |
from tests.helpers import is_ci, file_for_test | |
def model() -> Whisper: | |
return Whisper() | |
def test_transcription(model: Whisper): | |
audio_file = str(file_for_test(name="some-audio.flac")) # Librispeech sample 2 | |
expected_transcription = "before he had time to answer a much encumbered vera burst into the room with the question i say can i leave these here these were a small black pig and a lusty specimen of black-red game-cock" | |
actual_transcription: str = model.transcribe_file(audio_file) | |
assert actual_transcription == expected_transcription | |
def test_video_transcription(model: Whisper): | |
video_file = str(file_for_test("video.mp4")) | |
expected_fragment = ( | |
"Die Unionsparteien oder deren Politiker sind heute wichtige Offiziere" | |
) | |
transcription = model.transcribe_file(video_file) | |
assert expected_fragment in transcription | |
def test_translation(model: Whisper): | |
german_video = str(file_for_test("video.mp4")) | |
translation: str = model.transcribe_file(german_video, translate=True) | |
assert "The parties and their politicians" in translation | |
def test_long_video_transcription(model: Whisper): | |
video_file = str(file_for_test("long-video.mp4")) | |
transcription: str = model.transcribe_file(video_file) | |
assert isinstance(transcription, str) | |