Spaces:

tomasruiz
/

multimodal-vibe-check

Sleeping

App Files Files Community

multimodal-vibe-check / tests /test_whisper.py

tomasruiz

Include code of llmapp from Github

41d24d2 7 months ago

raw

history blame contribute delete

1.64 kB

	from llmlib.whisper import Whisper
	import pytest
	from tests.helpers import is_ci, file_for_test


	@pytest.fixture(scope="module")
	def model() -> Whisper:
	return Whisper()


	@pytest.mark.skipif(condition=is_ci(), reason="No GPU in CI")
	def test_transcription(model: Whisper):
	audio_file = str(file_for_test(name="some-audio.flac")) # Librispeech sample 2
	expected_transcription = "before he had time to answer a much encumbered vera burst into the room with the question i say can i leave these here these were a small black pig and a lusty specimen of black-red game-cock"
	actual_transcription: str = model.transcribe_file(audio_file)
	assert actual_transcription == expected_transcription


	@pytest.mark.skipif(condition=is_ci(), reason="No GPU in CI")
	def test_video_transcription(model: Whisper):
	video_file = str(file_for_test("video.mp4"))
	expected_fragment = (
	"Die Unionsparteien oder deren Politiker sind heute wichtige Offiziere"
	)
	transcription = model.transcribe_file(video_file)
	assert expected_fragment in transcription


	@pytest.mark.skipif(condition=is_ci(), reason="No GPU in CI")
	def test_translation(model: Whisper):
	german_video = str(file_for_test("video.mp4"))
	translation: str = model.transcribe_file(german_video, translate=True)
	assert "The parties and their politicians" in translation


	@pytest.mark.skipif(condition=is_ci(), reason="No GPU in CI")
	def test_long_video_transcription(model: Whisper):
	video_file = str(file_for_test("long-video.mp4"))
	transcription: str = model.transcribe_file(video_file)
	assert isinstance(transcription, str)