DuyTa
/

Graduation

Model card Files Files and versions Community

Graduation / whisper_pipeline /infer.py

DuyTa's picture

Upload folder using huggingface_hub

c3b1078 verified about 1 month ago

1.24 kB

	import os
	from pathlib import Path
	from gector import GecBERTModel
	from faster_whisper import WhisperModel, BatchedInferencePipeline
	from transformers.models.whisper.english_normalizer import BasicTextNormalizer
	from text_processing.inverse_normalize import InverseNormalizer
	import time
	# --- Text post-processing helpers -------------------------------------
	# Both are applied to every transcribed segment further down the script:
	# `normalizer` first, then `inverse_normalizer` on its output.
	normalizer = BasicTextNormalizer()
	inverse_normalizer = InverseNormalizer('vi')  # 'vi' is presumably the Vietnamese language code

	# Directory containing this script; the GECToR assets are resolved against it
	# so they are found regardless of the current working directory.
	current_dir = Path(__file__).parent.as_posix()

	# --- Speech recognition -----------------------------------------------
	# NOTE(review): unlike the GECToR paths, "pho_distill_q8" is not anchored to
	# `current_dir` -- confirm it resolves correctly from the directory the
	# script is launched in.
	whisper_model = WhisperModel(
	    "pho_distill_q8",
	    device="auto",
	    compute_type="auto",
	)
	# Batched wrapper around the Whisper model.
	# NOTE(review): `use_vad_model` / `chunk_length` depend on the installed
	# faster-whisper version; chunk_length is presumably in seconds -- confirm.
	batched_model = BatchedInferencePipeline(
	    model=whisper_model,
	    use_vad_model=True,
	    chunk_length=15,
	)

	# --- Grammatical error correction -------------------------------------
	# Vocabulary and model weights are loaded from the `gector/` folder that
	# sits next to this file.
	gector_model = GecBERTModel(
	    vocab_path=os.path.join(current_dir, "gector/vocabulary"),
	    model_paths=[os.path.join(current_dir, "gector/Model_GECTOR")],
	    split_chunk=True,
	)

	# ---- Start transcription ----
	# Times the whole pipeline below: speech recognition, text normalization and
	# grammar correction. perf_counter() is a monotonic clock meant for measuring
	# intervals; time.time() can jump if the system clock is adjusted mid-run.
	start = time.perf_counter()

	# NOTE(review): the input file name is hard-coded and resolved against the
	# current working directory. `info` is returned by transcribe() but is not
	# used anywhere below.
	segments, info = batched_model.transcribe("HA1.wav", language="vi", batch_size=32)

	# Collect the text of every segment.
	# NOTE(review): faster-whisper documents `segments` as a lazy generator, so
	# the actual decoding presumably happens while this list is built -- confirm.
	transcriptions = [segment.text for segment in segments]

	# Per segment: basic text normalization first, then inverse normalization of
	# the normalized string.
	normalized_transcriptions = [
	    inverse_normalizer.inverse_normalize(normalizer(text))
	    for text in transcriptions
	]

	# Run the grammatical error correction model over all segments in one call.
	corrected_texts = gector_model(normalized_transcriptions)

	# str.join accepts the iterable directly; no wrapping generator is needed.
	# NOTE(review): segments are concatenated with no separator -- confirm the
	# corrected texts carry their own spacing, otherwise words at segment
	# boundaries will run together.
	print(''.join(corrected_texts))

	# Elapsed seconds for the whole pipeline above.
	print(time.perf_counter() - start)