Spaces:
Runtime error
Runtime error
File size: 1,690 Bytes
b9354c2 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 |
import glob
from typing import Any, Optional
import whisper, os
from interpreter import Interpreter
from utils import SEGMENTS_INFO, AUDIO_FILES, json_dump
class WhisperInterpreter(Interpreter):
def __init__(self, model_size: str) -> None:
self.model = whisper.load_model(model_size)
def transcribe(self, file_path: str, **kwargs: Optional[Any]) -> dict:
return self._execute_task("transcribe", file_path, **kwargs)
def translate(self, file_path: str, **kwargs: Optional[Any]) -> dict:
return self._execute_task("translate", file_path, **kwargs)
def _execute_task(self, mode: str, file_path: str, **kwargs: Optional[Any]) -> dict:
options = dict(task=mode)
options.update(kwargs)
if os.path.isdir(file_path):
result = []
files = [x for x in glob.glob(os.path.join(file_path,"*")) if os.path.splitext(x)[1] in AUDIO_FILES]
for file in files:
file_processed = dict(filename=file)
file_processed.update(self._file_extraction(file, **options))
result.append(file_processed)
else:
result = self._file_extraction(file_path, **options)
return result
def _formatter_result(self, input: dict) -> dict:
output = dict()
output["text"] = input["text"]
output["segments"] = [{key: segment[key] for key in SEGMENTS_INFO} for segment in input["segments"]]
return output
def _file_extraction(self, file_path: str, **kwargs: Optional[Any]) -> dict:
write = kwargs.pop("write",False)
result = self._formatter_result(
self.model.transcribe(file_path, **kwargs)
)
if write:
json_dump(result, f"{file_path.split('.')[0]}.json")
return result |