tts-openai / src /infer /model_inference.py
imseldrith's picture
Upload folder using huggingface_hub
f32a529 verified
raw
history blame
3.33 kB
import ast
import json
import os
import torch
from mosestokenizer import *
from tts_infer.transliterate import XlitEngine
from tts_infer.tts import TextToMel, MelToWav
from src import log_setup, utilities
from src.config import settings
LOGGER = log_setup.get_logger(__name__)
def get_gpu_info(gpu):
LOGGER.info(f"*** GPU is enabled: {gpu} ***")
if gpu:
no_gpus = torch.cuda.device_count()
LOGGER.info(f"*** Total number of gpus allocated are {no_gpus} ***")
LOGGER.info(f"*** Cuda Version {torch.version.cuda} ***")
LOGGER.info(f"*** Python process id {os.getpid()} ***")
LOGGER.info("*** The gpu device info : ***")
for gpu in range(0, no_gpus):
LOGGER.info(f"GPU {str(gpu)} - {str(torch.cuda.get_device_name(gpu))}")
class ModelService:
def __init__(self):
LOGGER.info(f'Loading with settings {settings}')
gpu_present = torch.cuda.is_available()
LOGGER.info("Gpu present : %s", gpu_present)
get_gpu_info(settings.gpu)
self.device = "cuda" if gpu_present & settings.gpu else "cpu"
LOGGER.info("Using device : %s", self.device)
model_config_file_path = settings.models_base_path + settings.model_config_file_path
if os.path.exists(model_config_file_path):
with open(model_config_file_path, 'r') as f:
model_config = json.load(f)
else:
raise Exception(f'Model configuration file is missing at {model_config_file_path}')
languages = ast.literal_eval(utilities.get_env_var('languages', '["all"]'))
self.supported_languages = list(model_config.keys())
LOGGER.info(f'supported languages {self.supported_languages}')
self.available_choice = {}
LOGGER.info(f'requested languages are {languages}')
for language_code, lang_config in model_config.items():
if language_code in languages or 'all' in languages:
if lang_config.get("male_glow") is not None:
self.available_choice[f"{language_code}_male"] = [
TextToMel(glow_model_dir=settings.models_base_path + lang_config.get("male_glow"),
device=self.device),
MelToWav(hifi_model_dir=settings.models_base_path + lang_config.get("male_hifi"),
device=self.device)]
if lang_config.get("female_glow") is not None:
self.available_choice[f"{language_code}_female"] = [
TextToMel(glow_model_dir=settings.models_base_path + lang_config.get("female_glow"),
device=self.device),
MelToWav(hifi_model_dir=settings.models_base_path + lang_config.get("female_hifi"),
device=self.device)]
LOGGER.info(f'{language_code} Models initialized successfully')
LOGGER.info(f'Model service available_choices are {self.available_choice}')
if len(self.available_choice) == 0:
LOGGER.error(
f'Invalid languages requested in {languages} ,only supported languages are {self.supported_languages}')
raise Exception(f'Invalid languages requested')
self.transliterate_obj = XlitEngine()