Spaces:

Nocigar
/

sillytavern

Running

App Files Files Community

sillytavern / public /scripts /extensions /tts /openai-compatible.js

Nocigar's picture

Upload 475 files

b82d373 verified 11 months ago

history blame contribute delete

7.58 kB

	import { getRequestHeaders } from '../../../script.js';
	import { callGenericPopup, POPUP_RESULT, POPUP_TYPE } from '../../popup.js';
	import { findSecret, SECRET_KEYS, secret_state, writeSecret } from '../../secrets.js';
	import { getPreviewString, saveTtsProviderSettings } from './index.js';

	export { OpenAICompatibleTtsProvider };

	/**
	 * TTS provider that talks to a speech endpoint through the
	 * '/api/openai/custom/generate-voice' route, sending the configured
	 * provider endpoint, model, voice and speed with every request.
	 *
	 * The class owns its settings UI (see `settingsHtml`) and keeps `settings`
	 * in sync with the form controls via `onSettingsChange`.
	 */
	class OpenAICompatibleTtsProvider {
	    /** Active settings object; assigned by `loadSettings`. */
	    settings;
	    /** Cached voice objects built from `settings.available_voices`. */
	    voices = [];
	    // Not referenced inside this class — presumably consumed by the TTS
	    // pipeline when joining text segments (TODO confirm against index.js).
	    separator = ' . ';

	    /** Audio element used only for voice previews. */
	    audioElement = document.createElement('audio');
	    /** Object URL of the preview currently attached to `audioElement`, if any. */
	    previewObjectUrl = null;

	    defaultSettings = {
	        voiceMap: {},
	        model: 'tts-1',
	        speed: 1,
	        available_voices: ['alloy', 'echo', 'fable', 'onyx', 'nova', 'shimmer'],
	        provider_endpoint: 'http://127.0.0.1:8000/v1/audio/speech',
	    };

	    /**
	     * Markup for the provider settings form, pre-filled with the defaults.
	     * `loadSettings` overwrites the values with the active settings afterwards.
	     * @returns {string} HTML fragment.
	     */
	    get settingsHtml() {
	        return `
	        <label for="openai_compatible_tts_endpoint">Provider Endpoint:</label>
	        <div class="flex-container alignItemsCenter">
	            <div class="flex1">
	                <input id="openai_compatible_tts_endpoint" type="text" class="text_pole" maxlength="250" value="${this.defaultSettings.provider_endpoint}"/>
	            </div>
	            <div id="openai_compatible_tts_key" class="menu_button menu_button_icon">
	                <i class="fa-solid fa-key"></i>
	                <span>API Key</span>
	            </div>
	        </div>
	        <label for="openai_compatible_model">Model:</label>
	        <input id="openai_compatible_model" type="text" class="text_pole" maxlength="250" value="${this.defaultSettings.model}"/>
	        <label for="openai_compatible_tts_voices">Available Voices (comma separated):</label>
	        <input id="openai_compatible_tts_voices" type="text" class="text_pole" maxlength="250" value="${this.defaultSettings.available_voices.join()}"/>
	        <label for="openai_compatible_tts_speed">Speed: <span id="openai_compatible_tts_speed_output"></span></label>
	        <input type="range" id="openai_compatible_tts_speed" value="1" min="0.25" max="4" step="0.05">`;
	    }

	    /**
	     * Applies saved settings on top of the defaults, pushes them into the
	     * settings form and wires up the form's event handlers.
	     * @param {object} settings Saved provider settings; may be empty.
	     * @throws {Error} If `settings` contains a key that `defaultSettings` does not define.
	     */
	    async loadSettings(settings) {
	        const incoming = settings ?? {};
	        if (Object.keys(incoming).length === 0) {
	            console.info('Using default TTS Provider settings');
	        }

	        // Start from a copy: assigning `defaultSettings` itself would let every
	        // later edit silently rewrite the defaults.
	        this.settings = {
	            ...this.defaultSettings,
	            voiceMap: { ...this.defaultSettings.voiceMap },
	            available_voices: [...this.defaultSettings.available_voices],
	        };

	        // Only accept keys defined in defaultSettings
	        for (const key of Object.keys(incoming)) {
	            if (!Object.hasOwn(this.settings, key)) {
	                throw new Error(`Invalid setting passed to TTS Provider: ${key}`);
	            }
	            this.settings[key] = incoming[key];
	        }

	        // Any previously cached voices belong to the old settings.
	        this.voices = [];

	        const onInput = () => { this.onSettingsChange(); };

	        $('#openai_compatible_tts_endpoint').val(this.settings.provider_endpoint);
	        $('#openai_compatible_tts_endpoint').on('input', onInput);

	        // Show the active model, not the default one.
	        $('#openai_compatible_model').val(this.settings.model);
	        $('#openai_compatible_model').on('input', onInput);

	        $('#openai_compatible_tts_voices').val(this.settings.available_voices.join());
	        $('#openai_compatible_tts_voices').on('input', onInput);

	        $('#openai_compatible_tts_speed').val(this.settings.speed);
	        $('#openai_compatible_tts_speed').on('input', onInput);

	        $('#openai_compatible_tts_speed_output').text(this.settings.speed);

	        this.updateKeyIndicator();
	        $('#openai_compatible_tts_key').on('click', () => this.promptForApiKey());

	        await this.checkReady();

	        console.debug('OpenAI Compatible TTS: Settings loaded');
	    }

	    /**
	     * Reflects on the API-key button whether a key is currently stored.
	     */
	    updateKeyIndicator() {
	        // jQuery only treats the second argument as a state when it is a real
	        // boolean; anything else (e.g. undefined) makes it toggle instead.
	        const hasKey = Boolean(secret_state[SECRET_KEYS.CUSTOM_OPENAI_TTS]);
	        $('#openai_compatible_tts_key').toggleClass('success', hasKey);
	    }

	    /**
	     * Opens the API-key popup and stores the entered key. The popup also
	     * offers a "Remove Key" button that clears the stored key.
	     */
	    async promptForApiKey() {
	        const popupText = 'OpenAI-compatible TTS API Key';
	        const savedKey = secret_state[SECRET_KEYS.CUSTOM_OPENAI_TTS] ? await findSecret(SECRET_KEYS.CUSTOM_OPENAI_TTS) : '';

	        const key = await callGenericPopup(popupText, POPUP_TYPE.INPUT, savedKey, {
	            customButtons: [{
	                text: 'Remove Key',
	                appendAtEnd: true,
	                result: POPUP_RESULT.NEGATIVE,
	                action: async () => {
	                    await writeSecret(SECRET_KEYS.CUSTOM_OPENAI_TTS, '');
	                    this.updateKeyIndicator();
	                    toastr.success('API Key removed');
	                    await this.onRefreshClick();
	                },
	            }],
	        });

	        // Nothing to save when the popup was dismissed or left empty. A plain
	        // falsy check also covers null/undefined results, which would
	        // otherwise be stored as the literal strings "null"/"undefined".
	        if (!key) {
	            return;
	        }

	        await writeSecret(SECRET_KEYS.CUSTOM_OPENAI_TTS, String(key));

	        toastr.success('API Key saved');
	        this.updateKeyIndicator();
	        await this.onRefreshClick();
	    }

	    /**
	     * Reads the settings form back into `settings` and persists the result.
	     */
	    onSettingsChange() {
	        // Update dynamically
	        this.settings.provider_endpoint = String($('#openai_compatible_tts_endpoint').val());
	        this.settings.model = String($('#openai_compatible_model').val());
	        // Tolerate "a, b" style input and stray commas: trim names, drop empties.
	        this.settings.available_voices = String($('#openai_compatible_tts_voices').val())
	            .split(',')
	            .map(name => name.trim())
	            .filter(name => name.length > 0);
	        this.settings.speed = Number($('#openai_compatible_tts_speed').val());
	        // The voice list may have changed, so the cache must be rebuilt on demand.
	        this.voices = [];
	        $('#openai_compatible_tts_speed_output').text(this.settings.speed);
	        saveTtsProviderSettings();
	    }

	    /**
	     * Readiness check; currently just builds the voice list.
	     */
	    async checkReady() {
	        await this.fetchTtsVoiceObjects();
	    }

	    /**
	     * Refresh hook; intentionally a no-op for this provider.
	     */
	    async onRefreshClick() {
	        return;
	    }

	    /**
	     * Looks up a voice object by name, building the voice cache if needed.
	     * @param {string} voiceName Name of the voice to find.
	     * @returns {Promise<{name: string, voice_id: string, lang: string}>} The matching voice.
	     * @throws {Error} If no voice with that name is configured.
	     */
	    async getVoice(voiceName) {
	        if (this.voices.length === 0) {
	            this.voices = await this.fetchTtsVoiceObjects();
	        }
	        const match = this.voices.find(oaicVoice => oaicVoice.name === voiceName);
	        if (!match) {
	            throw new Error(`TTS Voice name ${voiceName} not found`);
	        }
	        return match;
	    }

	    /**
	     * Generates speech for the given text.
	     * @param {string} text Text to synthesize.
	     * @param {string} voiceId Voice identifier sent to the endpoint.
	     * @returns {Promise<Response>} The successful fetch response carrying the audio.
	     */
	    async generateTts(text, voiceId) {
	        return this.fetchTtsGeneration(text, voiceId);
	    }

	    /**
	     * Builds voice objects from `settings.available_voices`. Name and id are
	     * the same string; the language is always reported as 'en-US'.
	     * @returns {Promise<Array<{name: string, voice_id: string, lang: string}>>}
	     */
	    async fetchTtsVoiceObjects() {
	        return this.settings.available_voices.map(v => ({ name: v, voice_id: v, lang: 'en-US' }));
	    }

	    /**
	     * Revokes the object URL of the last preview, if one is still alive.
	     */
	    releasePreviewUrl() {
	        if (this.previewObjectUrl) {
	            URL.revokeObjectURL(this.previewObjectUrl);
	            this.previewObjectUrl = null;
	        }
	    }

	    /**
	     * Generates a short preview with the given voice and plays it.
	     * @param {string} voiceId Voice identifier to preview.
	     * @throws {Error} If generation fails or playback cannot start.
	     */
	    async previewTtsVoice(voiceId) {
	        this.audioElement.pause();
	        this.audioElement.currentTime = 0;
	        // An interrupted preview never fires `ended`, so free its URL here.
	        this.releasePreviewUrl();

	        const text = getPreviewString('en-US');
	        const response = await this.fetchTtsGeneration(text, voiceId);
	        if (!response.ok) {
	            throw new Error(`HTTP ${response.status}`);
	        }

	        const audio = await response.blob();
	        // A concurrent preview may have attached a URL while we were waiting.
	        this.releasePreviewUrl();
	        const url = URL.createObjectURL(audio);
	        this.previewObjectUrl = url;
	        // Register the cleanup before playback starts so it cannot be missed.
	        this.audioElement.onended = () => this.releasePreviewUrl();
	        this.audioElement.src = url;

	        try {
	            await this.audioElement.play();
	        } catch (error) {
	            // A newer preview pausing this one is expected, not a failure.
	            if (error?.name === 'AbortError') {
	                return;
	            }
	            throw error;
	        }
	    }

	    /**
	     * Requests speech generation from '/api/openai/custom/generate-voice'.
	     * @param {string} inputText Text to synthesize.
	     * @param {string} voiceId Voice identifier sent as `voice`.
	     * @returns {Promise<Response>} The successful fetch response (mp3 requested).
	     * @throws {Error} If the response status is not OK; an error toast is shown as well.
	     */
	    async fetchTtsGeneration(inputText, voiceId) {
	        console.info(`Generating new TTS for voice_id ${voiceId}`);
	        const response = await fetch('/api/openai/custom/generate-voice', {
	            method: 'POST',
	            headers: getRequestHeaders(),
	            body: JSON.stringify({
	                provider_endpoint: this.settings.provider_endpoint,
	                model: this.settings.model,
	                input: inputText,
	                voice: voiceId,
	                response_format: 'mp3',
	                speed: this.settings.speed,
	            }),
	        });

	        if (!response.ok) {
	            toastr.error(response.statusText, 'TTS Generation Failed');
	            throw new Error(`HTTP ${response.status}: ${await response.text()}`);
	        }

	        return response;
	    }
	}