Spaces:
Paused
Paused
| import { getRequestHeaders } from '../../../script.js'; | |
| import { callGenericPopup, POPUP_RESULT, POPUP_TYPE } from '../../popup.js'; | |
| import { findSecret, SECRET_KEYS, secret_state, writeSecret } from '../../secrets.js'; | |
| import { getPreviewString, saveTtsProviderSettings } from './index.js'; | |
| export { OpenAICompatibleTtsProvider }; | |
/**
 * TTS provider for any server exposing an OpenAI-compatible speech endpoint.
 *
 * Generation requests are not sent to the endpoint directly; they are posted
 * to the `/api/openai/custom/generate-voice` route together with the
 * configured endpoint, model, voice and speed.
 */
class OpenAICompatibleTtsProvider {
    /** Active settings object; assigned by loadSettings(). */
    settings;

    /** Cached voice objects derived from `settings.available_voices`. */
    voices = [];

    // Not referenced inside this class; presumably consumed by the TTS
    // extension when joining text chunks — confirm against the caller.
    separator = ' . ';

    /** Audio element used for voice previews. */
    audioElement = document.createElement('audio');

    /** Fallback values; also the whitelist of accepted setting keys. */
    defaultSettings = {
        voiceMap: {},
        model: 'tts-1',
        speed: 1,
        available_voices: ['alloy', 'echo', 'fable', 'onyx', 'nova', 'shimmer'],
        provider_endpoint: 'http://127.0.0.1:8000/v1/audio/speech',
    };

    /**
     * Markup for the provider's settings panel, pre-filled with the defaults.
     * @returns {string} HTML string.
     */
    get settingsHtml() {
        return `
        <label for="openai_compatible_tts_endpoint">Provider Endpoint:</label>
        <div class="flex-container alignItemsCenter">
            <div class="flex1">
                <input id="openai_compatible_tts_endpoint" type="text" class="text_pole" maxlength="250" value="${this.defaultSettings.provider_endpoint}"/>
            </div>
            <div id="openai_compatible_tts_key" class="menu_button menu_button_icon">
                <i class="fa-solid fa-key"></i>
                <span>API Key</span>
            </div>
        </div>
        <label for="openai_compatible_model">Model:</label>
        <input id="openai_compatible_model" type="text" class="text_pole" maxlength="250" value="${this.defaultSettings.model}"/>
        <label for="openai_compatible_tts_voices">Available Voices (comma separated):</label>
        <input id="openai_compatible_tts_voices" type="text" class="text_pole" maxlength="250" value="${this.defaultSettings.available_voices.join()}"/>
        <label for="openai_compatible_tts_speed">Speed: <span id="openai_compatible_tts_speed_output"></span></label>
        <input type="range" id="openai_compatible_tts_speed" value="1" min="0.25" max="4" step="0.05">`;
    }

    /**
     * Applies stored settings on top of the defaults, fills the settings UI
     * and wires up its event handlers.
     * @param {object} [settings] Stored provider settings; only keys present
     *   in `defaultSettings` are accepted. `null`/`undefined` means "use defaults".
     * @returns {Promise<void>}
     * @throws {Error} If `settings` contains a key not defined in `defaultSettings`.
     */
    async loadSettings(settings) {
        const incoming = settings ?? {};
        if (Object.keys(incoming).length === 0) {
            console.info('Using default TTS Provider settings');
        }

        // Start from a copy so user values never overwrite the defaults
        // (the nested containers are copied too, so they are not shared).
        this.settings = {
            ...this.defaultSettings,
            voiceMap: { ...this.defaultSettings.voiceMap },
            available_voices: [...this.defaultSettings.available_voices],
        };

        // Only accept keys defined in defaultSettings. Object.hasOwn avoids
        // accepting inherited names such as "toString".
        for (const [key, value] of Object.entries(incoming)) {
            if (!Object.hasOwn(this.defaultSettings, key)) {
                throw new Error(`Invalid setting passed to TTS Provider: ${key}`);
            }
            this.settings[key] = value;
        }

        const handleChange = () => { this.onSettingsChange(); };

        $('#openai_compatible_tts_endpoint').val(this.settings.provider_endpoint);
        $('#openai_compatible_tts_endpoint').on('input', handleChange);

        // Show the loaded model, not the default one.
        $('#openai_compatible_model').val(this.settings.model);
        $('#openai_compatible_model').on('input', handleChange);

        $('#openai_compatible_tts_voices').val(this.settings.available_voices.join());
        $('#openai_compatible_tts_voices').on('input', handleChange);

        $('#openai_compatible_tts_speed').val(this.settings.speed);
        $('#openai_compatible_tts_speed').on('input', handleChange);
        $('#openai_compatible_tts_speed_output').text(this.settings.speed);

        this.refreshApiKeyIndicator();
        $('#openai_compatible_tts_key').on('click', () => this.promptForApiKey());

        await this.checkReady();
        console.debug('OpenAI Compatible TTS: Settings loaded');
    }

    /**
     * Marks the API key button as "success" when a key is stored.
     * The state is coerced to a real boolean because jQuery's toggleClass
     * flips the class (instead of setting it) when given a non-boolean.
     */
    refreshApiKeyIndicator() {
        const hasKey = Boolean(secret_state[SECRET_KEYS.CUSTOM_OPENAI_TTS]);
        $('#openai_compatible_tts_key').toggleClass('success', hasKey);
    }

    /**
     * Opens the API key popup and stores (or removes) the key.
     * @returns {Promise<void>}
     */
    async promptForApiKey() {
        const popupText = 'OpenAI-compatible TTS API Key';
        const savedKey = secret_state[SECRET_KEYS.CUSTOM_OPENAI_TTS]
            ? await findSecret(SECRET_KEYS.CUSTOM_OPENAI_TTS)
            : '';

        const key = await callGenericPopup(popupText, POPUP_TYPE.INPUT, savedKey, {
            customButtons: [{
                text: 'Remove Key',
                appendAtEnd: true,
                result: POPUP_RESULT.NEGATIVE,
                action: async () => {
                    await writeSecret(SECRET_KEYS.CUSTOM_OPENAI_TTS, '');
                    this.refreshApiKeyIndicator();
                    toastr.success('API Key removed');
                    await this.onRefreshClick();
                },
            }],
        });

        // Any falsy result (false, null, undefined, '') means "nothing to
        // save"; this prevents String(null) from being stored as a key.
        if (!key) {
            return;
        }

        await writeSecret(SECRET_KEYS.CUSTOM_OPENAI_TTS, String(key));
        toastr.success('API Key saved');
        this.refreshApiKeyIndicator();
        await this.onRefreshClick();
    }

    /**
     * Reads the current values from the settings UI into `this.settings`
     * and persists them.
     */
    onSettingsChange() {
        this.settings.provider_endpoint = String($('#openai_compatible_tts_endpoint').val());
        this.settings.model = String($('#openai_compatible_model').val());

        // Tolerate "a, b" and trailing commas: trim entries and drop blanks.
        this.settings.available_voices = String($('#openai_compatible_tts_voices').val())
            .split(',')
            .map((voice) => voice.trim())
            .filter((voice) => voice.length > 0);

        this.settings.speed = Number($('#openai_compatible_tts_speed').val());
        $('#openai_compatible_tts_speed_output').text(this.settings.speed);

        // The voice list may have changed; force getVoice() to rebuild it.
        this.voices = [];

        saveTtsProviderSettings();
    }

    /**
     * Readiness check; currently just builds the voice list.
     * @returns {Promise<void>}
     */
    async checkReady() {
        await this.fetchTtsVoiceObjects();
    }

    /**
     * Refresh hook; this provider has nothing to refresh.
     * @returns {Promise<void>}
     */
    async onRefreshClick() {
        return;
    }

    /**
     * Looks up a voice object by name, building the cache on first use.
     * @param {string} voiceName Voice name to look up.
     * @returns {Promise<{name: string, voice_id: string, lang: string}>}
     * @throws {Error} If no configured voice has that name.
     */
    async getVoice(voiceName) {
        if (this.voices.length === 0) {
            this.voices = await this.fetchTtsVoiceObjects();
        }

        const match = this.voices.find((voice) => voice.name === voiceName);
        if (!match) {
            throw new Error(`TTS Voice name ${voiceName} not found`);
        }
        return match;
    }

    /**
     * Generates speech for the given text.
     * @param {string} text Text to synthesize.
     * @param {string} voiceId Voice identifier.
     * @returns {Promise<Response>} The successful fetch response.
     */
    async generateTts(text, voiceId) {
        return this.fetchTtsGeneration(text, voiceId);
    }

    /**
     * Builds voice objects from `settings.available_voices`.
     * @returns {Promise<Array<{name: string, voice_id: string, lang: string}>>}
     */
    async fetchTtsVoiceObjects() {
        return this.settings.available_voices.map((voice) => ({
            name: voice,
            voice_id: voice,
            lang: 'en-US',
        }));
    }

    /**
     * Generates a short sample with the given voice and plays it.
     * @param {string} voiceId Voice identifier.
     * @returns {Promise<void>}
     * @throws {Error} If generation fails (propagated from fetchTtsGeneration).
     */
    async previewTtsVoice(voiceId) {
        this.audioElement.pause();
        this.audioElement.currentTime = 0;

        const text = getPreviewString('en-US');
        // fetchTtsGeneration throws on a non-OK response, so no status check here.
        const response = await this.fetchTtsGeneration(text, voiceId);
        const audio = await response.blob();

        // Release the blob of a preview that was interrupted before "ended".
        const previousUrl = this.audioElement.src;
        if (typeof previousUrl === 'string' && previousUrl.startsWith('blob:')) {
            URL.revokeObjectURL(previousUrl);
        }

        const url = URL.createObjectURL(audio);
        // Register the cleanup before playback starts.
        this.audioElement.onended = () => URL.revokeObjectURL(url);
        this.audioElement.src = url;

        // play() returns a promise; do not leave its rejection unhandled.
        this.audioElement.play().catch((error) => {
            console.error('OpenAI Compatible TTS: preview playback failed', error);
        });
    }

    /**
     * Posts a generation request to the `/api/openai/custom/generate-voice` route.
     * @param {string} inputText Text to synthesize.
     * @param {string} voiceId Voice identifier.
     * @returns {Promise<Response>} The successful fetch response.
     * @throws {Error} On a non-OK HTTP status (an error toast is shown first).
     */
    async fetchTtsGeneration(inputText, voiceId) {
        console.info(`Generating new TTS for voice_id ${voiceId}`);

        const response = await fetch('/api/openai/custom/generate-voice', {
            method: 'POST',
            headers: getRequestHeaders(),
            body: JSON.stringify({
                provider_endpoint: this.settings.provider_endpoint,
                model: this.settings.model,
                input: inputText,
                voice: voiceId,
                response_format: 'mp3',
                speed: this.settings.speed,
            }),
        });

        if (!response.ok) {
            toastr.error(response.statusText, 'TTS Generation Failed');
            throw new Error(`HTTP ${response.status}: ${await response.text()}`);
        }

        return response;
    }
}