import { getRequestHeaders } from '../../../script.js';
import { callGenericPopup, POPUP_RESULT, POPUP_TYPE } from '../../popup.js';
import { findSecret, SECRET_KEYS, secret_state, writeSecret } from '../../secrets.js';
import { getPreviewString, saveTtsProviderSettings } from './index.js';

export { OpenAICompatibleTtsProvider };

/**
 * TTS provider that talks to an OpenAI-compatible speech endpoint.
 *
 * Generation requests are not sent to the endpoint directly: they are POSTed to
 * the local `/api/openai/custom/generate-voice` route together with the
 * configured `provider_endpoint`, model, voice and speed.
 */
class OpenAICompatibleTtsProvider {
    /** Active settings; populated by {@link loadSettings}. */
    settings;
    /** Cache of voice objects, lazily filled by {@link getVoice}. */
    voices = [];
    // NOTE(review): presumably consumed by the TTS extension when joining text segments — confirm against the caller.
    separator = ' . ';
    /** Audio element used only for voice previews. */
    audioElement = document.createElement('audio');

    /** Baseline settings; also defines the set of accepted setting keys. */
    defaultSettings = {
        voiceMap: {},
        model: 'tts-1',
        speed: 1,
        available_voices: ['alloy', 'echo', 'fable', 'onyx', 'nova', 'shimmer'],
        provider_endpoint: 'http://127.0.0.1:8000/v1/audio/speech',
    };

    /**
     * Markup for the provider settings panel.
     * @returns {string} HTML string.
     */
    get settingsHtml() {
        const html = `
`;
        return html;
    }

    /**
     * Applies saved settings on top of the defaults, fills the settings UI and
     * wires up its event handlers.
     *
     * @param {object} settings - Previously saved settings; every key must exist in `defaultSettings`.
     * @returns {Promise<void>}
     * @throws {string} If `settings` contains a key that is not a known setting.
     */
    async loadSettings(settings) {
        // Populate Provider UI given input settings
        if (Object.keys(settings).length === 0) {
            console.info('Using default TTS Provider settings');
        }

        // Start from a copy so that loading settings never rewrites the defaults themselves.
        this.settings = {
            ...this.defaultSettings,
            voiceMap: { ...this.defaultSettings.voiceMap },
            available_voices: [...this.defaultSettings.available_voices],
        };

        // Only accept keys defined in defaultSettings
        for (const [key, value] of Object.entries(settings)) {
            if (key in this.settings) {
                this.settings[key] = value;
            } else {
                throw `Invalid setting passed to TTS Provider: ${key}`;
            }
        }

        $('#openai_compatible_tts_endpoint').val(this.settings.provider_endpoint);
        $('#openai_compatible_tts_endpoint').on('input', () => { this.onSettingsChange(); });

        // Show the loaded model, not the default one.
        $('#openai_compatible_model').val(this.settings.model);
        $('#openai_compatible_model').on('input', () => { this.onSettingsChange(); });

        $('#openai_compatible_tts_voices').val(this.settings.available_voices.join());
        $('#openai_compatible_tts_voices').on('input', () => { this.onSettingsChange(); });

        $('#openai_compatible_tts_speed').val(this.settings.speed);
        $('#openai_compatible_tts_speed').on('input', () => { this.onSettingsChange(); });
        $('#openai_compatible_tts_speed_output').text(this.settings.speed);

        // jQuery only treats the second toggleClass argument as "add/remove" when it is a
        // real boolean; anything else (e.g. undefined) flips the class instead.
        $('#openai_compatible_tts_key').toggleClass('success', Boolean(secret_state[SECRET_KEYS.CUSTOM_OPENAI_TTS]));
        $('#openai_compatible_tts_key').on('click', async () => {
            const popupText = 'OpenAI-compatible TTS API Key';
            const savedKey = secret_state[SECRET_KEYS.CUSTOM_OPENAI_TTS]
                ? await findSecret(SECRET_KEYS.CUSTOM_OPENAI_TTS)
                : '';

            const key = await callGenericPopup(popupText, POPUP_TYPE.INPUT, savedKey, {
                customButtons: [{
                    text: 'Remove Key',
                    appendAtEnd: true,
                    result: POPUP_RESULT.NEGATIVE,
                    action: async () => {
                        await writeSecret(SECRET_KEYS.CUSTOM_OPENAI_TTS, '');
                        $('#openai_compatible_tts_key').toggleClass('success', Boolean(secret_state[SECRET_KEYS.CUSTOM_OPENAI_TTS]));
                        toastr.success('API Key removed');
                        await this.onRefreshClick();
                    },
                }],
            });

            // Nothing entered (or the popup did not yield a value): leave the stored key untouched.
            if (!key) {
                return;
            }

            await writeSecret(SECRET_KEYS.CUSTOM_OPENAI_TTS, String(key));

            toastr.success('API Key saved');
            $('#openai_compatible_tts_key').toggleClass('success', Boolean(secret_state[SECRET_KEYS.CUSTOM_OPENAI_TTS]));
            await this.onRefreshClick();
        });

        await this.checkReady();

        console.debug('OpenAI Compatible TTS: Settings loaded');
    }

    /**
     * Reads the current values of the settings inputs into `this.settings`,
     * refreshes the speed label and persists the settings.
     */
    onSettingsChange() {
        // Update dynamically
        this.settings.provider_endpoint = String($('#openai_compatible_tts_endpoint').val());
        this.settings.model = String($('#openai_compatible_model').val());
        // Tolerate "a, b" style input and trailing commas: trim each name and drop empty ones.
        this.settings.available_voices = String($('#openai_compatible_tts_voices').val())
            .split(',')
            .map(voice => voice.trim())
            .filter(voice => voice.length > 0);
        this.settings.speed = Number($('#openai_compatible_tts_speed').val());
        $('#openai_compatible_tts_speed_output').text(this.settings.speed);
        saveTtsProviderSettings();
    }

    /**
     * Readiness check; here it only builds the voice list from the settings.
     * @returns {Promise<void>}
     */
    async checkReady() {
        await this.fetchTtsVoiceObjects();
    }

    /**
     * Refresh hook; intentionally does nothing for this provider.
     * @returns {Promise<void>}
     */
    async onRefreshClick() {
        return;
    }

    /**
     * Looks up a voice object by name, building the voice cache on first use.
     *
     * @param {string} voiceName - Name of the voice to find.
     * @returns {Promise<{name: string, voice_id: string, lang: string}>} The matching voice object.
     * @throws {string} If no voice with that name exists.
     */
    async getVoice(voiceName) {
        if (this.voices.length === 0) {
            this.voices = await this.fetchTtsVoiceObjects();
        }
        const match = this.voices.find(oaicVoice => oaicVoice.name === voiceName);

        if (!match) {
            throw `TTS Voice name ${voiceName} not found`;
        }
        return match;
    }

    /**
     * Generates speech for the given text.
     *
     * @param {string} text - Text to synthesize.
     * @param {string} voiceId - Voice identifier sent as `voice`.
     * @returns {Promise<Response>} The successful fetch response carrying the audio.
     */
    async generateTts(text, voiceId) {
        const response = await this.fetchTtsGeneration(text, voiceId);
        return response;
    }

    /**
     * Builds voice objects from the configured `available_voices` list.
     * @returns {Promise<Array<{name: string, voice_id: string, lang: string}>>}
     */
    async fetchTtsVoiceObjects() {
        return this.settings.available_voices.map(v => {
            return { name: v, voice_id: v, lang: 'en-US' };
        });
    }

    /**
     * Generates the preview sentence with the given voice and plays it,
     * stopping any preview that is currently playing.
     *
     * @param {string} voiceId - Voice identifier to preview.
     * @returns {Promise<void>}
     * @throws {Error} If generation fails.
     */
    async previewTtsVoice(voiceId) {
        this.audioElement.pause();
        this.audioElement.currentTime = 0;

        const text = getPreviewString('en-US');
        const response = await this.fetchTtsGeneration(text, voiceId);

        // fetchTtsGeneration already throws on failure; kept as a defensive guard.
        if (!response.ok) {
            throw new Error(`HTTP ${response.status}`);
        }

        const audio = await response.blob();
        const url = URL.createObjectURL(audio);

        // An interrupted preview never fires `ended`, so release its blob URL here.
        // Revoking a URL that was already revoked is a no-op.
        const previousUrl = this.audioElement.src;
        if (previousUrl.startsWith('blob:')) {
            URL.revokeObjectURL(previousUrl);
        }

        this.audioElement.src = url;
        this.audioElement.play();
        this.audioElement.onended = () => URL.revokeObjectURL(url);
    }

    /**
     * Requests speech generation through the local proxy route.
     *
     * @param {string} inputText - Text to synthesize.
     * @param {string} voiceId - Voice identifier sent as `voice`.
     * @returns {Promise<Response>} The fetch response (only returned when `response.ok`).
     * @throws {Error} With the HTTP status and response body when the request fails.
     */
    async fetchTtsGeneration(inputText, voiceId) {
        console.info(`Generating new TTS for voice_id ${voiceId}`);
        const response = await fetch('/api/openai/custom/generate-voice', {
            method: 'POST',
            headers: getRequestHeaders(),
            body: JSON.stringify({
                provider_endpoint: this.settings.provider_endpoint,
                model: this.settings.model,
                input: inputText,
                voice: voiceId,
                response_format: 'mp3',
                speed: this.settings.speed,
            }),
        });

        if (!response.ok) {
            toastr.error(response.statusText, 'TTS Generation Failed');
            throw new Error(`HTTP ${response.status}: ${await response.text()}`);
        }

        return response;
    }
}