mirror of
				https://github.com/SillyTavern/SillyTavern.git
				synced 2025-06-05 21:59:27 +02:00 
			
		
		
		
	
		
			
				
	
	
		
			271 lines
		
	
	
		
			8.5 KiB
		
	
	
	
		
			JavaScript
		
	
	
	
	
	
			
		
		
	
	
			271 lines
		
	
	
		
			8.5 KiB
		
	
	
	
		
			JavaScript
		
	
	
	
	
	
import { getRequestHeaders } from '../../../script.js';
 | 
						|
import { getApiUrl } from '../../extensions.js';
 | 
						|
import { doExtrasFetch, modules } from '../../extensions.js';
 | 
						|
import { getPreviewString } from './index.js';
 | 
						|
import { saveTtsProviderSettings } from './index.js';
 | 
						|
 | 
						|
export { EdgeTtsProvider };
 | 
						|
 | 
						|
const EDGE_TTS_PROVIDER = {
 | 
						|
    extras: 'extras',
 | 
						|
    plugin: 'plugin',
 | 
						|
};
 | 
						|
 | 
						|
class EdgeTtsProvider {
 | 
						|
    //########//
 | 
						|
    // Config //
 | 
						|
    //########//
 | 
						|
 | 
						|
    settings;
 | 
						|
    voices = [];
 | 
						|
    separator = ' . ';
 | 
						|
    audioElement = document.createElement('audio');
 | 
						|
 | 
						|
    defaultSettings = {
 | 
						|
        voiceMap: {},
 | 
						|
        rate: 0,
 | 
						|
        provider: EDGE_TTS_PROVIDER.extras,
 | 
						|
    };
 | 
						|
 | 
						|
    get settingsHtml() {
 | 
						|
        let html = `Microsoft Edge TTS<br>
 | 
						|
        <label for="edge_tts_provider">Provider</label>
 | 
						|
        <select id="edge_tts_provider">
 | 
						|
            <option value="${EDGE_TTS_PROVIDER.extras}">Extras</option>
 | 
						|
            <option value="${EDGE_TTS_PROVIDER.plugin}">Plugin</option>
 | 
						|
        </select>
 | 
						|
        <label for="edge_tts_rate">Rate: <span id="edge_tts_rate_output"></span></label>
 | 
						|
        <input id="edge_tts_rate" type="range" value="${this.defaultSettings.rate}" min="-100" max="100" step="1" />
 | 
						|
        `;
 | 
						|
        return html;
 | 
						|
    }
 | 
						|
 | 
						|
    onSettingsChange() {
 | 
						|
        this.settings.rate = Number($('#edge_tts_rate').val());
 | 
						|
        $('#edge_tts_rate_output').text(this.settings.rate);
 | 
						|
        this.settings.provider = String($('#edge_tts_provider').val());
 | 
						|
        saveTtsProviderSettings();
 | 
						|
    }
 | 
						|
 | 
						|
    async loadSettings(settings) {
 | 
						|
        // Pupulate Provider UI given input settings
 | 
						|
        if (Object.keys(settings).length == 0) {
 | 
						|
            console.info('Using default TTS Provider settings');
 | 
						|
        }
 | 
						|
 | 
						|
        // Only accept keys defined in defaultSettings
 | 
						|
        this.settings = this.defaultSettings;
 | 
						|
 | 
						|
        for (const key in settings) {
 | 
						|
            if (key in this.settings) {
 | 
						|
                this.settings[key] = settings[key];
 | 
						|
            } else {
 | 
						|
                throw `Invalid setting passed to TTS Provider: ${key}`;
 | 
						|
            }
 | 
						|
        }
 | 
						|
 | 
						|
        $('#edge_tts_rate').val(this.settings.rate || 0);
 | 
						|
        $('#edge_tts_rate_output').text(this.settings.rate || 0);
 | 
						|
        $('#edge_tts_rate').on('input', () => { this.onSettingsChange(); });
 | 
						|
        $('#edge_tts_provider').val(this.settings.provider || EDGE_TTS_PROVIDER.extras);
 | 
						|
        $('#edge_tts_provider').on('change', () => { this.onSettingsChange(); });
 | 
						|
        await this.checkReady();
 | 
						|
 | 
						|
        console.debug('EdgeTTS: Settings loaded');
 | 
						|
    }
 | 
						|
 | 
						|
    /**
 | 
						|
    * Perform a simple readiness check by trying to fetch voiceIds
 | 
						|
    */
 | 
						|
    async checkReady() {
 | 
						|
        await this.throwIfModuleMissing();
 | 
						|
        await this.fetchTtsVoiceObjects();
 | 
						|
    }
 | 
						|
 | 
						|
    async onRefreshClick() {
 | 
						|
        return;
 | 
						|
    }
 | 
						|
 | 
						|
    //#################//
 | 
						|
    //  TTS Interfaces //
 | 
						|
    //#################//
 | 
						|
 | 
						|
    /**
 | 
						|
     * Get a voice from the TTS provider.
 | 
						|
     * @param {string} voiceName Voice name to get
 | 
						|
     * @returns {Promise<Object>} Voice object
 | 
						|
     */
 | 
						|
    async getVoice(voiceName) {
 | 
						|
        if (this.voices.length == 0) {
 | 
						|
            this.voices = await this.fetchTtsVoiceObjects();
 | 
						|
        }
 | 
						|
        const match = this.voices.filter(
 | 
						|
            voice => voice.name == voiceName,
 | 
						|
        )[0];
 | 
						|
        if (!match) {
 | 
						|
            throw `TTS Voice name ${voiceName} not found`;
 | 
						|
        }
 | 
						|
        return match;
 | 
						|
    }
 | 
						|
 | 
						|
    /**
 | 
						|
     * Generate TTS for a given text.
 | 
						|
     * @param {string} text Text to generate TTS for
 | 
						|
     * @param {string} voiceId Voice ID to use
 | 
						|
     * @returns {Promise<Response>} Fetch response
 | 
						|
     */
 | 
						|
    async generateTts(text, voiceId) {
 | 
						|
        const response = await this.fetchTtsGeneration(text, voiceId);
 | 
						|
        return response;
 | 
						|
    }
 | 
						|
 | 
						|
    //###########//
 | 
						|
    // API CALLS //
 | 
						|
    //###########//
 | 
						|
    async fetchTtsVoiceObjects() {
 | 
						|
        await this.throwIfModuleMissing();
 | 
						|
 | 
						|
        const url = this.getVoicesUrl();
 | 
						|
        const response = await this.doFetch(url);
 | 
						|
        if (!response.ok) {
 | 
						|
            throw new Error(`HTTP ${response.status}: ${await response.text()}`);
 | 
						|
        }
 | 
						|
        let responseJson = await response.json();
 | 
						|
        responseJson = responseJson
 | 
						|
            .sort((a, b) => a.Locale.localeCompare(b.Locale) || a.ShortName.localeCompare(b.ShortName))
 | 
						|
            .map(x => ({ name: x.ShortName, voice_id: x.ShortName, preview_url: false, lang: x.Locale }));
 | 
						|
        return responseJson;
 | 
						|
    }
 | 
						|
 | 
						|
    /**
 | 
						|
     * Preview TTS for a given voice ID.
 | 
						|
     * @param {string} id Voice ID
 | 
						|
     */
 | 
						|
    async previewTtsVoice(id) {
 | 
						|
        this.audioElement.pause();
 | 
						|
        this.audioElement.currentTime = 0;
 | 
						|
        const voice = await this.getVoice(id);
 | 
						|
        const text = getPreviewString(voice.lang);
 | 
						|
        const response = await this.fetchTtsGeneration(text, id);
 | 
						|
        if (!response.ok) {
 | 
						|
            throw new Error(`HTTP ${response.status}: ${await response.text()}`);
 | 
						|
        }
 | 
						|
 | 
						|
        const audio = await response.blob();
 | 
						|
        const url = URL.createObjectURL(audio);
 | 
						|
        this.audioElement.src = url;
 | 
						|
        this.audioElement.play();
 | 
						|
        this.audioElement.onended = () => URL.revokeObjectURL(url);
 | 
						|
    }
 | 
						|
 | 
						|
    /**
 | 
						|
     * Fetch TTS generation from the API.
 | 
						|
     * @param {string} inputText Text to generate TTS for
 | 
						|
     * @param {string} voiceId Voice ID to use
 | 
						|
     * @returns {Promise<Response>} Fetch response
 | 
						|
     */
 | 
						|
    async fetchTtsGeneration(inputText, voiceId) {
 | 
						|
        await this.throwIfModuleMissing();
 | 
						|
 | 
						|
        console.info(`Generating new TTS for voice_id ${voiceId}`);
 | 
						|
        const url = this.getGenerateUrl();
 | 
						|
        const response = await this.doFetch(url,
 | 
						|
            {
 | 
						|
                method: 'POST',
 | 
						|
                headers: getRequestHeaders(),
 | 
						|
                body: JSON.stringify({
 | 
						|
                    'text': inputText,
 | 
						|
                    'voice': voiceId,
 | 
						|
                    'rate': Number(this.settings.rate),
 | 
						|
                }),
 | 
						|
            },
 | 
						|
        );
 | 
						|
        if (!response.ok) {
 | 
						|
            toastr.error(response.statusText, 'TTS Generation Failed');
 | 
						|
            throw new Error(`HTTP ${response.status}: ${await response.text()}`);
 | 
						|
        }
 | 
						|
        return response;
 | 
						|
    }
 | 
						|
 | 
						|
    /**
 | 
						|
     * Perform a fetch request using the configured provider.
 | 
						|
     * @param {string} url URL string
 | 
						|
     * @param {any} options Request options
 | 
						|
     * @returns {Promise<Response>} Fetch response
 | 
						|
     */
 | 
						|
    doFetch(url, options) {
 | 
						|
        if (this.settings.provider === EDGE_TTS_PROVIDER.extras) {
 | 
						|
            return doExtrasFetch(url, options);
 | 
						|
        }
 | 
						|
 | 
						|
        if (this.settings.provider === EDGE_TTS_PROVIDER.plugin) {
 | 
						|
            return fetch(url, options);
 | 
						|
        }
 | 
						|
 | 
						|
        throw new Error('Invalid TTS Provider');
 | 
						|
    }
 | 
						|
 | 
						|
    /**
 | 
						|
     * Get the URL for the TTS generation endpoint.
 | 
						|
     * @returns {string} URL string
 | 
						|
     */
 | 
						|
    getGenerateUrl() {
 | 
						|
        if (this.settings.provider === EDGE_TTS_PROVIDER.extras) {
 | 
						|
            const url = new URL(getApiUrl());
 | 
						|
            url.pathname = '/api/edge-tts/generate';
 | 
						|
            return url.toString();
 | 
						|
        }
 | 
						|
 | 
						|
        if (this.settings.provider === EDGE_TTS_PROVIDER.plugin) {
 | 
						|
            return '/api/plugins/edge-tts/generate';
 | 
						|
        }
 | 
						|
 | 
						|
        throw new Error('Invalid TTS Provider');
 | 
						|
    }
 | 
						|
 | 
						|
    /**
 | 
						|
     * Get the URL for the TTS voices endpoint.
 | 
						|
     * @returns {string} URL object or string
 | 
						|
     */
 | 
						|
    getVoicesUrl() {
 | 
						|
        if (this.settings.provider === EDGE_TTS_PROVIDER.extras) {
 | 
						|
            const url = new URL(getApiUrl());
 | 
						|
            url.pathname = '/api/edge-tts/list';
 | 
						|
            return url.toString();
 | 
						|
        }
 | 
						|
 | 
						|
        if (this.settings.provider === EDGE_TTS_PROVIDER.plugin) {
 | 
						|
            return '/api/plugins/edge-tts/list';
 | 
						|
        }
 | 
						|
 | 
						|
        throw new Error('Invalid TTS Provider');
 | 
						|
    }
 | 
						|
 | 
						|
    async throwIfModuleMissing() {
 | 
						|
        if (this.settings.provider === EDGE_TTS_PROVIDER.extras && !modules.includes('edge-tts')) {
 | 
						|
            const message = 'Edge TTS module not loaded. Add edge-tts to enable-modules and restart the Extras API.';
 | 
						|
            // toastr.error(message)
 | 
						|
            throw new Error(message);
 | 
						|
        }
 | 
						|
 | 
						|
        if (this.settings.provider === EDGE_TTS_PROVIDER.plugin && !this.isPluginAvailable()) {
 | 
						|
            const message = 'Edge TTS Server plugin not loaded. Install it from https://github.com/SillyTavern/SillyTavern-EdgeTTS-Plugin and restart the SillyTavern server.';
 | 
						|
            // toastr.error(message)
 | 
						|
            throw new Error(message);
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    async isPluginAvailable() {
 | 
						|
        try {
 | 
						|
            const result = await fetch('/api/plugins/edge-tts/probe', {
 | 
						|
                method: 'POST',
 | 
						|
                headers: getRequestHeaders(),
 | 
						|
            });
 | 
						|
            return result.ok;
 | 
						|
        } catch (e) {
 | 
						|
            return false;
 | 
						|
        }
 | 
						|
    }
 | 
						|
}
 | 
						|
 |