271 lines
8.5 KiB
JavaScript
271 lines
8.5 KiB
JavaScript
import { getRequestHeaders } from '../../../script.js';
|
|
import { getApiUrl } from '../../extensions.js';
|
|
import { doExtrasFetch, modules } from '../../extensions.js';
|
|
import { getPreviewString } from './index.js';
|
|
import { saveTtsProviderSettings } from './index.js';
|
|
|
|
export { EdgeTtsProvider };
|
|
|
|
const EDGE_TTS_PROVIDER = {
|
|
extras: 'extras',
|
|
plugin: 'plugin',
|
|
};
|
|
|
|
class EdgeTtsProvider {
|
|
//########//
|
|
// Config //
|
|
//########//
|
|
|
|
settings;
|
|
voices = [];
|
|
separator = ' . ';
|
|
audioElement = document.createElement('audio');
|
|
|
|
defaultSettings = {
|
|
voiceMap: {},
|
|
rate: 0,
|
|
provider: EDGE_TTS_PROVIDER.extras,
|
|
};
|
|
|
|
get settingsHtml() {
|
|
let html = `Microsoft Edge TTS<br>
|
|
<label for="edge_tts_provider">Provider</label>
|
|
<select id="edge_tts_provider">
|
|
<option value="${EDGE_TTS_PROVIDER.extras}">Extras</option>
|
|
<option value="${EDGE_TTS_PROVIDER.plugin}">Plugin</option>
|
|
</select>
|
|
<label for="edge_tts_rate">Rate: <span id="edge_tts_rate_output"></span></label>
|
|
<input id="edge_tts_rate" type="range" value="${this.defaultSettings.rate}" min="-100" max="100" step="1" />
|
|
`;
|
|
return html;
|
|
}
|
|
|
|
onSettingsChange() {
|
|
this.settings.rate = Number($('#edge_tts_rate').val());
|
|
$('#edge_tts_rate_output').text(this.settings.rate);
|
|
this.settings.provider = String($('#edge_tts_provider').val());
|
|
saveTtsProviderSettings();
|
|
}
|
|
|
|
async loadSettings(settings) {
|
|
// Pupulate Provider UI given input settings
|
|
if (Object.keys(settings).length == 0) {
|
|
console.info('Using default TTS Provider settings');
|
|
}
|
|
|
|
// Only accept keys defined in defaultSettings
|
|
this.settings = this.defaultSettings;
|
|
|
|
for (const key in settings) {
|
|
if (key in this.settings) {
|
|
this.settings[key] = settings[key];
|
|
} else {
|
|
throw `Invalid setting passed to TTS Provider: ${key}`;
|
|
}
|
|
}
|
|
|
|
$('#edge_tts_rate').val(this.settings.rate || 0);
|
|
$('#edge_tts_rate_output').text(this.settings.rate || 0);
|
|
$('#edge_tts_rate').on('input', () => { this.onSettingsChange(); });
|
|
$('#edge_tts_provider').val(this.settings.provider || EDGE_TTS_PROVIDER.extras);
|
|
$('#edge_tts_provider').on('change', () => { this.onSettingsChange(); });
|
|
await this.checkReady();
|
|
|
|
console.debug('EdgeTTS: Settings loaded');
|
|
}
|
|
|
|
/**
|
|
* Perform a simple readiness check by trying to fetch voiceIds
|
|
*/
|
|
async checkReady() {
|
|
await this.throwIfModuleMissing();
|
|
await this.fetchTtsVoiceObjects();
|
|
}
|
|
|
|
async onRefreshClick() {
|
|
return;
|
|
}
|
|
|
|
//#################//
|
|
// TTS Interfaces //
|
|
//#################//
|
|
|
|
/**
|
|
* Get a voice from the TTS provider.
|
|
* @param {string} voiceName Voice name to get
|
|
* @returns {Promise<Object>} Voice object
|
|
*/
|
|
async getVoice(voiceName) {
|
|
if (this.voices.length == 0) {
|
|
this.voices = await this.fetchTtsVoiceObjects();
|
|
}
|
|
const match = this.voices.filter(
|
|
voice => voice.name == voiceName,
|
|
)[0];
|
|
if (!match) {
|
|
throw `TTS Voice name ${voiceName} not found`;
|
|
}
|
|
return match;
|
|
}
|
|
|
|
/**
|
|
* Generate TTS for a given text.
|
|
* @param {string} text Text to generate TTS for
|
|
* @param {string} voiceId Voice ID to use
|
|
* @returns {Promise<Response>} Fetch response
|
|
*/
|
|
async generateTts(text, voiceId) {
|
|
const response = await this.fetchTtsGeneration(text, voiceId);
|
|
return response;
|
|
}
|
|
|
|
//###########//
|
|
// API CALLS //
|
|
//###########//
|
|
async fetchTtsVoiceObjects() {
|
|
await this.throwIfModuleMissing();
|
|
|
|
const url = this.getVoicesUrl();
|
|
const response = await this.doFetch(url);
|
|
if (!response.ok) {
|
|
throw new Error(`HTTP ${response.status}: ${await response.text()}`);
|
|
}
|
|
let responseJson = await response.json();
|
|
responseJson = responseJson
|
|
.sort((a, b) => a.Locale.localeCompare(b.Locale) || a.ShortName.localeCompare(b.ShortName))
|
|
.map(x => ({ name: x.ShortName, voice_id: x.ShortName, preview_url: false, lang: x.Locale }));
|
|
return responseJson;
|
|
}
|
|
|
|
/**
|
|
* Preview TTS for a given voice ID.
|
|
* @param {string} id Voice ID
|
|
*/
|
|
async previewTtsVoice(id) {
|
|
this.audioElement.pause();
|
|
this.audioElement.currentTime = 0;
|
|
const voice = await this.getVoice(id);
|
|
const text = getPreviewString(voice.lang);
|
|
const response = await this.fetchTtsGeneration(text, id);
|
|
if (!response.ok) {
|
|
throw new Error(`HTTP ${response.status}: ${await response.text()}`);
|
|
}
|
|
|
|
const audio = await response.blob();
|
|
const url = URL.createObjectURL(audio);
|
|
this.audioElement.src = url;
|
|
this.audioElement.play();
|
|
this.audioElement.onended = () => URL.revokeObjectURL(url);
|
|
}
|
|
|
|
/**
|
|
* Fetch TTS generation from the API.
|
|
* @param {string} inputText Text to generate TTS for
|
|
* @param {string} voiceId Voice ID to use
|
|
* @returns {Promise<Response>} Fetch response
|
|
*/
|
|
async fetchTtsGeneration(inputText, voiceId) {
|
|
await this.throwIfModuleMissing();
|
|
|
|
console.info(`Generating new TTS for voice_id ${voiceId}`);
|
|
const url = this.getGenerateUrl();
|
|
const response = await this.doFetch(url,
|
|
{
|
|
method: 'POST',
|
|
headers: getRequestHeaders(),
|
|
body: JSON.stringify({
|
|
'text': inputText,
|
|
'voice': voiceId,
|
|
'rate': Number(this.settings.rate),
|
|
}),
|
|
},
|
|
);
|
|
if (!response.ok) {
|
|
toastr.error(response.statusText, 'TTS Generation Failed');
|
|
throw new Error(`HTTP ${response.status}: ${await response.text()}`);
|
|
}
|
|
return response;
|
|
}
|
|
|
|
/**
|
|
* Perform a fetch request using the configured provider.
|
|
* @param {string} url URL string
|
|
* @param {any} options Request options
|
|
* @returns {Promise<Response>} Fetch response
|
|
*/
|
|
doFetch(url, options) {
|
|
if (this.settings.provider === EDGE_TTS_PROVIDER.extras) {
|
|
return doExtrasFetch(url, options);
|
|
}
|
|
|
|
if (this.settings.provider === EDGE_TTS_PROVIDER.plugin) {
|
|
return fetch(url, options);
|
|
}
|
|
|
|
throw new Error('Invalid TTS Provider');
|
|
}
|
|
|
|
/**
|
|
* Get the URL for the TTS generation endpoint.
|
|
* @returns {string} URL string
|
|
*/
|
|
getGenerateUrl() {
|
|
if (this.settings.provider === EDGE_TTS_PROVIDER.extras) {
|
|
const url = new URL(getApiUrl());
|
|
url.pathname = '/api/edge-tts/generate';
|
|
return url.toString();
|
|
}
|
|
|
|
if (this.settings.provider === EDGE_TTS_PROVIDER.plugin) {
|
|
return '/api/plugins/edge-tts/generate';
|
|
}
|
|
|
|
throw new Error('Invalid TTS Provider');
|
|
}
|
|
|
|
/**
|
|
* Get the URL for the TTS voices endpoint.
|
|
* @returns {string} URL object or string
|
|
*/
|
|
getVoicesUrl() {
|
|
if (this.settings.provider === EDGE_TTS_PROVIDER.extras) {
|
|
const url = new URL(getApiUrl());
|
|
url.pathname = '/api/edge-tts/list';
|
|
return url.toString();
|
|
}
|
|
|
|
if (this.settings.provider === EDGE_TTS_PROVIDER.plugin) {
|
|
return '/api/plugins/edge-tts/list';
|
|
}
|
|
|
|
throw new Error('Invalid TTS Provider');
|
|
}
|
|
|
|
async throwIfModuleMissing() {
|
|
if (this.settings.provider === EDGE_TTS_PROVIDER.extras && !modules.includes('edge-tts')) {
|
|
const message = 'Edge TTS module not loaded. Add edge-tts to enable-modules and restart the Extras API.';
|
|
// toastr.error(message)
|
|
throw new Error(message);
|
|
}
|
|
|
|
if (this.settings.provider === EDGE_TTS_PROVIDER.plugin && !this.isPluginAvailable()) {
|
|
const message = 'Edge TTS Server plugin not loaded. Install it from https://github.com/SillyTavern/SillyTavern-EdgeTTS-Plugin and restart the SillyTavern server.';
|
|
// toastr.error(message)
|
|
throw new Error(message);
|
|
}
|
|
}
|
|
|
|
async isPluginAvailable() {
|
|
try {
|
|
const result = await fetch('/api/plugins/edge-tts/probe', {
|
|
method: 'POST',
|
|
headers: getRequestHeaders(),
|
|
});
|
|
return result.ok;
|
|
} catch (e) {
|
|
return false;
|
|
}
|
|
}
|
|
}
|
|
|