mirror of
				https://github.com/SillyTavern/SillyTavern.git
				synced 2025-06-05 21:59:27 +02:00 
			
		
		
		
	
		
			
				
	
	
		
			152 lines
		
	
	
		
			4.5 KiB
		
	
	
	
		
			JavaScript
		
	
	
	
	
	
			
		
		
	
	
			152 lines
		
	
	
		
			4.5 KiB
		
	
	
	
		
			JavaScript
		
	
	
	
	
	
| import { getRequestHeaders } from "../../../script.js"
 | |
| import { getApiUrl } from "../../extensions.js"
 | |
| import { doExtrasFetch, modules } from "../../extensions.js"
 | |
| import { getPreviewString } from "./index.js"
 | |
| 
 | |
| export { EdgeTtsProvider }
 | |
| 
 | |
/**
 * TTS provider that talks to the `edge-tts` endpoints of the Extras API.
 *
 * Voices are listed through `/api/edge-tts/list` and audio is generated through
 * `/api/edge-tts/generate`. Both calls require the `edge-tts` module to be
 * reported as loaded (checked via `throwIfModuleMissing()`).
 */
class EdgeTtsProvider {
    //########//
    // Config //
    //########//

    /** Active settings object; assigned by `loadSettings()`. */
    settings;

    /** Voice descriptors cached by `getVoice()` after the first successful fetch. */
    voices = [];

    // Not read inside this class; presumably consumed by the TTS extension
    // when joining text fragments - confirm against the caller.
    separator = ' . ';

    /** Audio element used by `previewTtsVoice()` to play voice samples. */
    audioElement = document.createElement('audio');

    /** Object URL of the most recent preview blob, kept so it can be revoked. */
    #previewObjectUrl = null;

    /** Baseline settings; also the whitelist of keys `loadSettings()` accepts. */
    defaultSettings = {
        voiceMap: {},
        rate: 0,
    };

    /**
     * Markup for the provider-specific settings UI (a rate slider from -100 to 100).
     *
     * @returns {string} HTML string.
     */
    get settingsHtml() {
        const html = `Microsoft Edge TTS Provider<br>
        <label for="edge_tts_rate">Rate: <span id="edge_tts_rate_output"></span></label>
        <input id="edge_tts_rate" type="range" value="${this.defaultSettings.rate}" min="-100" max="100" step="1" />`;
        return html;
    }

    /**
     * Reads the rate slider into `settings.rate` and mirrors it in the output label.
     */
    onSettingsChange() {
        this.settings.rate = Number($('#edge_tts_rate').val());
        $('#edge_tts_rate_output').text(this.settings.rate);
    }

    /**
     * Populates the provider settings and the settings UI from stored settings.
     *
     * @param {object} [settings] Stored settings; only keys present in
     *     `defaultSettings` are accepted. `null`/`undefined` is treated as empty.
     * @throws {Error} If `settings` contains a key that `defaultSettings` does not define.
     */
    loadSettings(settings) {
        const incoming = settings ?? {};

        if (Object.keys(incoming).length === 0) {
            console.info("Using default TTS Provider settings");
        }

        // Start from a copy of the defaults. Assigning `defaultSettings` itself
        // would make every later write to `this.settings` (including voiceMap
        // edits) silently rewrite the defaults.
        this.settings = {
            ...this.defaultSettings,
            voiceMap: { ...this.defaultSettings.voiceMap },
        };

        // Only accept keys defined in defaultSettings (own keys, not inherited ones)
        for (const [key, value] of Object.entries(incoming)) {
            if (!Object.hasOwn(this.defaultSettings, key)) {
                throw new Error(`Invalid setting passed to TTS Provider: ${key}`);
            }
            this.settings[key] = value;
        }

        $('#edge_tts_rate').val(this.settings.rate || 0);
        $('#edge_tts_rate_output').text(this.settings.rate || 0);

        console.info("Settings loaded");
    }

    /**
     * Handler for the "apply" action; this provider has nothing to apply.
     */
    async onApplyClick() {
        return;
    }

    //#################//
    //  TTS Interfaces //
    //#################//

    /**
     * Looks up a voice descriptor by name, fetching the voice list on first use.
     *
     * @param {string} voiceName Name to match against each descriptor's `name`.
     * @returns {Promise<object>} The matching voice descriptor.
     * @throws {Error} If no voice with that name exists, or the list fetch fails.
     */
    async getVoice(voiceName) {
        if (this.voices.length === 0) {
            this.voices = await this.fetchTtsVoiceIds();
        }

        const match = this.voices.find((voice) => voice.name === voiceName);
        if (!match) {
            throw new Error(`TTS Voice name ${voiceName} not found`);
        }
        return match;
    }

    /**
     * Generates speech for the given text.
     *
     * @param {string} text Text to synthesize.
     * @param {string} voiceId Voice identifier sent as `voice` in the request.
     * @returns {Promise<Response>} The successful generation response.
     */
    async generateTts(text, voiceId) {
        const response = await this.fetchTtsGeneration(text, voiceId);
        return response;
    }

    //###########//
    // API CALLS //
    //###########//

    /**
     * Fetches the voice list and maps it to provider voice descriptors,
     * sorted by locale and then by short name.
     *
     * @returns {Promise<Array<{name: string, voice_id: string, preview_url: boolean, lang: string}>>}
     * @throws {Error} If the module is missing or the request is not OK.
     */
    async fetchTtsVoiceIds() {
        throwIfModuleMissing();

        const url = new URL(getApiUrl());
        url.pathname = `/api/edge-tts/list`;
        const response = await doExtrasFetch(url);
        if (!response.ok) {
            throw new Error(`HTTP ${response.status}: ${await response.text()}`);
        }

        const rawVoices = await response.json();
        return rawVoices
            .sort((a, b) => a.Locale.localeCompare(b.Locale) || a.ShortName.localeCompare(b.ShortName))
            .map(x => ({ name: x.ShortName, voice_id: x.ShortName, preview_url: false, lang: x.Locale }));
    }

    /**
     * Plays a short sample of the given voice through `audioElement`.
     *
     * @param {string} id Voice name/identifier (both are the voice's short name).
     * @returns {Promise<void>}
     * @throws {Error} If the voice is unknown or generation fails.
     */
    async previewTtsVoice(id) {
        this.audioElement.pause();
        this.audioElement.currentTime = 0;

        const voice = await this.getVoice(id);
        const text = getPreviewString(voice.lang);
        // fetchTtsGeneration() throws on a non-OK response, so no status check is needed here.
        const response = await this.fetchTtsGeneration(text, id);
        const audio = await response.blob();

        // Release the previous preview blob; otherwise every preview stays
        // alive until the page is unloaded.
        if (this.#previewObjectUrl !== null) {
            URL.revokeObjectURL(this.#previewObjectUrl);
        }
        this.#previewObjectUrl = URL.createObjectURL(audio);

        this.audioElement.src = this.#previewObjectUrl;
        this.audioElement.play();
    }

    /**
     * Requests speech generation from the API.
     *
     * @param {string} inputText Text to synthesize.
     * @param {string} voiceId Voice identifier sent as `voice`.
     * @returns {Promise<Response>} The successful response.
     * @throws {Error} If the module is missing or the request is not OK
     *     (an error toast is shown first in the latter case).
     */
    async fetchTtsGeneration(inputText, voiceId) {
        throwIfModuleMissing();

        console.info(`Generating new TTS for voice_id ${voiceId}`);
        const url = new URL(getApiUrl());
        url.pathname = `/api/edge-tts/generate`;
        const response = await doExtrasFetch(url,
            {
                method: 'POST',
                headers: getRequestHeaders(),
                body: JSON.stringify({
                    "text": inputText,
                    "voice": voiceId,
                    "rate": Number(this.settings.rate),
                }),
            },
        );
        if (!response.ok) {
            toastr.error(response.statusText, 'TTS Generation Failed');
            throw new Error(`HTTP ${response.status}: ${await response.text()}`);
        }
        return response;
    }
}
 | |
/**
 * Guard used before every Edge TTS API call: does nothing when the
 * `edge-tts` entry is present in `modules`, otherwise shows an error toast
 * and aborts the caller.
 *
 * @throws {Error} If `modules` does not include `edge-tts`.
 */
function throwIfModuleMissing() {
    const isEdgeTtsLoaded = modules.includes('edge-tts');
    if (isEdgeTtsLoaded) {
        return;
    }

    toastr.error(`Edge TTS module not loaded. Add edge-tts to enable-modules and restart the Extras API.`);
    throw new Error(`Edge TTS module not loaded.`);
}
 | |
| 
 |