Spaces:
Paused
Paused
| import { getRequestHeaders } from '../../../script.js'; | |
| import { getApiUrl } from '../../extensions.js'; | |
| import { doExtrasFetch, modules } from '../../extensions.js'; | |
| import { getPreviewString } from './index.js'; | |
| import { saveTtsProviderSettings } from './index.js'; | |
| export { EdgeTtsProvider }; | |
| const EDGE_TTS_PROVIDER = { | |
| extras: 'extras', | |
| plugin: 'plugin', | |
| }; | |
| class EdgeTtsProvider { | |
| //########// | |
| // Config // | |
| //########// | |
| settings; | |
| voices = []; | |
| separator = ' . '; | |
| audioElement = document.createElement('audio'); | |
| defaultSettings = { | |
| voiceMap: {}, | |
| rate: 0, | |
| provider: EDGE_TTS_PROVIDER.extras, | |
| }; | |
| get settingsHtml() { | |
| let html = `Microsoft Edge TTS<br> | |
| <label for="edge_tts_provider">Provider</label> | |
| <select id="edge_tts_provider"> | |
| <option value="${EDGE_TTS_PROVIDER.extras}">Extras</option> | |
| <option value="${EDGE_TTS_PROVIDER.plugin}">Plugin</option> | |
| </select> | |
| <label for="edge_tts_rate">Rate: <span id="edge_tts_rate_output"></span></label> | |
| <input id="edge_tts_rate" type="range" value="${this.defaultSettings.rate}" min="-100" max="100" step="1" /> | |
| `; | |
| return html; | |
| } | |
| onSettingsChange() { | |
| this.settings.rate = Number($('#edge_tts_rate').val()); | |
| $('#edge_tts_rate_output').text(this.settings.rate); | |
| this.settings.provider = String($('#edge_tts_provider').val()); | |
| saveTtsProviderSettings(); | |
| } | |
| async loadSettings(settings) { | |
| // Pupulate Provider UI given input settings | |
| if (Object.keys(settings).length == 0) { | |
| console.info('Using default TTS Provider settings'); | |
| } | |
| // Only accept keys defined in defaultSettings | |
| this.settings = this.defaultSettings; | |
| for (const key in settings) { | |
| if (key in this.settings) { | |
| this.settings[key] = settings[key]; | |
| } else { | |
| throw `Invalid setting passed to TTS Provider: ${key}`; | |
| } | |
| } | |
| $('#edge_tts_rate').val(this.settings.rate || 0); | |
| $('#edge_tts_rate_output').text(this.settings.rate || 0); | |
| $('#edge_tts_rate').on('input', () => { this.onSettingsChange(); }); | |
| $('#edge_tts_provider').val(this.settings.provider || EDGE_TTS_PROVIDER.extras); | |
| $('#edge_tts_provider').on('change', () => { this.onSettingsChange(); }); | |
| await this.checkReady(); | |
| console.debug('EdgeTTS: Settings loaded'); | |
| } | |
| /** | |
| * Perform a simple readiness check by trying to fetch voiceIds | |
| */ | |
| async checkReady() { | |
| await this.throwIfModuleMissing(); | |
| await this.fetchTtsVoiceObjects(); | |
| } | |
| async onRefreshClick() { | |
| return; | |
| } | |
| //#################// | |
| // TTS Interfaces // | |
| //#################// | |
| /** | |
| * Get a voice from the TTS provider. | |
| * @param {string} voiceName Voice name to get | |
| * @returns {Promise<Object>} Voice object | |
| */ | |
| async getVoice(voiceName) { | |
| if (this.voices.length == 0) { | |
| this.voices = await this.fetchTtsVoiceObjects(); | |
| } | |
| const match = this.voices.filter( | |
| voice => voice.name == voiceName, | |
| )[0]; | |
| if (!match) { | |
| throw `TTS Voice name ${voiceName} not found`; | |
| } | |
| return match; | |
| } | |
| /** | |
| * Generate TTS for a given text. | |
| * @param {string} text Text to generate TTS for | |
| * @param {string} voiceId Voice ID to use | |
| * @returns {Promise<Response>} Fetch response | |
| */ | |
| async generateTts(text, voiceId) { | |
| const response = await this.fetchTtsGeneration(text, voiceId); | |
| return response; | |
| } | |
| //###########// | |
| // API CALLS // | |
| //###########// | |
| async fetchTtsVoiceObjects() { | |
| await this.throwIfModuleMissing(); | |
| const url = this.getVoicesUrl(); | |
| const response = await this.doFetch(url); | |
| if (!response.ok) { | |
| throw new Error(`HTTP ${response.status}: ${await response.text()}`); | |
| } | |
| let responseJson = await response.json(); | |
| responseJson = responseJson | |
| .sort((a, b) => a.Locale.localeCompare(b.Locale) || a.ShortName.localeCompare(b.ShortName)) | |
| .map(x => ({ name: x.ShortName, voice_id: x.ShortName, preview_url: false, lang: x.Locale })); | |
| return responseJson; | |
| } | |
| /** | |
| * Preview TTS for a given voice ID. | |
| * @param {string} id Voice ID | |
| */ | |
| async previewTtsVoice(id) { | |
| this.audioElement.pause(); | |
| this.audioElement.currentTime = 0; | |
| const voice = await this.getVoice(id); | |
| const text = getPreviewString(voice.lang); | |
| const response = await this.fetchTtsGeneration(text, id); | |
| if (!response.ok) { | |
| throw new Error(`HTTP ${response.status}: ${await response.text()}`); | |
| } | |
| const audio = await response.blob(); | |
| const url = URL.createObjectURL(audio); | |
| this.audioElement.src = url; | |
| this.audioElement.play(); | |
| this.audioElement.onended = () => URL.revokeObjectURL(url); | |
| } | |
| /** | |
| * Fetch TTS generation from the API. | |
| * @param {string} inputText Text to generate TTS for | |
| * @param {string} voiceId Voice ID to use | |
| * @returns {Promise<Response>} Fetch response | |
| */ | |
| async fetchTtsGeneration(inputText, voiceId) { | |
| await this.throwIfModuleMissing(); | |
| console.info(`Generating new TTS for voice_id ${voiceId}`); | |
| const url = this.getGenerateUrl(); | |
| const response = await this.doFetch(url, | |
| { | |
| method: 'POST', | |
| headers: getRequestHeaders(), | |
| body: JSON.stringify({ | |
| 'text': inputText, | |
| 'voice': voiceId, | |
| 'rate': Number(this.settings.rate), | |
| }), | |
| }, | |
| ); | |
| if (!response.ok) { | |
| toastr.error(response.statusText, 'TTS Generation Failed'); | |
| throw new Error(`HTTP ${response.status}: ${await response.text()}`); | |
| } | |
| return response; | |
| } | |
| /** | |
| * Perform a fetch request using the configured provider. | |
| * @param {string} url URL string | |
| * @param {any} options Request options | |
| * @returns {Promise<Response>} Fetch response | |
| */ | |
| doFetch(url, options) { | |
| if (this.settings.provider === EDGE_TTS_PROVIDER.extras) { | |
| return doExtrasFetch(url, options); | |
| } | |
| if (this.settings.provider === EDGE_TTS_PROVIDER.plugin) { | |
| return fetch(url, options); | |
| } | |
| throw new Error('Invalid TTS Provider'); | |
| } | |
| /** | |
| * Get the URL for the TTS generation endpoint. | |
| * @returns {string} URL string | |
| */ | |
| getGenerateUrl() { | |
| if (this.settings.provider === EDGE_TTS_PROVIDER.extras) { | |
| const url = new URL(getApiUrl()); | |
| url.pathname = '/api/edge-tts/generate'; | |
| return url.toString(); | |
| } | |
| if (this.settings.provider === EDGE_TTS_PROVIDER.plugin) { | |
| return '/api/plugins/edge-tts/generate'; | |
| } | |
| throw new Error('Invalid TTS Provider'); | |
| } | |
| /** | |
| * Get the URL for the TTS voices endpoint. | |
| * @returns {string} URL object or string | |
| */ | |
| getVoicesUrl() { | |
| if (this.settings.provider === EDGE_TTS_PROVIDER.extras) { | |
| const url = new URL(getApiUrl()); | |
| url.pathname = '/api/edge-tts/list'; | |
| return url.toString(); | |
| } | |
| if (this.settings.provider === EDGE_TTS_PROVIDER.plugin) { | |
| return '/api/plugins/edge-tts/list'; | |
| } | |
| throw new Error('Invalid TTS Provider'); | |
| } | |
| async throwIfModuleMissing() { | |
| if (this.settings.provider === EDGE_TTS_PROVIDER.extras && !modules.includes('edge-tts')) { | |
| const message = 'Edge TTS module not loaded. Add edge-tts to enable-modules and restart the Extras API.'; | |
| // toastr.error(message) | |
| throw new Error(message); | |
| } | |
| if (this.settings.provider === EDGE_TTS_PROVIDER.plugin && !this.isPluginAvailable()) { | |
| const message = 'Edge TTS Server plugin not loaded. Install it from https://github.com/SillyTavern/SillyTavern-EdgeTTS-Plugin and restart the SillyTavern server.'; | |
| // toastr.error(message) | |
| throw new Error(message); | |
| } | |
| } | |
| async isPluginAvailable() { | |
| try { | |
| const result = await fetch('/api/plugins/edge-tts/probe', { | |
| method: 'POST', | |
| headers: getRequestHeaders(), | |
| }); | |
| return result.ok; | |
| } catch (e) { | |
| return false; | |
| } | |
| } | |
| } | |