import { saveTtsProviderSettings } from './index.js'; import { event_types, eventSource, getRequestHeaders } from '/script.js'; import { SECRET_KEYS, secret_state, writeSecret } from '/scripts/secrets.js'; import { getBase64Async } from '/scripts/utils.js'; export { ElevenLabsTtsProvider }; class ElevenLabsTtsProvider { settings; voices = []; separator = ' ... ... ... '; defaultSettings = { stability: 0.75, similarity_boost: 0.75, style_exaggeration: 0.00, speaker_boost: true, speed: 1.0, model: 'eleven_turbo_v2_5', voiceMap: {}, }; get settingsHtml() { let html = `
`; return html; } constructor() { this.handler = async function (/** @type {string} */ key) { if (key !== SECRET_KEYS.ELEVENLABS) return; $('#elevenlabs_tts_key').toggleClass('success', !!secret_state[SECRET_KEYS.ELEVENLABS]); await this.fetchTtsVoiceObjects(); }.bind(this); } dispose() { [event_types.SECRET_WRITTEN, event_types.SECRET_DELETED, event_types.SECRET_ROTATED].forEach(event => { eventSource.removeListener(event, this.handler); }); } shouldInvolveExtendedSettings() { // Models that support extended settings (style_exaggeration, speaker_boost) const modelsWithExtendedSettings = [ 'eleven_v3', 'eleven_ttv_v3', 'eleven_multilingual_v2', 'eleven_multilingual_ttv_v2', ]; return modelsWithExtendedSettings.includes(this.settings.model); } onSettingsChange() { // Update dynamically this.settings.stability = $('#elevenlabs_tts_stability').val(); this.settings.similarity_boost = $('#elevenlabs_tts_similarity_boost').val(); this.settings.style_exaggeration = $('#elevenlabs_tts_style_exaggeration').val(); this.settings.speaker_boost = $('#elevenlabs_tts_speaker_boost').is(':checked'); this.settings.speed = $('#elevenlabs_tts_speed').val(); this.settings.model = $('#elevenlabs_tts_model').find(':selected').val(); $('#elevenlabs_tts_stability_output').text(Math.round(this.settings.stability * 100) + '%'); $('#elevenlabs_tts_similarity_boost_output').text(Math.round(this.settings.similarity_boost * 100) + '%'); $('#elevenlabs_tts_style_exaggeration_output').text(Math.round(this.settings.style_exaggeration * 100) + '%'); $('#elevenlabs_tts_speed_output').text(this.settings.speed + 'x'); $('#elevenlabs_tts_v2_options').toggle(this.shouldInvolveExtendedSettings()); saveTtsProviderSettings(); } async loadSettings(settings) { // Pupulate Provider UI given input settings if (Object.keys(settings).length == 0) { console.info('Using default TTS Provider settings'); } // Only accept keys defined in defaultSettings this.settings = this.defaultSettings; // Migrate old settings if (settings['multilingual'] !== undefined) { settings.model = settings.multilingual ? 'eleven_multilingual_v1' : 'eleven_monolingual_v1'; delete settings['multilingual']; } if (Object.hasOwn(settings, 'apiKey')) { if (settings.apiKey && !secret_state[SECRET_KEYS.ELEVENLABS]){ await writeSecret(SECRET_KEYS.ELEVENLABS, settings.apiKey); } delete settings['apiKey']; } $('#elevenlabs_tts_key').toggleClass('success', !!secret_state[SECRET_KEYS.ELEVENLABS]); [event_types.SECRET_WRITTEN, event_types.SECRET_DELETED, event_types.SECRET_ROTATED].forEach(event => { eventSource.on(event, this.handler); }); for (const key in settings) { if (key in this.settings) { this.settings[key] = settings[key]; } else { throw `Invalid setting passed to TTS Provider: ${key}`; } } $('#elevenlabs_tts_stability').val(this.settings.stability); $('#elevenlabs_tts_similarity_boost').val(this.settings.similarity_boost); $('#elevenlabs_tts_style_exaggeration').val(this.settings.style_exaggeration); $('#elevenlabs_tts_speaker_boost').prop('checked', this.settings.speaker_boost); $('#elevenlabs_tts_speed').val(this.settings.speed); $('#elevenlabs_tts_model').val(this.settings.model); $('#elevenlabs_tts_similarity_boost').on('input', this.onSettingsChange.bind(this)); $('#elevenlabs_tts_stability').on('input', this.onSettingsChange.bind(this)); $('#elevenlabs_tts_style_exaggeration').on('input', this.onSettingsChange.bind(this)); $('#elevenlabs_tts_speaker_boost').on('change', this.onSettingsChange.bind(this)); $('#elevenlabs_tts_speed').on('input', this.onSettingsChange.bind(this)); $('#elevenlabs_tts_model').on('change', this.onSettingsChange.bind(this)); $('#elevenlabs_tts_stability_output').text(Math.round(this.settings.stability * 100) + '%'); $('#elevenlabs_tts_similarity_boost_output').text(Math.round(this.settings.similarity_boost * 100) + '%'); $('#elevenlabs_tts_style_exaggeration_output').text(Math.round(this.settings.style_exaggeration * 100) + '%'); $('#elevenlabs_tts_speed_output').text(this.settings.speed + 'x'); $('#elevenlabs_tts_v2_options').toggle(this.shouldInvolveExtendedSettings()); try { await this.checkReady(); console.debug('ElevenLabs: Settings loaded'); } catch { console.debug('ElevenLabs: Settings loaded, but not ready'); } this.setupVoiceCloningMenu(); } // Perform a simple readiness check by trying to fetch voiceIds async checkReady() { await this.fetchTtsVoiceObjects(); } async onRefreshClick() { await this.fetchTtsVoiceObjects(); } setupVoiceCloningMenu() { const audioFilesInput = /** @type {HTMLInputElement} */ (document.getElementById('elevenlabs_tts_audio_files')); const selectedFilesListElement = document.getElementById('elevenlabs_tts_selected_files_list'); const cloneVoiceButton = document.getElementById('elevenlabs_tts_clone_voice_button'); const uploadAudioFileButton = document.getElementById('upload_audio_file'); const voiceCloningNameInput = /** @type {HTMLInputElement} */ (document.getElementById('elevenlabs_tts_voice_cloning_name')); const voiceCloningDescriptionInput = /** @type {HTMLInputElement} */ (document.getElementById('elevenlabs_tts_voice_cloning_description')); const voiceCloningLabelsInput = /** @type {HTMLInputElement} */ (document.getElementById('elevenlabs_tts_voice_cloning_labels')); const updateCloneVoiceButtonVisibility = () => { cloneVoiceButton.style.display = audioFilesInput.files.length > 0 ? 'inline-block' : 'none'; }; const clearSelectedFiles = () => { audioFilesInput.value = ''; selectedFilesListElement.innerHTML = ''; updateCloneVoiceButtonVisibility(); }; uploadAudioFileButton.addEventListener('click', () => { audioFilesInput.click(); }); audioFilesInput.addEventListener('change', () => { selectedFilesListElement.innerHTML = ''; for (const file of audioFilesInput.files) { const listItem = document.createElement('div'); listItem.textContent = file.name; selectedFilesListElement.appendChild(listItem); } updateCloneVoiceButtonVisibility(); }); cloneVoiceButton.addEventListener('click', async () => { const voiceName = voiceCloningNameInput.value.trim(); const voiceDescription = voiceCloningDescriptionInput.value.trim(); const voiceLabels = voiceCloningLabelsInput.value.trim(); if (!voiceName) { toastr.error('Please provide a name for the cloned voice.'); return; } try { await this.addVoice(voiceName, voiceDescription, voiceLabels); toastr.success('Voice cloned successfully. Hit reload to see the new voice in the voice listing.'); clearSelectedFiles(); voiceCloningNameInput.value = ''; voiceCloningDescriptionInput.value = ''; voiceCloningLabelsInput.value = ''; } catch (error) { toastr.error(`Failed to clone voice: ${error.message}`); } }); updateCloneVoiceButtonVisibility(); } /** * Get voice object by name * @param {string} voiceName Voice name to look up * @returns {Promise