2024-06-08 03:18:48 +00:00
< script lang = "ts" >
import { toast } from 'svelte-sonner';
2024-08-02 17:24:47 +00:00
import { createEventDispatcher , onMount , getContext } from 'svelte';
const dispatch = createEventDispatcher();
2024-06-08 03:18:48 +00:00
import { getBackendConfig } from '$lib/apis';
2024-08-02 17:24:47 +00:00
import {
getAudioConfig,
updateAudioConfig,
getModels as _getModels,
getVoices as _getVoices
} from '$lib/apis/audio';
2024-08-25 00:35:42 +00:00
import { config } from '$lib/stores';
2024-08-02 17:24:47 +00:00
2024-06-25 12:15:29 +00:00
import SensitiveInput from '$lib/components/common/SensitiveInput.svelte';
2024-06-08 03:18:48 +00:00
2024-08-25 00:35:42 +00:00
import { TTS_RESPONSE_SPLIT } from '$lib/types';
2024-06-08 03:18:48 +00:00
2024-08-25 00:35:42 +00:00
import type { Writable } from 'svelte/store';
import type { i18n as i18nType } from 'i18next';
2024-06-08 03:18:48 +00:00
2024-08-25 00:35:42 +00:00
const i18n = getContext< Writable < i18nType > >('i18n');
export let saveHandler: () => void;
2024-06-08 03:18:48 +00:00
2024-08-25 00:35:42 +00:00
// Audio
// Component-local copies of the audio settings. They are filled from
// `getAudioConfig` in `onMount` and sent back by `updateConfigHandler`.
2024-06-08 03:18:48 +00:00
// Text-to-speech settings (sent under the `tts` key).
let TTS_OPENAI_API_BASE_URL = '';
let TTS_OPENAI_API_KEY = '';
2024-07-19 08:35:05 +00:00
// Bound to the API key input shown when the engine is 'elevenlabs'.
let TTS_API_KEY = '';
2024-06-08 03:18:48 +00:00
// Engine values offered by the template: '' (Web API), 'openai', 'elevenlabs'.
let TTS_ENGINE = '';
let TTS_MODEL = '';
let TTS_VOICE = '';
2024-08-25 00:35:42 +00:00
// How message text is split for TTS requests; defaults to punctuation.
let TTS_SPLIT_ON: TTS_RESPONSE_SPLIT = TTS_RESPONSE_SPLIT.PUNCTUATION;
2024-06-08 03:18:48 +00:00
// Speech-to-text settings (sent under the `stt` key).
// Engine values offered by the template: '' (Whisper (Local)), 'openai', 'web'.
let STT_OPENAI_API_BASE_URL = '';
let STT_OPENAI_API_KEY = '';
let STT_ENGINE = '';
let STT_MODEL = '';
2024-08-25 00:35:42 +00:00
// Voice list for the active TTS engine: browser voices from
// `speechSynthesis.getVoices()` when the engine is '', otherwise the
// `voices` array returned by `_getVoices`.
// NOTE(review): the template reads `.id`/`.name` on backend voices, which the
// declared `SpeechSynthesisVoice` type does not describe — confirm the type.
// eslint-disable-next-line no-undef
let voices: SpeechSynthesisVoice[] = [];
// Model list for the active TTS engine, as returned by `_getModels`.
let models: Awaited< ReturnType < typeof _getModels > >['models'] = [];
2024-06-08 03:18:48 +00:00
2024-08-02 17:24:47 +00:00
/**
 * Refresh `models` for the currently selected TTS engine.
 *
 * The browser engine (`TTS_ENGINE === ''`) has no model list, so the list is
 * simply cleared. For every other engine the list is requested through
 * `_getModels`; a failed request is surfaced as a toast and leaves `models`
 * as it was.
 */
const getModels = async () => {
	// Browser engine: nothing to fetch.
	if (TTS_ENGINE === '') {
		models = [];
		return;
	}

	// The catch handler returns nothing, so a failed request yields `undefined`.
	const payload = await _getModels(localStorage.token).catch((reason) => {
		toast.error(reason);
	});

	if (!payload) {
		return;
	}

	console.log(payload);
	models = payload.models;
};
2024-08-02 17:24:47 +00:00
/**
 * Refresh `voices` for the currently selected TTS engine.
 *
 * - Browser engine (`TTS_ENGINE === ''`): browsers may populate the voice list
 *   asynchronously, so `speechSynthesis.getVoices()` is polled every 100 ms
 *   until it returns a non-empty list. The function returns as soon as the
 *   poll is scheduled; it does not wait for the voices to arrive.
 * - Any other engine: the list is requested through `_getVoices`. A failed
 *   request is surfaced as a toast and leaves `voices` as it was.
 */
const getVoices = async () => {
	if (TTS_ENGINE === '') {
		// No Web Speech API in this environment: polling would only throw on
		// every tick, so expose an empty list instead.
		if (typeof speechSynthesis === 'undefined') {
			voices = [];
			return;
		}

		// Give up after ~5 s so a browser that never reports voices does not
		// leave a timer running for the lifetime of the page.
		const MAX_ATTEMPTS = 50;
		let attempts = 0;

		const getVoicesLoop = setInterval(() => {
			// The engine was switched while we were still polling: stop, so the
			// browser voices do not overwrite the list fetched for the new engine.
			if (TTS_ENGINE !== '') {
				clearInterval(getVoicesLoop);
				return;
			}

			voices = speechSynthesis.getVoices();
			attempts += 1;

			if (voices.length > 0 || attempts >= MAX_ATTEMPTS) {
				clearInterval(getVoicesLoop);
			}
		}, 100);
	} else {
		// The catch handler returns nothing, so a failed request yields `undefined`.
		const res = await _getVoices(localStorage.token).catch((e) => {
			toast.error(e);
		});

		if (res) {
			console.log(res);
			voices = res.voices;
		}
	}
};
/**
 * Send the current TTS/STT settings to the backend via `updateAudioConfig`.
 *
 * When the update returns a truthy result, `saveHandler` is invoked and the
 * shared `config` store is refreshed from `getBackendConfig`. The refresh is
 * fire-and-forget: this function does not wait for it, and a failed refresh
 * does not fail the save.
 */
const updateConfigHandler = async () => {
	const res = await updateAudioConfig(localStorage.token, {
		tts: {
			OPENAI_API_BASE_URL: TTS_OPENAI_API_BASE_URL,
			OPENAI_API_KEY: TTS_OPENAI_API_KEY,
			API_KEY: TTS_API_KEY,
			ENGINE: TTS_ENGINE,
			MODEL: TTS_MODEL,
			VOICE: TTS_VOICE,
			SPLIT_ON: TTS_SPLIT_ON
		},
		stt: {
			OPENAI_API_BASE_URL: STT_OPENAI_API_BASE_URL,
			OPENAI_API_KEY: STT_OPENAI_API_KEY,
			ENGINE: STT_ENGINE,
			MODEL: STT_MODEL
		}
	});

	if (res) {
		saveHandler();

		// Best-effort refresh of the shared store. Failures are logged rather
		// than silently dropped so a stale store can be diagnosed.
		getBackendConfig()
			.then(config.set)
			.catch((err) => {
				console.error('Failed to refresh backend config after saving audio settings:', err);
			});
	}
};
// On mount: load the saved audio settings into the local state, then load
// the voice and model lists for the configured TTS engine.
onMount(async () => {
	// Report a failed load the same way the voice/model loaders do instead of
	// aborting the whole callback; the lists below are still loaded using the
	// default (empty) settings.
	const res = await getAudioConfig(localStorage.token).catch((e) => {
		toast.error(e);
	});

	if (res) {
		// The response is deliberately not logged: it carries the API keys.
		TTS_OPENAI_API_BASE_URL = res.tts.OPENAI_API_BASE_URL;
		TTS_OPENAI_API_KEY = res.tts.OPENAI_API_KEY;
		TTS_API_KEY = res.tts.API_KEY;

		TTS_ENGINE = res.tts.ENGINE;
		TTS_MODEL = res.tts.MODEL;
		TTS_VOICE = res.tts.VOICE;

		// `||` on purpose: any falsy stored value (missing or empty) falls back
		// to punctuation splitting.
		TTS_SPLIT_ON = res.tts.SPLIT_ON || TTS_RESPONSE_SPLIT.PUNCTUATION;

		STT_OPENAI_API_BASE_URL = res.stt.OPENAI_API_BASE_URL;
		STT_OPENAI_API_KEY = res.stt.OPENAI_API_KEY;

		STT_ENGINE = res.stt.ENGINE;
		STT_MODEL = res.stt.MODEL;
	}

	// Both loaders read TTS_ENGINE, so they must run after it has been set.
	await getVoices();
	await getModels();
});
< / script >
< form
class="flex flex-col h-full justify-between space-y-3 text-sm"
on:submit| preventDefault={ async () => {
await updateConfigHandler();
dispatch('save');
}}
2024-07-20 07:07:50 +00:00
>
2024-06-09 09:41:52 +00:00
< div class = " space-y-3 overflow-y-scroll scrollbar-hidden h-full" >
2024-06-09 09:05:36 +00:00
< div class = "flex flex-col gap-3" >
< div >
< div class = " mb-1 text-sm font-medium" > { $i18n . t ( 'STT Settings' )} </ div >
< div class = " py-0.5 flex w-full justify-between" >
< div class = " self-center text-xs font-medium" > { $i18n . t ( 'Speech-to-Text Engine' )} </ div >
< div class = "flex items-center relative" >
< select
2024-08-25 00:35:42 +00:00
class="dark:bg-gray-900 cursor-pointer w-fit pr-8 rounded px-2 p-1 text-xs bg-transparent outline-none text-right"
2024-06-09 09:05:36 +00:00
bind:value={ STT_ENGINE }
placeholder="Select an engine"
>
< option value = "" > { $i18n . t ( 'Whisper (Local)' )} </ option >
< option value = "openai" > OpenAI< / option >
< option value = "web" > { $i18n . t ( 'Web API' )} </ option >
< / select >
2024-06-08 03:18:48 +00:00
< / div >
< / div >
2024-06-09 09:05:36 +00:00
{ #if STT_ENGINE === 'openai' }
< div >
< div class = "mt-1 flex gap-2 mb-1" >
2024-06-08 03:18:48 +00:00
< input
2024-07-19 08:17:59 +00:00
class="flex-1 w-full rounded-lg py-2 pl-4 text-sm bg-gray-50 dark:text-gray-300 dark:bg-gray-850 outline-none"
2024-06-09 09:05:36 +00:00
placeholder={ $i18n . t ( 'API Base URL' )}
bind:value={ STT_OPENAI_API_BASE_URL }
required
2024-06-08 03:18:48 +00:00
/>
2024-06-25 12:15:29 +00:00
< SensitiveInput placeholder = { $i18n . t ( 'API Key' )} bind:value= { STT_OPENAI_API_KEY } />
2024-06-08 03:18:48 +00:00
< / div >
< / div >
2024-06-09 09:05:36 +00:00
< hr class = " dark:border-gray-850 my-2" / >
< div >
< div class = " mb-1.5 text-sm font-medium" > { $i18n . t ( 'STT Model' )} </ div >
< div class = "flex w-full" >
< div class = "flex-1" >
< input
list="model-list"
2024-07-09 03:10:00 +00:00
class="w-full rounded-lg py-2 px-4 text-sm bg-gray-50 dark:text-gray-300 dark:bg-gray-850 outline-none"
2024-06-09 09:05:36 +00:00
bind:value={ STT_MODEL }
placeholder="Select a model"
/>
< datalist id = "model-list" >
< option value = "whisper-1" / >
< / datalist >
< / div >
< / div >
< / div >
{ /if }
2024-06-08 03:18:48 +00:00
< / div >
2024-06-09 09:05:36 +00:00
< hr class = " dark:border-gray-800" / >
< div >
< div class = " mb-1 text-sm font-medium" > { $i18n . t ( 'TTS Settings' )} </ div >
< div class = " py-0.5 flex w-full justify-between" >
< div class = " self-center text-xs font-medium" > { $i18n . t ( 'Text-to-Speech Engine' )} </ div >
< div class = "flex items-center relative" >
< select
2024-08-25 00:35:42 +00:00
class=" dark:bg-gray-900 w-fit pr-8 cursor-pointer rounded px-2 p-1 text-xs bg-transparent outline-none text-right"
2024-06-09 09:05:36 +00:00
bind:value={ TTS_ENGINE }
placeholder="Select a mode"
2024-07-20 06:56:00 +00:00
on:change={async (e) => {
	// Read the selection from `currentTarget` (typed as the <select>) and do it
	// before the first await, because `currentTarget` is reset once dispatch ends.
	const engine = e.currentTarget.value;

	// Choose the new engine's default voice/model BEFORE saving, so the
	// persisted config never pairs the new engine with the old engine's values.
	if (engine === 'openai') {
		TTS_VOICE = 'alloy';
		TTS_MODEL = 'tts-1';
	} else {
		TTS_VOICE = '';
		TTS_MODEL = '';
	}

	// Save the new engine first, then reload the voice and model lists for it.
	await updateConfigHandler();
	await getVoices();
	await getModels();
}}
>
< option value = "" > { $i18n . t ( 'Web API' )} </ option >
2024-06-25 06:00:02 +00:00
< option value = "openai" > { $i18n . t ( 'OpenAI' )} </ option >
2024-07-20 07:07:50 +00:00
< option value = "elevenlabs" > { $i18n . t ( 'ElevenLabs' )} </ option >
2024-06-09 09:05:36 +00:00
< / select >
2024-06-08 03:18:48 +00:00
< / div >
< / div >
2024-06-09 09:05:36 +00:00
{ #if TTS_ENGINE === 'openai' }
< div >
< div class = "mt-1 flex gap-2 mb-1" >
< input
2024-07-19 08:17:59 +00:00
class="flex-1 w-full rounded-lg py-2 pl-4 text-sm bg-gray-50 dark:text-gray-300 dark:bg-gray-850 outline-none"
2024-06-09 09:05:36 +00:00
placeholder={ $i18n . t ( 'API Base URL' )}
bind:value={ TTS_OPENAI_API_BASE_URL }
required
/>
2024-06-08 03:18:48 +00:00
2024-06-25 12:15:29 +00:00
< SensitiveInput placeholder = { $i18n . t ( 'API Key' )} bind:value= { TTS_OPENAI_API_KEY } />
2024-06-08 03:18:48 +00:00
< / div >
< / div >
2024-07-19 08:35:05 +00:00
{ :else if TTS_ENGINE === 'elevenlabs' }
< div >
< div class = "mt-1 flex gap-2 mb-1" >
< input
class="flex-1 w-full rounded-lg py-2 pl-4 text-sm bg-gray-50 dark:text-gray-300 dark:bg-gray-850 outline-none"
placeholder={ $i18n . t ( 'API Key' )}
bind:value={ TTS_API_KEY }
required
/>
< / div >
< / div >
2024-06-09 09:05:36 +00:00
{ /if }
< hr class = " dark:border-gray-850 my-2" / >
2024-08-02 17:24:47 +00:00
{ #if TTS_ENGINE === '' }
2024-06-09 09:05:36 +00:00
< div >
2024-06-08 03:18:48 +00:00
< div class = " mb-1.5 text-sm font-medium" > { $i18n . t ( 'TTS Voice' )} </ div >
< div class = "flex w-full" >
< div class = "flex-1" >
2024-06-09 09:05:36 +00:00
< select
2024-07-09 03:10:00 +00:00
class="w-full rounded-lg py-2 px-4 text-sm bg-gray-50 dark:text-gray-300 dark:bg-gray-850 outline-none"
2024-06-08 03:18:48 +00:00
bind:value={ TTS_VOICE }
2024-06-09 09:05:36 +00:00
>
<!-- "Default" is the selected entry exactly when no voice has been chosen. -->
<option value="" selected={TTS_VOICE === ''}>{$i18n.t('Default')}</option>
2024-06-08 03:18:48 +00:00
{ #each voices as voice }
2024-06-09 09:05:36 +00:00
< option
2024-08-02 17:24:47 +00:00
value={ voice . voiceURI }
2024-06-09 09:05:36 +00:00
class="bg-gray-100 dark:bg-gray-700"
2024-08-02 17:24:47 +00:00
selected={ TTS_VOICE === voice . voiceURI } >{ voice . name } < /option
2024-06-09 09:05:36 +00:00
>
2024-06-08 03:18:48 +00:00
{ /each }
2024-06-09 09:05:36 +00:00
< / select >
2024-06-08 03:18:48 +00:00
< / div >
< / div >
< / div >
2024-06-09 09:05:36 +00:00
{:else if TTS_ENGINE === 'openai' || TTS_ENGINE === 'elevenlabs'}
	<!--
		Backend engines (OpenAI and ElevenLabs) share one voice/model picker:
		free-text inputs whose suggestions come from the `voices` and `models`
		lists loaded for the selected engine.
	-->
	<div class=" flex gap-2">
		<div class="w-full">
			<div class=" mb-1.5 text-sm font-medium">{$i18n.t('TTS Voice')}</div>
			<div class="flex w-full">
				<div class="flex-1">
					<input
						list="voice-list"
						class="w-full rounded-lg py-2 px-4 text-sm bg-gray-50 dark:text-gray-300 dark:bg-gray-850 outline-none"
						bind:value={TTS_VOICE}
						placeholder="Select a voice"
					/>

					<datalist id="voice-list">
						{#each voices as voice}
							<option value={voice.id}>{voice.name}</option>
						{/each}
					</datalist>
				</div>
			</div>
		</div>
		<div class="w-full">
			<div class=" mb-1.5 text-sm font-medium">{$i18n.t('TTS Model')}</div>
			<div class="flex w-full">
				<div class="flex-1">
					<input
						list="tts-model-list"
						class="w-full rounded-lg py-2 px-4 text-sm bg-gray-50 dark:text-gray-300 dark:bg-gray-850 outline-none"
						bind:value={TTS_MODEL}
						placeholder="Select a model"
					/>

					<datalist id="tts-model-list">
						{#each models as model}
							<option value={model.id} />
						{/each}
					</datalist>
				</div>
			</div>
		</div>
	</div>
2024-06-09 09:05:36 +00:00
{ /if }
2024-08-25 00:35:42 +00:00
< hr class = "dark:border-gray-850 my-2" / >
< div class = "pt-0.5 flex w-full justify-between" >
< div class = "self-center text-xs font-medium" > { $i18n . t ( 'Response splitting' )} </ div >
< div class = "flex items-center relative" >
< select
class="dark:bg-gray-900 w-fit pr-8 cursor-pointer rounded px-2 p-1 text-xs bg-transparent outline-none text-right"
2024-08-25 00:45:10 +00:00
aria-label="Select how to split message text for TTS requests"
2024-08-25 00:35:42 +00:00
bind:value={ TTS_SPLIT_ON }
>
2024-08-26 13:38:42 +00:00
{ #each Object . values ( TTS_RESPONSE_SPLIT ) as split }
< option value = { split }
>{ $i18n . t ( split . charAt ( 0 ). toUpperCase () + split . slice ( 1 ))} < /option
>
{ /each }
2024-08-25 00:35:42 +00:00
< / select >
< / div >
< / div >
< div class = "mt-2 mb-1 text-xs text-gray-400 dark:text-gray-500" >
{ $i18n . t (
2024-08-25 00:45:10 +00:00
"Control how message text is split for TTS requests. 'Punctuation' splits into sentences, 'paragraphs' splits into paragraphs, and 'none' keeps the message as a single string."
2024-08-25 00:35:42 +00:00
)}
< / div >
2024-06-09 09:05:36 +00:00
< / div >
2024-06-08 03:18:48 +00:00
< / div >
< / div >
< div class = "flex justify-end text-sm font-medium" >
< button
class=" px-4 py-2 bg-emerald-700 hover:bg-emerald-800 text-gray-100 transition rounded-lg"
type="submit"
>
{ $i18n . t ( 'Save' )}
< / button >
< / div >
< / form >