<!-- open-webui/src/lib/components/chat/Settings/Audio.svelte (Svelte, 379 lines, 10 KiB) -->

<script lang="ts">
import { getAudioConfig, updateAudioConfig } from '$lib/apis/audio';
import { user, settings } from '$lib/stores';
import { createEventDispatcher, onMount, getContext } from 'svelte';
import { toast } from 'svelte-sonner';
import Switch from '$lib/components/common/Switch.svelte';

const dispatch = createEventDispatcher();
const i18n = getContext('i18n');

// Component prop: invoked with a partial settings object whenever a value should be persisted.
export let saveSettings: Function;

// Audio

// OpenAI TTS connection settings. For admin users these are filled from, and
// written back to, the audio config API.
let OpenAIUrl = '';
let OpenAIKey = '';
let OpenAISpeaker = '';

// Speech-to-text state.
// NOTE(review): STTEngines is not referenced by the markup of this component.
let STTEngines = ['', 'openai'];
let STTEngine = '';

let conversationMode = false;
let speechAutoSend = false;
let responseAutoPlayback = false;
let nonLocalVoices = false;

// Text-to-speech state. An empty TTSEngine selects the browser Web Speech API.
// NOTE(review): TTSEngines is not referenced by the markup of this component.
let TTSEngines = ['', 'openai'];
let TTSEngine = '';

// Selectable voices: either browser voices or the fixed OpenAI voice names.
let voices: { name: string; localService?: boolean }[] = [];
let speaker = '';

// Selectable OpenAI TTS models and the currently chosen one.
let models: { name: string }[] = [];
let model = '';

// Replace the voice list with the fixed set of OpenAI TTS voice names.
const getOpenAIVoices = () => {
	const openAIVoiceNames = ['alloy', 'echo', 'fable', 'onyx', 'nova', 'shimmer'];
	voices = openAIVoiceNames.map((name) => ({ name }));
};
// Replace the model list with the fixed set of OpenAI TTS model names.
const getOpenAIVoicesModel = () => {
	const openAIModelNames = ['tts-1', 'tts-1-hd'];
	models = openAIModelNames.map((name) => ({ name }));
};
// Load the browser's speech-synthesis voices into `voices`.
//
// Some browsers populate the voice list asynchronously, so an empty result is
// retried every 100 ms. Polling stops as soon as voices are available or after
// a bounded number of attempts, so the timer cannot run forever on a system
// that has no voices installed.
const getWebAPIVoices = () => {
	// Without the Web Speech API there is nothing to list.
	if (typeof speechSynthesis === 'undefined') {
		voices = [];
		return;
	}

	// 50 attempts at 100 ms each is roughly five seconds of polling.
	let attemptsLeft = 50;

	// Returns true once polling should stop.
	const poll = () => {
		// getVoices() is synchronous; no await is needed.
		voices = speechSynthesis.getVoices();
		attemptsLeft -= 1;
		return voices.length > 0 || attemptsLeft <= 0;
	};

	if (poll()) {
		return;
	}

	const getVoicesLoop = setInterval(() => {
		if (poll()) {
			clearInterval(getVoicesLoop);
		}
	}, 100);
};

// Flip conversation mode and persist the result.
// Turning it on also forces auto-playback and auto-send on; turning it off
// leaves those two settings as they are.
const toggleConversationMode = async () => {
	conversationMode = !conversationMode;

	if (conversationMode) {
		responseAutoPlayback = true;
		speechAutoSend = true;
	}

	saveSettings({
		conversationMode,
		responseAutoPlayback,
		speechAutoSend
	});
};

// Invert the auto-playback flag and persist the new value.
const toggleResponseAutoPlayback = async () => {
	const nextValue = !responseAutoPlayback;
	responseAutoPlayback = nextValue;
	saveSettings({ responseAutoPlayback: nextValue });
};
// Invert the speech auto-send flag and persist the new value.
const toggleSpeechAutoSend = async () => {
	const nextValue = !speechAutoSend;
	speechAutoSend = nextValue;
	saveSettings({ speechAutoSend: nextValue });
};
// Push the OpenAI TTS configuration to the audio config API and mirror the
// values it returns back into local state. Does nothing for other engines.
const updateConfigHandler = async () => {
	if (TTSEngine !== 'openai') {
		return;
	}

	const res = await updateAudioConfig(localStorage.token, {
		url: OpenAIUrl,
		key: OpenAIKey,
		model: model,
		speaker: OpenAISpeaker
	});

	// A falsy response leaves the current form values untouched.
	if (res) {
		OpenAIUrl = res.OPENAI_API_BASE_URL;
		OpenAIKey = res.OPENAI_API_KEY;
		model = res.OPENAI_API_MODEL;
		OpenAISpeaker = res.OPENAI_API_VOICE;
	}
};

// Initialise the form from the user's stored settings, load the matching voice
// list, and, for admins, overlay the server-side OpenAI audio configuration.
onMount(async () => {
	conversationMode = $settings?.conversationMode ?? false;
	speechAutoSend = $settings?.speechAutoSend ?? false;
	responseAutoPlayback = $settings?.responseAutoPlayback ?? false;

	STTEngine = $settings?.audio?.STTEngine ?? '';
	TTSEngine = $settings?.audio?.TTSEngine ?? '';
	nonLocalVoices = $settings?.audio?.nonLocalVoices ?? false;

	speaker = $settings?.audio?.speaker ?? '';
	model = $settings?.audio?.model ?? '';

	if (TTSEngine === 'openai') {
		getOpenAIVoices();
		getOpenAIVoicesModel();
	} else {
		getWebAPIVoices();
	}

	if ($user?.role === 'admin') {
		const res = await getAudioConfig(localStorage.token);

		if (res) {
			OpenAIUrl = res.OPENAI_API_BASE_URL;
			OpenAIKey = res.OPENAI_API_KEY;
			// The server-side model replaces the one read from the user's settings above.
			model = res.OPENAI_API_MODEL;
			OpenAISpeaker = res.OPENAI_API_VOICE;

			if (TTSEngine === 'openai') {
				speaker = OpenAISpeaker;
			}
		}
	}
});
</script>
<form
	class="flex flex-col h-full justify-between space-y-3 text-sm"
	on:submit|preventDefault={async () => {
		// Admins also push the OpenAI configuration to the server before saving.
		if ($user.role === 'admin') {
			await updateConfigHandler();
		}

		// The OpenAI engine keeps its voice in a separate field from the Web API one.
		const selectedSpeaker = TTSEngine === 'openai' ? OpenAISpeaker : speaker;

		// Empty strings are stored as undefined so the defaults apply.
		saveSettings({
			audio: {
				STTEngine: STTEngine !== '' ? STTEngine : undefined,
				TTSEngine: TTSEngine !== '' ? TTSEngine : undefined,
				speaker: selectedSpeaker !== '' ? selectedSpeaker : undefined,
				model: model !== '' ? model : undefined,
				nonLocalVoices: nonLocalVoices
			}
		});
		dispatch('save');
	}}
>
<div class=" space-y-3 pr-1.5 overflow-y-scroll max-h-[25rem]">
<!-- Speech-to-text settings: engine selection, conversation mode and auto-send toggles. -->
<div>
	<div class=" mb-1 text-sm font-medium">{$i18n.t('STT Settings')}</div>

	<div class=" py-0.5 flex w-full justify-between">
		<div class=" self-center text-xs font-medium">{$i18n.t('Speech-to-Text Engine')}</div>
		<div class="flex items-center relative">
			<select
				class="dark:bg-gray-900 w-fit pr-8 rounded px-2 p-1 text-xs bg-transparent outline-none text-right"
				bind:value={STTEngine}
				placeholder="Select a mode"
				on:change={(e) => {
					if (e.currentTarget.value !== '') {
						navigator.mediaDevices
							.getUserMedia({ audio: true })
							.then((stream) => {
								// The stream is requested only to trigger the permission prompt;
								// stop its tracks so the microphone is released again.
								stream.getTracks().forEach((track) => track.stop());
							})
							.catch(function (err) {
								toast.error(
									$i18n.t(`Permission denied when accessing microphone: {{error}}`, {
										error: err
									})
								);
								// Fall back to the default engine when access is refused.
								STTEngine = '';
							});
					}
				}}
			>
				<option value="">{$i18n.t('Default (Web API)')}</option>
				<option value="whisper-local">{$i18n.t('Whisper (Local)')}</option>
			</select>
		</div>
	</div>

	<div class=" py-0.5 flex w-full justify-between">
		<div class=" self-center text-xs font-medium">{$i18n.t('Conversation Mode')}</div>

		<button
			class="p-1 px-3 text-xs flex rounded transition"
			on:click={() => {
				toggleConversationMode();
			}}
			type="button"
		>
			{#if conversationMode === true}
				<span class="ml-2 self-center">{$i18n.t('On')}</span>
			{:else}
				<span class="ml-2 self-center">{$i18n.t('Off')}</span>
			{/if}
		</button>
	</div>

	<div class=" py-0.5 flex w-full justify-between">
		<div class=" self-center text-xs font-medium">
			{$i18n.t('Auto-send input after 3 sec.')}
		</div>

		<button
			class="p-1 px-3 text-xs flex rounded transition"
			on:click={() => {
				toggleSpeechAutoSend();
			}}
			type="button"
		>
			{#if speechAutoSend === true}
				<span class="ml-2 self-center">{$i18n.t('On')}</span>
			{:else}
				<span class="ml-2 self-center">{$i18n.t('Off')}</span>
			{/if}
		</button>
	</div>
</div>
<!-- Text-to-speech settings: engine selection, admin-only OpenAI connection fields, auto-playback toggle. -->
<div>
	<div class=" mb-1 text-sm font-medium">{$i18n.t('TTS Settings')}</div>

	<div class=" py-0.5 flex w-full justify-between">
		<div class=" self-center text-xs font-medium">{$i18n.t('Text-to-Speech Engine')}</div>
		<div class="flex items-center relative">
			<select
				class=" dark:bg-gray-900 w-fit pr-8 rounded px-2 p-1 text-xs bg-transparent outline-none text-right"
				bind:value={TTSEngine}
				placeholder="Select a mode"
				on:change={(e) => {
					if (e.currentTarget.value === 'openai') {
						// Load both suggestion lists, matching what onMount does for this engine.
						getOpenAIVoices();
						getOpenAIVoicesModel();
						OpenAISpeaker = 'alloy';
						model = 'tts-1';
					} else {
						getWebAPIVoices();
						speaker = '';
					}
				}}
			>
				<option value="">{$i18n.t('Default (Web API)')}</option>
				<option value="openai">{$i18n.t('Open AI')}</option>
			</select>
		</div>
	</div>

	{#if $user.role === 'admin' && TTSEngine === 'openai'}
		<div class="mt-1 flex gap-2 mb-1">
			<input
				class="w-full rounded-lg py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-850 outline-none"
				placeholder={$i18n.t('API Base URL')}
				bind:value={OpenAIUrl}
				required
			/>

			<input
				class="w-full rounded-lg py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-850 outline-none"
				placeholder={$i18n.t('API Key')}
				bind:value={OpenAIKey}
				required
			/>
		</div>
	{/if}

	<div class=" py-0.5 flex w-full justify-between">
		<div class=" self-center text-xs font-medium">{$i18n.t('Auto-playback response')}</div>

		<button
			class="p-1 px-3 text-xs flex rounded transition"
			on:click={() => {
				toggleResponseAutoPlayback();
			}}
			type="button"
		>
			{#if responseAutoPlayback === true}
				<span class="ml-2 self-center">{$i18n.t('On')}</span>
			{:else}
				<span class="ml-2 self-center">{$i18n.t('Off')}</span>
			{/if}
		</button>
	</div>
</div>
<hr class=" dark:border-gray-700" />
<!-- Voice (and, for OpenAI, model) selection for the active text-to-speech engine. -->
{#if TTSEngine === ''}
	<div>
		<div class=" mb-2.5 text-sm font-medium">{$i18n.t('Set Voice')}</div>
		<div class="flex w-full">
			<div class="flex-1">
				<select
					class="w-full rounded-lg py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-850 outline-none"
					bind:value={speaker}
				>
					<!-- "Default" is the selected entry exactly when no voice has been chosen. -->
					<option value="" selected={speaker === ''}>{$i18n.t('Default')}</option>
					{#each voices.filter((v) => nonLocalVoices || v.localService === true) as voice}
						<option
							value={voice.name}
							class="bg-gray-100 dark:bg-gray-700"
							selected={speaker === voice.name}>{voice.name}</option
						>
					{/each}
				</select>
			</div>
		</div>

		<div class="flex items-center justify-between my-1.5">
			<div class="text-xs">
				{$i18n.t('Allow non-local voices')}
			</div>

			<div class="mt-1">
				<Switch bind:state={nonLocalVoices} />
			</div>
		</div>
	</div>
{:else if TTSEngine === 'openai'}
	<div>
		<div class=" mb-2.5 text-sm font-medium">{$i18n.t('Set Voice')}</div>
		<div class="flex w-full">
			<div class="flex-1">
				<input
					list="voice-list"
					class="w-full rounded-lg py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-850 outline-none"
					bind:value={OpenAISpeaker}
					placeholder="Select a voice"
				/>

				<datalist id="voice-list">
					{#each voices as voice}
						<option value={voice.name} />
					{/each}
				</datalist>
			</div>
		</div>
	</div>
	<div>
		<div class=" mb-2.5 text-sm font-medium">{$i18n.t('Set Model')}</div>
		<div class="flex w-full">
			<div class="flex-1">
				<input
					list="model-list"
					class="w-full rounded-lg py-2 px-4 text-sm dark:text-gray-300 dark:bg-gray-850 outline-none"
					bind:value={model}
					placeholder="Select a model"
				/>

				<datalist id="model-list">
					<!-- The loop item has its own name so it does not shadow the bound `model` value. -->
					{#each models as modelOption}
						<option value={modelOption.name} />
					{/each}
				</datalist>
			</div>
		</div>
	</div>
{/if}
</div>
<!-- Submits the surrounding form, which runs its on:submit handler. -->
<div class="flex justify-end text-sm font-medium">
	<button
		class=" px-4 py-2 bg-emerald-700 hover:bg-emerald-800 text-gray-100 transition rounded-lg"
		type="submit"
	>
		{$i18n.t('Save')}
	</button>
</div>
</form>