diff --git a/backend/apps/web/models/models.py b/backend/apps/web/models/models.py index 2329b8f88..bf835c8fd 100644 --- a/backend/apps/web/models/models.py +++ b/backend/apps/web/models/models.py @@ -31,7 +31,6 @@ class ModelParams(BaseModel): # ModelMeta is a model for the data stored in the meta field of the Model table -# It isn't currently used in the backend, but it's here as a reference class ModelMeta(BaseModel): profile_image_url: Optional[str] = "/favicon.png" @@ -40,10 +39,7 @@ class ModelMeta(BaseModel): User-facing description of the model. """ - vision_capable: Optional[bool] = None - """ - A flag indicating if the model is capable of vision and thus image inputs - """ + capabilities: Optional[dict] = None model_config = ConfigDict(extra="allow") diff --git a/src/lib/components/chat/MessageInput.svelte b/src/lib/components/chat/MessageInput.svelte index 5ed6ee129..afff1217d 100644 --- a/src/lib/components/chat/MessageInput.svelte +++ b/src/lib/components/chat/MessageInput.svelte @@ -53,7 +53,11 @@ export let messages = []; let speechRecognition; - let visionCapableState = 'all'; + + let visionCapableModels = []; + $: visionCapableModels = [...(atSelectedModel ? [atSelectedModel] : selectedModels)].filter( + (model) => $models.find((m) => m.id === model)?.info?.meta?.capabilities?.vision ?? true + ); $: if (prompt) { if (chatTextAreaElement) { @@ -62,49 +66,6 @@ } } - // $: { - // if (atSelectedModel || selectedModels) { - // visionCapableState = checkModelsAreVisionCapable(); - // if (visionCapableState === 'none') { - // // Remove all image files - // const fileCount = files.length; - // files = files.filter((file) => file.type != 'image'); - // if (files.length < fileCount) { - // toast.warning($i18n.t('All selected models do not support image input, removed images')); - // } - // } - // } - // } - - const checkModelsAreVisionCapable = () => { - let modelsToCheck = []; - if (atSelectedModel !== undefined) { - modelsToCheck = [atSelectedModel.id]; - } else { - modelsToCheck = selectedModels; - } - if (modelsToCheck.length == 0 || modelsToCheck[0] == '') { - return 'all'; - } - let visionCapableCount = 0; - for (const modelName of modelsToCheck) { - const model = $models.find((m) => m.id === modelName); - if (!model) { - continue; - } - if (model.custom_info?.meta.vision_capable ?? true) { - visionCapableCount++; - } - } - if (visionCapableCount == modelsToCheck.length) { - return 'all'; - } else if (visionCapableCount == 0) { - return 'none'; - } else { - return 'some'; - } - }; - let mediaRecorder; let audioChunks = []; let isRecording = false; @@ -404,8 +365,8 @@ inputFiles.forEach((file) => { console.log(file, file.name.split('.').at(-1)); if (['image/gif', 'image/webp', 'image/jpeg', 'image/png'].includes(file['type'])) { - if (visionCapableState == 'none') { - toast.error($i18n.t('Selected models do not support image inputs')); + if (visionCapableModels.length === 0) { + toast.error($i18n.t('Selected model(s) do not support image inputs')); return; } let reader = new FileReader(); @@ -600,8 +561,8 @@ if ( ['image/gif', 'image/webp', 'image/jpeg', 'image/png'].includes(file['type']) ) { - if (visionCapableState === 'none') { - toast.error($i18n.t('Selected models do not support image inputs')); + if (visionCapableModels.length === 0) { + toast.error($i18n.t('Selected model(s) do not support image inputs')); inputFiles = null; filesInputElement.value = ''; return; @@ -645,6 +606,7 @@ dir={$settings?.chatDirection ?? 'LTR'} class=" flex flex-col relative w-full rounded-3xl px-1.5 bg-gray-50 dark:bg-gray-850 dark:text-gray-100" on:submit|preventDefault={() => { + // check if selectedModels support image input submitPrompt(prompt, user); }} > @@ -659,16 +621,20 @@ alt="input" class=" h-16 w-16 rounded-xl object-cover" /> - {#if visionCapableState === 'some'} + {#if atSelectedModel ? visionCapableModels.length === 0 : selectedModels.length !== visionCapableModels.length} !visionCapableModels.includes(id)) + .join(', ') + })} > -
+
{$i18n.t('Seed')}
diff --git a/src/lib/components/common/Checkbox.svelte b/src/lib/components/common/Checkbox.svelte index f69a58401..3d43a6950 100644 --- a/src/lib/components/common/Checkbox.svelte +++ b/src/lib/components/common/Checkbox.svelte @@ -29,6 +29,7 @@ dispatch('change', _state); } }} + type="button" >
{#if _state === 'checked'} diff --git a/src/lib/components/workspace/Models.svelte b/src/lib/components/workspace/Models.svelte index bcf7eb31e..cdbd79691 100644 --- a/src/lib/components/workspace/Models.svelte +++ b/src/lib/components/workspace/Models.svelte @@ -142,7 +142,7 @@
{model.name}
- {model?.info?.meta?.description ?? model.id} + {!!model?.info?.meta?.description ? model?.info?.meta?.description : model.id}
diff --git a/src/routes/(app)/workspace/models/create/+page.svelte b/src/routes/(app)/workspace/models/create/+page.svelte index b8bdb7b41..a3bbca921 100644 --- a/src/routes/(app)/workspace/models/create/+page.svelte +++ b/src/routes/(app)/workspace/models/create/+page.svelte @@ -9,6 +9,7 @@ import { getModels } from '$lib/apis'; import AdvancedParams from '$lib/components/chat/Settings/Advanced/AdvancedParams.svelte'; + import Checkbox from '$lib/components/common/Checkbox.svelte'; const i18n = getContext('i18n'); @@ -48,6 +49,10 @@ let params = {}; + let capabilities = { + vision: false + }; + $: if (name) { id = name.replace(/\s+/g, '-').toLowerCase(); } @@ -57,6 +62,7 @@ info.id = id; info.name = name; + info.meta.capabilities = capabilities; if ($models.find((m) => m.id === info.id)) { toast.error( @@ -298,14 +304,13 @@
-
{$i18n.t('Description')}*
+
{$i18n.t('Description')}
@@ -329,7 +334,7 @@
-
+
{$i18n.t('Advanced Params')}
@@ -422,6 +427,28 @@
+
+
+
{$i18n.t('Capabilities')}
+
+
+ {#each Object.keys(capabilities) as capability} +
+ { + capabilities[capability] = e.detail === 'checked'; + }} + /> + +
+ {$i18n.t(capability)} +
+
+ {/each} +
+
+
{$i18n.t('JSON Preview')}
diff --git a/src/routes/(app)/workspace/models/edit/+page.svelte b/src/routes/(app)/workspace/models/edit/+page.svelte index a0bbc2f10..18efe5a08 100644 --- a/src/routes/(app)/workspace/models/edit/+page.svelte +++ b/src/routes/(app)/workspace/models/edit/+page.svelte @@ -12,6 +12,7 @@ import AdvancedParams from '$lib/components/chat/Settings/Advanced/AdvancedParams.svelte'; import { getModels } from '$lib/apis'; + import Checkbox from '$lib/components/common/Checkbox.svelte'; const i18n = getContext('i18n'); @@ -53,11 +54,16 @@ let params = {}; + let capabilities = { + vision: true + }; + const updateHandler = async () => { loading = true; info.id = id; info.name = name; + info.meta.capabilities = capabilities; const res = await updateModelById(localStorage.token, info.id, info); @@ -98,6 +104,10 @@ info.base_model_id = `${info.base_model_id}:latest`; } + if (model?.info?.meta?.capabilities) { + capabilities = { ...capabilities, ...model?.info?.meta?.capabilities }; + } + console.log(model); } else { goto('/workspace/models'); @@ -291,14 +301,13 @@ {/if}
-
{$i18n.t('Description')}*
+
{$i18n.t('Description')}
@@ -324,7 +333,7 @@
-
+
{$i18n.t('Advanced Params')}
@@ -417,6 +426,28 @@
+
+
+
{$i18n.t('Capabilities')}
+
+
+ {#each Object.keys(capabilities) as capability} +
+ { + capabilities[capability] = e.detail === 'checked'; + }} + /> + +
+ {$i18n.t(capability)} +
+
+ {/each} +
+
+
{$i18n.t('JSON Preview')}
diff --git a/src/routes/(app)/workspace/models/edit/asdf.json b/src/routes/(app)/workspace/models/edit/asdf.json deleted file mode 100644 index a7255cca7..000000000 --- a/src/routes/(app)/workspace/models/edit/asdf.json +++ /dev/null @@ -1,28 +0,0 @@ -{ - "description": "Developer lead assistant with no code explanation", - "profile_image_url": "", - "ollama": { - "modelfile": "FROM llama3\nPARAMETER temperature 1\nSYSTEM \"\"\"\nI want you to act as a senior full-stack tech leader and top-tier brilliant software developer, you embody technical excellence and a deep understanding of a wide range of technologies. Your expertise covers not just coding, but also algorithm design, system architecture, and technology strategy. for every question there is no need to explain, only give the solution.\n\nCoding Mastery: Possess exceptional skills in programming languages including Python, JavaScript, SQL, NoSQL, mySQL, C++, C, Rust, Groovy, Go, and Java. Your proficiency goes beyond mere syntax; you explore and master the nuances and complexities of each language, crafting code that is both highly efficient and robust. Your capability to optimize performance and manage complex codebases sets the benchmark in software development.\n\nPython | JavaScript | C++ | C | RUST | Groovy | Go | Java | SQL | MySQL | NoSQL\nEfficient, Optimal, Good Performance, Excellent Complexity, Robust Code\n\nCutting-Edge Technologies: Adept at leveraging the latest technologies, frameworks, and tools to drive innovation and efficiency. Experienced with Docker, Kubernetes, React, Angular, AWS, Supabase, Firebase, Azure, and Google Cloud. Your understanding of these platforms enables you to architect and deploy scalable, resilient applications that meet modern business demands.\n\nDocker | Kubernetes | React | Angular | AWS | Supabase | Firebase | Azure | Google Cloud\nSeamlessly Integrating Modern Tech Stacks\n\nComplex Algorithms & Data Structures\nOptimized Solutions for Enhanced Performance & Scalability\n\nSolution Architect: Your comprehensive grasp of the software development lifecycle empowers you to design solutions that are not only technically sound but also align perfectly with business goals. From concept to deployment, you ensure adherence to industry best practices and agile methodologies, making the development process both agile and effective.\n\nInteractive Solutions: When crafting user-facing features, employ modern ES6 JavaScript, TypeScript, and native browser APIs to manage interactivity seamlessly, enabling a dynamic and engaging user experience. Your focus lies in delivering functional, ready-to-deploy code, ensuring that explanations are succinct and directly aligned with the required solutions.\n\nnever explain the code just write code \n\"\"\"" - }, - "suggestion_prompts": [ - { - "content": "Create a pac-man game in C" - }, - { - "content": "Create react page example" - }, - { - "content": "write character collisions in godot engine" - } - ], - "categories": [ - "assistant", - "programming", - "data analysis" - ], - "user": { - "username": "vianch", - "name": "", - "community": true - } -} \ No newline at end of file