open-webui/backend/open_webui/utils/task.py

316 lines
10 KiB
Python
Raw Normal View History

2024-11-25 02:49:56 +00:00
import logging
2024-06-09 21:25:31 +00:00
import math
2024-08-27 22:10:27 +00:00
import re
2024-06-09 21:25:31 +00:00
from datetime import datetime
from typing import Optional
2024-11-25 02:49:56 +00:00
import uuid
2024-06-09 21:25:31 +00:00
2024-09-07 03:50:29 +00:00
from open_webui.utils.misc import get_last_user_message, get_messages_content
2024-11-25 02:49:56 +00:00
from open_webui.env import SRC_LOG_LEVELS
from open_webui.config import DEFAULT_RAG_TEMPLATE
log = logging.getLogger(__name__)
log.setLevel(SRC_LOG_LEVELS["RAG"])
2024-09-07 03:50:29 +00:00
2024-12-12 03:52:46 +00:00
def get_task_model_id(
default_model_id: str, task_model: str, task_model_external: str, models
) -> str:
# Set the task model
task_model_id = default_model_id
# Check if the user has a custom task model and use that model
if models[task_model_id]["owned_by"] == "ollama":
if task_model and task_model in models:
task_model_id = task_model
else:
if task_model_external and task_model_external in models:
task_model_id = task_model_external
return task_model_id
2024-06-09 21:25:31 +00:00
def prompt_template(
2024-08-03 13:24:26 +00:00
template: str, user_name: Optional[str] = None, user_location: Optional[str] = None
2024-06-09 21:25:31 +00:00
) -> str:
# Get the current date
current_date = datetime.now()
# Format the date to YYYY-MM-DD
formatted_date = current_date.strftime("%Y-%m-%d")
2024-06-16 16:39:48 +00:00
formatted_time = current_date.strftime("%I:%M:%S %p")
2024-11-27 04:03:06 +00:00
formatted_weekday = current_date.strftime("%A")
2024-06-09 21:25:31 +00:00
template = template.replace("{{CURRENT_DATE}}", formatted_date)
2024-06-16 16:39:48 +00:00
template = template.replace("{{CURRENT_TIME}}", formatted_time)
template = template.replace(
"{{CURRENT_DATETIME}}", f"{formatted_date} {formatted_time}"
)
template = template.replace("{{CURRENT_WEEKDAY}}", formatted_weekday)
2024-06-09 21:25:31 +00:00
if user_name:
# Replace {{USER_NAME}} in the template with the user's name
template = template.replace("{{USER_NAME}}", user_name)
2024-06-17 21:39:21 +00:00
else:
# Replace {{USER_NAME}} in the template with "Unknown"
template = template.replace("{{USER_NAME}}", "Unknown")
2024-06-09 21:25:31 +00:00
2024-06-16 22:32:26 +00:00
if user_location:
# Replace {{USER_LOCATION}} in the template with the current location
template = template.replace("{{USER_LOCATION}}", user_location)
2024-06-17 21:39:21 +00:00
else:
# Replace {{USER_LOCATION}} in the template with "Unknown"
template = template.replace("{{USER_LOCATION}}", "Unknown")
2024-06-09 21:25:31 +00:00
return template
2024-09-07 03:50:29 +00:00
def replace_prompt_variable(template: str, prompt: str) -> str:
2024-06-09 21:25:31 +00:00
def replacement_function(match):
2024-11-29 08:16:49 +00:00
full_match = match.group(
0
).lower() # Normalize to lowercase for consistent handling
2024-06-09 21:25:31 +00:00
start_length = match.group(1)
end_length = match.group(2)
middle_length = match.group(3)
if full_match == "{{prompt}}":
return prompt
elif start_length is not None:
return prompt[: int(start_length)]
elif end_length is not None:
return prompt[-int(end_length) :]
elif middle_length is not None:
middle_length = int(middle_length)
if len(prompt) <= middle_length:
return prompt
start = prompt[: math.ceil(middle_length / 2)]
end = prompt[-math.floor(middle_length / 2) :]
return f"{start}...{end}"
return ""
2024-11-29 08:16:49 +00:00
# Updated regex pattern to make it case-insensitive with the `(?i)` flag
pattern = r"(?i){{prompt}}|{{prompt:start:(\d+)}}|{{prompt:end:(\d+)}}|{{prompt:middletruncate:(\d+)}}"
template = re.sub(pattern, replacement_function, template)
2024-09-07 03:50:29 +00:00
return template
2024-06-09 21:25:31 +00:00
2024-09-07 03:50:29 +00:00
2024-12-01 07:50:05 +00:00
def replace_messages_variable(
template: str, messages: Optional[list[str]] = None
) -> str:
2024-06-09 21:53:10 +00:00
def replacement_function(match):
full_match = match.group(0)
start_length = match.group(1)
end_length = match.group(2)
middle_length = match.group(3)
2024-12-01 07:50:05 +00:00
# If messages is None, handle it as an empty list
if messages is None:
return ""
2024-06-09 21:53:10 +00:00
2024-09-07 03:50:29 +00:00
# Process messages based on the number of messages required
if full_match == "{{MESSAGES}}":
return get_messages_content(messages)
2024-06-09 21:53:10 +00:00
elif start_length is not None:
2024-09-07 03:50:29 +00:00
return get_messages_content(messages[: int(start_length)])
2024-06-09 21:53:10 +00:00
elif end_length is not None:
2024-09-07 03:50:29 +00:00
return get_messages_content(messages[-int(end_length) :])
2024-06-09 21:53:10 +00:00
elif middle_length is not None:
2024-09-07 03:50:29 +00:00
mid = int(middle_length)
if len(messages) <= mid:
return get_messages_content(messages)
# Handle middle truncation: split to get start and end portions of the messages list
half = mid // 2
start_msgs = messages[:half]
end_msgs = messages[-half:] if mid % 2 == 0 else messages[-(half + 1) :]
formatted_start = get_messages_content(start_msgs)
formatted_end = get_messages_content(end_msgs)
return f"{formatted_start}\n{formatted_end}"
2024-06-09 21:53:10 +00:00
return ""
template = re.sub(
2024-09-07 03:50:29 +00:00
r"{{MESSAGES}}|{{MESSAGES:START:(\d+)}}|{{MESSAGES:END:(\d+)}}|{{MESSAGES:MIDDLETRUNCATE:(\d+)}}",
2024-06-09 21:53:10 +00:00
replacement_function,
template,
)
2024-09-07 03:50:29 +00:00
return template
2024-10-21 11:24:17 +00:00
# {{prompt:middletruncate:8000}}
2024-11-25 02:49:56 +00:00
def rag_template(template: str, context: str, query: str):
2024-11-28 03:24:20 +00:00
if template.strip() == "":
2024-11-25 02:49:56 +00:00
template = DEFAULT_RAG_TEMPLATE
if "[context]" not in template and "{{CONTEXT}}" not in template:
log.debug(
"WARNING: The RAG template does not contain the '[context]' or '{{CONTEXT}}' placeholder."
)
if "<context>" in context and "</context>" in context:
log.debug(
"WARNING: Potential prompt injection attack: the RAG "
"context contains '<context>' and '</context>'. This might be "
"nothing, or the user might be trying to hack something."
)
query_placeholders = []
if "[query]" in context:
query_placeholder = "{{QUERY" + str(uuid.uuid4()) + "}}"
template = template.replace("[query]", query_placeholder)
query_placeholders.append(query_placeholder)
if "{{QUERY}}" in context:
query_placeholder = "{{QUERY" + str(uuid.uuid4()) + "}}"
template = template.replace("{{QUERY}}", query_placeholder)
query_placeholders.append(query_placeholder)
template = template.replace("[context]", context)
template = template.replace("{{CONTEXT}}", context)
template = template.replace("[query]", query)
template = template.replace("{{QUERY}}", query)
for query_placeholder in query_placeholders:
template = template.replace(query_placeholder, query)
return template
2024-10-21 11:24:17 +00:00
def title_generation_template(
template: str, messages: list[dict], user: Optional[dict] = None
) -> str:
prompt = get_last_user_message(messages)
template = replace_prompt_variable(template, prompt)
template = replace_messages_variable(template, messages)
template = prompt_template(
template,
**(
{"user_name": user.get("name"), "user_location": user.get("location")}
if user
else {}
),
)
return template
2024-10-20 03:34:17 +00:00
def tags_generation_template(
template: str, messages: list[dict], user: Optional[dict] = None
) -> str:
prompt = get_last_user_message(messages)
template = replace_prompt_variable(template, prompt)
template = replace_messages_variable(template, messages)
template = prompt_template(
template,
**(
{"user_name": user.get("name"), "user_location": user.get("location")}
if user
else {}
),
)
return template
2024-10-22 18:23:38 +00:00
def emoji_generation_template(
template: str, prompt: str, user: Optional[dict] = None
) -> str:
template = replace_prompt_variable(template, prompt)
template = prompt_template(
template,
**(
{"user_name": user.get("name"), "user_location": user.get("location")}
if user
else {}
),
)
return template
2024-11-29 07:53:52 +00:00
def autocomplete_generation_template(
template: str,
2024-11-30 08:29:27 +00:00
prompt: str,
messages: Optional[list[dict]] = None,
2024-11-29 09:02:32 +00:00
type: Optional[str] = None,
2024-11-29 07:53:52 +00:00
user: Optional[dict] = None,
) -> str:
2024-11-29 09:02:32 +00:00
template = template.replace("{{TYPE}}", type if type else "")
2024-11-29 07:53:52 +00:00
template = replace_prompt_variable(template, prompt)
2024-12-01 07:50:05 +00:00
template = replace_messages_variable(template, messages)
2024-11-30 08:29:27 +00:00
2024-11-29 07:53:52 +00:00
template = prompt_template(
template,
**(
{"user_name": user.get("name"), "user_location": user.get("location")}
if user
else {}
),
)
return template
2024-11-19 10:24:32 +00:00
def query_generation_template(
2024-09-07 03:50:29 +00:00
template: str, messages: list[dict], user: Optional[dict] = None
) -> str:
prompt = get_last_user_message(messages)
template = replace_prompt_variable(template, prompt)
template = replace_messages_variable(template, messages)
2024-06-09 21:53:10 +00:00
template = prompt_template(
template,
**(
2024-06-16 22:32:26 +00:00
{"user_name": user.get("name"), "user_location": user.get("location")}
2024-06-09 21:53:10 +00:00
if user
else {}
),
)
return template
2024-06-11 06:40:27 +00:00
2024-08-18 18:59:59 +00:00
def moa_response_generation_template(
template: str, prompt: str, responses: list[str]
) -> str:
def replacement_function(match):
full_match = match.group(0)
start_length = match.group(1)
end_length = match.group(2)
middle_length = match.group(3)
if full_match == "{{prompt}}":
return prompt
elif start_length is not None:
return prompt[: int(start_length)]
elif end_length is not None:
return prompt[-int(end_length) :]
elif middle_length is not None:
middle_length = int(middle_length)
if len(prompt) <= middle_length:
return prompt
start = prompt[: math.ceil(middle_length / 2)]
end = prompt[-math.floor(middle_length / 2) :]
return f"{start}...{end}"
return ""
template = re.sub(
r"{{prompt}}|{{prompt:start:(\d+)}}|{{prompt:end:(\d+)}}|{{prompt:middletruncate:(\d+)}}",
replacement_function,
template,
)
responses = [f'"""{response}"""' for response in responses]
responses = "\n\n".join(responses)
template = template.replace("{{responses}}", responses)
return template
2024-08-17 15:01:35 +00:00
def tools_function_calling_generation_template(template: str, tools_specs: str) -> str:
2024-06-11 06:40:27 +00:00
template = template.replace("{{TOOLS}}", tools_specs)
return template