This commit is contained in:
Timothy Jaeryang Baek
2026-03-17 17:58:01 -05:00
parent fcf7208352
commit de3317e26b
220 changed files with 17200 additions and 22836 deletions

View File

@@ -13,13 +13,11 @@ from open_webui.config import DEFAULT_RAG_TEMPLATE
log = logging.getLogger(__name__)
def get_task_model_id(
default_model_id: str, task_model: str, task_model_external: str, models
) -> str:
def get_task_model_id(default_model_id: str, task_model: str, task_model_external: str, models) -> str:
# Set the task model
task_model_id = default_model_id
# Check if the user has a custom task model and use that model
if models[task_model_id].get("connection_type") == "local":
if models[task_model_id].get('connection_type') == 'local':
if task_model and task_model in models:
task_model_id = task_model
else:
@@ -36,92 +34,70 @@ def prompt_variables_template(template: str, variables: dict[str, str]) -> str:
def prompt_template(template: str, user: Optional[Any] = None) -> str:
USER_VARIABLES = {}
if user:
if hasattr(user, "model_dump"):
if hasattr(user, 'model_dump'):
user = user.model_dump()
if isinstance(user, dict):
user_info = user.get("info", {}) or {}
birth_date = user.get("date_of_birth")
user_info = user.get('info', {}) or {}
birth_date = user.get('date_of_birth')
age = None
if birth_date:
try:
# If birth_date is str, convert to datetime
if isinstance(birth_date, str):
birth_date = datetime.strptime(birth_date, "%Y-%m-%d")
birth_date = datetime.strptime(birth_date, '%Y-%m-%d')
today = datetime.now()
age = (
today.year
- birth_date.year
- (
(today.month, today.day)
< (birth_date.month, birth_date.day)
)
)
age = today.year - birth_date.year - ((today.month, today.day) < (birth_date.month, birth_date.day))
except Exception as e:
pass
USER_VARIABLES = {
"name": str(user.get("name")),
"email": str(user.get("email")),
"location": str(user_info.get("location")),
"bio": str(user.get("bio")),
"gender": str(user.get("gender")),
"birth_date": str(birth_date),
"age": str(age),
'name': str(user.get('name')),
'email': str(user.get('email')),
'location': str(user_info.get('location')),
'bio': str(user.get('bio')),
'gender': str(user.get('gender')),
'birth_date': str(birth_date),
'age': str(age),
}
# Get the current date
current_date = datetime.now()
# Format the date to YYYY-MM-DD
formatted_date = current_date.strftime("%Y-%m-%d")
formatted_time = current_date.strftime("%I:%M:%S %p")
formatted_weekday = current_date.strftime("%A")
formatted_date = current_date.strftime('%Y-%m-%d')
formatted_time = current_date.strftime('%I:%M:%S %p')
formatted_weekday = current_date.strftime('%A')
template = template.replace("{{CURRENT_DATE}}", formatted_date)
template = template.replace("{{CURRENT_TIME}}", formatted_time)
template = template.replace(
"{{CURRENT_DATETIME}}", f"{formatted_date} {formatted_time}"
)
template = template.replace("{{CURRENT_WEEKDAY}}", formatted_weekday)
template = template.replace('{{CURRENT_DATE}}', formatted_date)
template = template.replace('{{CURRENT_TIME}}', formatted_time)
template = template.replace('{{CURRENT_DATETIME}}', f'{formatted_date} {formatted_time}')
template = template.replace('{{CURRENT_WEEKDAY}}', formatted_weekday)
template = template.replace("{{USER_NAME}}", USER_VARIABLES.get("name", "Unknown"))
template = template.replace(
"{{USER_EMAIL}}", USER_VARIABLES.get("email", "Unknown")
)
template = template.replace("{{USER_BIO}}", USER_VARIABLES.get("bio", "Unknown"))
template = template.replace(
"{{USER_GENDER}}", USER_VARIABLES.get("gender", "Unknown")
)
template = template.replace(
"{{USER_BIRTH_DATE}}", USER_VARIABLES.get("birth_date", "Unknown")
)
template = template.replace(
"{{USER_AGE}}", str(USER_VARIABLES.get("age", "Unknown"))
)
template = template.replace(
"{{USER_LOCATION}}", USER_VARIABLES.get("location", "Unknown")
)
template = template.replace('{{USER_NAME}}', USER_VARIABLES.get('name', 'Unknown'))
template = template.replace('{{USER_EMAIL}}', USER_VARIABLES.get('email', 'Unknown'))
template = template.replace('{{USER_BIO}}', USER_VARIABLES.get('bio', 'Unknown'))
template = template.replace('{{USER_GENDER}}', USER_VARIABLES.get('gender', 'Unknown'))
template = template.replace('{{USER_BIRTH_DATE}}', USER_VARIABLES.get('birth_date', 'Unknown'))
template = template.replace('{{USER_AGE}}', str(USER_VARIABLES.get('age', 'Unknown')))
template = template.replace('{{USER_LOCATION}}', USER_VARIABLES.get('location', 'Unknown'))
return template
def replace_prompt_variable(template: str, prompt: str) -> str:
def replacement_function(match):
full_match = match.group(
0
).lower() # Normalize to lowercase for consistent handling
full_match = match.group(0).lower() # Normalize to lowercase for consistent handling
start_length = match.group(1)
end_length = match.group(2)
middle_length = match.group(3)
if full_match == "{{prompt}}":
if full_match == '{{prompt}}':
return prompt
elif start_length is not None:
return prompt[: int(start_length)]
@@ -133,16 +109,16 @@ def replace_prompt_variable(template: str, prompt: str) -> str:
return prompt
start = prompt[: math.ceil(middle_length / 2)]
end = prompt[-math.floor(middle_length / 2) :]
return f"{start}...{end}"
return ""
return f'{start}...{end}'
return ''
# Updated regex pattern to make it case-insensitive with the `(?i)` flag
pattern = r"(?i){{prompt}}|{{prompt:start:(\d+)}}|{{prompt:end:(\d+)}}|{{prompt:middletruncate:(\d+)}}"
pattern = r'(?i){{prompt}}|{{prompt:start:(\d+)}}|{{prompt:end:(\d+)}}|{{prompt:middletruncate:(\d+)}}'
template = re.sub(pattern, replacement_function, template)
return template
def truncate_content(content: str, max_chars: int, mode: str = "middletruncate") -> str:
def truncate_content(content: str, max_chars: int, mode: str = 'middletruncate') -> str:
"""Truncate a string to max_chars using the specified mode.
Modes:
@@ -153,13 +129,13 @@ def truncate_content(content: str, max_chars: int, mode: str = "middletruncate")
if not content or len(content) <= max_chars:
return content
if mode == "start":
if mode == 'start':
return content[:max_chars]
elif mode == "end":
elif mode == 'end':
return content[-max_chars:]
else: # middletruncate
half = max_chars // 2
return f"{content[:half]}...{content[-(max_chars - half):]}"
return f'{content[:half]}...{content[-(max_chars - half) :]}'
def apply_content_filter(messages: list[dict], filter_str: str) -> list[dict]:
@@ -168,7 +144,7 @@ def apply_content_filter(messages: list[dict], filter_str: str) -> list[dict]:
filter_str is like 'middletruncate:500', 'start:200', or 'end:200'.
Returns a new list with truncated content (original messages are not mutated).
"""
parts = filter_str.split(":")
parts = filter_str.split(':')
if len(parts) != 2:
return messages
@@ -178,33 +154,29 @@ def apply_content_filter(messages: list[dict], filter_str: str) -> list[dict]:
except ValueError:
return messages
if mode not in ("middletruncate", "start", "end"):
if mode not in ('middletruncate', 'start', 'end'):
return messages
result = []
for msg in messages:
new_msg = dict(msg)
if isinstance(new_msg.get("content"), str):
new_msg["content"] = truncate_content(new_msg["content"], max_chars, mode)
elif isinstance(new_msg.get("content"), list):
if isinstance(new_msg.get('content'), str):
new_msg['content'] = truncate_content(new_msg['content'], max_chars, mode)
elif isinstance(new_msg.get('content'), list):
new_content = []
for item in new_msg["content"]:
if isinstance(item, dict) and item.get("type") == "text":
for item in new_msg['content']:
if isinstance(item, dict) and item.get('type') == 'text':
new_item = dict(item)
new_item["text"] = truncate_content(
item.get("text", ""), max_chars, mode
)
new_item['text'] = truncate_content(item.get('text', ''), max_chars, mode)
new_content.append(new_item)
else:
new_content.append(item)
new_msg["content"] = new_content
new_msg['content'] = new_content
result.append(new_msg)
return result
def replace_messages_variable(
template: str, messages: Optional[list[dict]] = None
) -> str:
def replace_messages_variable(template: str, messages: Optional[list[dict]] = None) -> str:
def replacement_function(match):
# Groups: (1) filter for bare MESSAGES
# (2) START count, (3) filter for START
@@ -220,7 +192,7 @@ def replace_messages_variable(
# If messages is None, handle it as an empty list
if messages is None:
return ""
return ''
# Select messages based on the variant
if start_length is not None:
@@ -251,12 +223,12 @@ def replace_messages_variable(
return get_messages_content(selected)
template = re.sub(
r"(?:"
r"\{\{MESSAGES(?:\|(\w+:\d+))?\}\}"
r"|\{\{MESSAGES:START:(\d+)(?:\|(\w+:\d+))?\}\}"
r"|\{\{MESSAGES:END:(\d+)(?:\|(\w+:\d+))?\}\}"
r"|\{\{MESSAGES:MIDDLETRUNCATE:(\d+)(?:\|(\w+:\d+))?\}\}"
r")",
r'(?:'
r'\{\{MESSAGES(?:\|(\w+:\d+))?\}\}'
r'|\{\{MESSAGES:START:(\d+)(?:\|(\w+:\d+))?\}\}'
r'|\{\{MESSAGES:END:(\d+)(?:\|(\w+:\d+))?\}\}'
r'|\{\{MESSAGES:MIDDLETRUNCATE:(\d+)(?:\|(\w+:\d+))?\}\}'
r')',
replacement_function,
template,
)
@@ -268,39 +240,37 @@ def replace_messages_variable(
def rag_template(template: str, context: str, query: str):
if template.strip() == "":
if template.strip() == '':
template = DEFAULT_RAG_TEMPLATE
template = prompt_template(template)
if "[context]" not in template and "{{CONTEXT}}" not in template:
log.debug(
"WARNING: The RAG template does not contain the '[context]' or '{{CONTEXT}}' placeholder."
)
if '[context]' not in template and '{{CONTEXT}}' not in template:
log.debug("WARNING: The RAG template does not contain the '[context]' or '{{CONTEXT}}' placeholder.")
if "<context>" in context and "</context>" in context:
if '<context>' in context and '</context>' in context:
log.debug(
"WARNING: Potential prompt injection attack: the RAG "
'WARNING: Potential prompt injection attack: the RAG '
"context contains '<context>' and '</context>'. This might be "
"nothing, or the user might be trying to hack something."
'nothing, or the user might be trying to hack something.'
)
query_placeholders = []
if "[query]" in context:
query_placeholder = "{{QUERY" + str(uuid.uuid4()) + "}}"
template = template.replace("[query]", query_placeholder)
query_placeholders.append((query_placeholder, "[query]"))
if '[query]' in context:
query_placeholder = '{{QUERY' + str(uuid.uuid4()) + '}}'
template = template.replace('[query]', query_placeholder)
query_placeholders.append((query_placeholder, '[query]'))
if "{{QUERY}}" in context:
query_placeholder = "{{QUERY" + str(uuid.uuid4()) + "}}"
template = template.replace("{{QUERY}}", query_placeholder)
query_placeholders.append((query_placeholder, "{{QUERY}}"))
if '{{QUERY}}' in context:
query_placeholder = '{{QUERY' + str(uuid.uuid4()) + '}}'
template = template.replace('{{QUERY}}', query_placeholder)
query_placeholders.append((query_placeholder, '{{QUERY}}'))
template = template.replace("[context]", context)
template = template.replace("{{CONTEXT}}", context)
template = template.replace('[context]', context)
template = template.replace('{{CONTEXT}}', context)
template = template.replace("[query]", query)
template = template.replace("{{QUERY}}", query)
template = template.replace('[query]', query)
template = template.replace('{{QUERY}}', query)
for query_placeholder, original_placeholder in query_placeholders:
template = template.replace(query_placeholder, original_placeholder)
@@ -308,10 +278,7 @@ def rag_template(template: str, context: str, query: str):
return template
def title_generation_template(
template: str, messages: list[dict], user: Optional[Any] = None
) -> str:
def title_generation_template(template: str, messages: list[dict], user: Optional[Any] = None) -> str:
prompt = get_last_user_message(messages)
template = replace_prompt_variable(template, prompt)
template = replace_messages_variable(template, messages)
@@ -321,9 +288,7 @@ def title_generation_template(
return template
def follow_up_generation_template(
template: str, messages: list[dict], user: Optional[Any] = None
) -> str:
def follow_up_generation_template(template: str, messages: list[dict], user: Optional[Any] = None) -> str:
prompt = get_last_user_message(messages)
template = replace_prompt_variable(template, prompt)
template = replace_messages_variable(template, messages)
@@ -332,9 +297,7 @@ def follow_up_generation_template(
return template
def tags_generation_template(
template: str, messages: list[dict], user: Optional[Any] = None
) -> str:
def tags_generation_template(template: str, messages: list[dict], user: Optional[Any] = None) -> str:
prompt = get_last_user_message(messages)
template = replace_prompt_variable(template, prompt)
template = replace_messages_variable(template, messages)
@@ -343,9 +306,7 @@ def tags_generation_template(
return template
def image_prompt_generation_template(
template: str, messages: list[dict], user: Optional[Any] = None
) -> str:
def image_prompt_generation_template(template: str, messages: list[dict], user: Optional[Any] = None) -> str:
prompt = get_last_user_message(messages)
template = replace_prompt_variable(template, prompt)
template = replace_messages_variable(template, messages)
@@ -354,9 +315,7 @@ def image_prompt_generation_template(
return template
def emoji_generation_template(
template: str, prompt: str, user: Optional[Any] = None
) -> str:
def emoji_generation_template(template: str, prompt: str, user: Optional[Any] = None) -> str:
template = replace_prompt_variable(template, prompt)
template = prompt_template(template, user)
@@ -370,7 +329,7 @@ def autocomplete_generation_template(
type: Optional[str] = None,
user: Optional[Any] = None,
) -> str:
template = template.replace("{{TYPE}}", type if type else "")
template = template.replace('{{TYPE}}', type if type else '')
template = replace_prompt_variable(template, prompt)
template = replace_messages_variable(template, messages)
@@ -378,9 +337,7 @@ def autocomplete_generation_template(
return template
def query_generation_template(
template: str, messages: list[dict], user: Optional[Any] = None
) -> str:
def query_generation_template(template: str, messages: list[dict], user: Optional[Any] = None) -> str:
prompt = get_last_user_message(messages)
template = replace_prompt_variable(template, prompt)
template = replace_messages_variable(template, messages)
@@ -389,16 +346,14 @@ def query_generation_template(
return template
def moa_response_generation_template(
template: str, prompt: str, responses: list[str]
) -> str:
def moa_response_generation_template(template: str, prompt: str, responses: list[str]) -> str:
def replacement_function(match):
full_match = match.group(0)
start_length = match.group(1)
end_length = match.group(2)
middle_length = match.group(3)
if full_match == "{{prompt}}":
if full_match == '{{prompt}}':
return prompt
elif start_length is not None:
return prompt[: int(start_length)]
@@ -410,22 +365,22 @@ def moa_response_generation_template(
return prompt
start = prompt[: math.ceil(middle_length / 2)]
end = prompt[-math.floor(middle_length / 2) :]
return f"{start}...{end}"
return ""
return f'{start}...{end}'
return ''
template = re.sub(
r"{{prompt}}|{{prompt:start:(\d+)}}|{{prompt:end:(\d+)}}|{{prompt:middletruncate:(\d+)}}",
r'{{prompt}}|{{prompt:start:(\d+)}}|{{prompt:end:(\d+)}}|{{prompt:middletruncate:(\d+)}}',
replacement_function,
template,
)
responses = [f'"""{response}"""' for response in responses]
responses = "\n\n".join(responses)
responses = '\n\n'.join(responses)
template = template.replace("{{responses}}", responses)
template = template.replace('{{responses}}', responses)
return template
def tools_function_calling_generation_template(template: str, tools_specs: str) -> str:
template = template.replace("{{TOOLS}}", tools_specs)
template = template.replace('{{TOOLS}}', tools_specs)
return template