123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339 |
- import logging
- import math
- import re
- from datetime import datetime
- from typing import Optional
- import uuid
- from open_webui.utils.misc import get_last_user_message, get_messages_content
- from open_webui.env import SRC_LOG_LEVELS
- from open_webui.config import DEFAULT_RAG_TEMPLATE
- log = logging.getLogger(__name__)
- log.setLevel(SRC_LOG_LEVELS["RAG"])
- def get_task_model_id(
- default_model_id: str, task_model: str, task_model_external: str, models
- ) -> str:
- # Set the task model
- task_model_id = default_model_id
- # Check if the user has a custom task model and use that model
- if models[task_model_id].get("owned_by") == "ollama":
- if task_model and task_model in models:
- task_model_id = task_model
- else:
- if task_model_external and task_model_external in models:
- task_model_id = task_model_external
- return task_model_id
- def prompt_variables_template(template: str, variables: dict[str, str]) -> str:
- for variable, value in variables.items():
- template = template.replace(variable, value)
- return template
- def prompt_template(
- template: str, user_name: Optional[str] = None, user_location: Optional[str] = None
- ) -> str:
- # Get the current date
- current_date = datetime.now()
- # Format the date to YYYY-MM-DD
- formatted_date = current_date.strftime("%Y-%m-%d")
- formatted_time = current_date.strftime("%I:%M:%S %p")
- formatted_weekday = current_date.strftime("%A")
- template = template.replace("{{CURRENT_DATE}}", formatted_date)
- template = template.replace("{{CURRENT_TIME}}", formatted_time)
- template = template.replace(
- "{{CURRENT_DATETIME}}", f"{formatted_date} {formatted_time}"
- )
- template = template.replace("{{CURRENT_WEEKDAY}}", formatted_weekday)
- if user_name:
- # Replace {{USER_NAME}} in the template with the user's name
- template = template.replace("{{USER_NAME}}", user_name)
- else:
- # Replace {{USER_NAME}} in the template with "Unknown"
- template = template.replace("{{USER_NAME}}", "Unknown")
- if user_location:
- # Replace {{USER_LOCATION}} in the template with the current location
- template = template.replace("{{USER_LOCATION}}", user_location)
- else:
- # Replace {{USER_LOCATION}} in the template with "Unknown"
- template = template.replace("{{USER_LOCATION}}", "Unknown")
- return template
- def replace_prompt_variable(template: str, prompt: str) -> str:
- def replacement_function(match):
- full_match = match.group(
- 0
- ).lower() # Normalize to lowercase for consistent handling
- start_length = match.group(1)
- end_length = match.group(2)
- middle_length = match.group(3)
- if full_match == "{{prompt}}":
- return prompt
- elif start_length is not None:
- return prompt[: int(start_length)]
- elif end_length is not None:
- return prompt[-int(end_length) :]
- elif middle_length is not None:
- middle_length = int(middle_length)
- if len(prompt) <= middle_length:
- return prompt
- start = prompt[: math.ceil(middle_length / 2)]
- end = prompt[-math.floor(middle_length / 2) :]
- return f"{start}...{end}"
- return ""
- # Updated regex pattern to make it case-insensitive with the `(?i)` flag
- pattern = r"(?i){{prompt}}|{{prompt:start:(\d+)}}|{{prompt:end:(\d+)}}|{{prompt:middletruncate:(\d+)}}"
- template = re.sub(pattern, replacement_function, template)
- return template
- def replace_messages_variable(
- template: str, messages: Optional[list[dict]] = None
- ) -> str:
- def replacement_function(match):
- full_match = match.group(0)
- start_length = match.group(1)
- end_length = match.group(2)
- middle_length = match.group(3)
- # If messages is None, handle it as an empty list
- if messages is None:
- return ""
- # Process messages based on the number of messages required
- if full_match == "{{MESSAGES}}":
- return get_messages_content(messages)
- elif start_length is not None:
- return get_messages_content(messages[: int(start_length)])
- elif end_length is not None:
- return get_messages_content(messages[-int(end_length) :])
- elif middle_length is not None:
- mid = int(middle_length)
- if len(messages) <= mid:
- return get_messages_content(messages)
- # Handle middle truncation: split to get start and end portions of the messages list
- half = mid // 2
- start_msgs = messages[:half]
- end_msgs = messages[-half:] if mid % 2 == 0 else messages[-(half + 1) :]
- formatted_start = get_messages_content(start_msgs)
- formatted_end = get_messages_content(end_msgs)
- return f"{formatted_start}\n{formatted_end}"
- return ""
- template = re.sub(
- r"{{MESSAGES}}|{{MESSAGES:START:(\d+)}}|{{MESSAGES:END:(\d+)}}|{{MESSAGES:MIDDLETRUNCATE:(\d+)}}",
- replacement_function,
- template,
- )
- return template
- # {{prompt:middletruncate:8000}}
- def rag_template(template: str, context: str, query: str):
- if template.strip() == "":
- template = DEFAULT_RAG_TEMPLATE
- if "[context]" not in template and "{{CONTEXT}}" not in template:
- log.debug(
- "WARNING: The RAG template does not contain the '[context]' or '{{CONTEXT}}' placeholder."
- )
- if "<context>" in context and "</context>" in context:
- log.debug(
- "WARNING: Potential prompt injection attack: the RAG "
- "context contains '<context>' and '</context>'. This might be "
- "nothing, or the user might be trying to hack something."
- )
- query_placeholders = []
- if "[query]" in context:
- query_placeholder = "{{QUERY" + str(uuid.uuid4()) + "}}"
- template = template.replace("[query]", query_placeholder)
- query_placeholders.append(query_placeholder)
- if "{{QUERY}}" in context:
- query_placeholder = "{{QUERY" + str(uuid.uuid4()) + "}}"
- template = template.replace("{{QUERY}}", query_placeholder)
- query_placeholders.append(query_placeholder)
- template = template.replace("[context]", context)
- template = template.replace("{{CONTEXT}}", context)
- template = template.replace("[query]", query)
- template = template.replace("{{QUERY}}", query)
- for query_placeholder in query_placeholders:
- template = template.replace(query_placeholder, query)
- return template
- def title_generation_template(
- template: str, messages: list[dict], user: Optional[dict] = None
- ) -> str:
- prompt = get_last_user_message(messages)
- template = replace_prompt_variable(template, prompt)
- template = replace_messages_variable(template, messages)
- template = prompt_template(
- template,
- **(
- {"user_name": user.get("name"), "user_location": user.get("location")}
- if user
- else {}
- ),
- )
- return template
- def tags_generation_template(
- template: str, messages: list[dict], user: Optional[dict] = None
- ) -> str:
- prompt = get_last_user_message(messages)
- template = replace_prompt_variable(template, prompt)
- template = replace_messages_variable(template, messages)
- template = prompt_template(
- template,
- **(
- {"user_name": user.get("name"), "user_location": user.get("location")}
- if user
- else {}
- ),
- )
- return template
- def image_prompt_generation_template(
- template: str, messages: list[dict], user: Optional[dict] = None
- ) -> str:
- prompt = get_last_user_message(messages)
- template = replace_prompt_variable(template, prompt)
- template = replace_messages_variable(template, messages)
- template = prompt_template(
- template,
- **(
- {"user_name": user.get("name"), "user_location": user.get("location")}
- if user
- else {}
- ),
- )
- return template
- def emoji_generation_template(
- template: str, prompt: str, user: Optional[dict] = None
- ) -> str:
- template = replace_prompt_variable(template, prompt)
- template = prompt_template(
- template,
- **(
- {"user_name": user.get("name"), "user_location": user.get("location")}
- if user
- else {}
- ),
- )
- return template
- def autocomplete_generation_template(
- template: str,
- prompt: str,
- messages: Optional[list[dict]] = None,
- type: Optional[str] = None,
- user: Optional[dict] = None,
- ) -> str:
- template = template.replace("{{TYPE}}", type if type else "")
- template = replace_prompt_variable(template, prompt)
- template = replace_messages_variable(template, messages)
- template = prompt_template(
- template,
- **(
- {"user_name": user.get("name"), "user_location": user.get("location")}
- if user
- else {}
- ),
- )
- return template
- def query_generation_template(
- template: str, messages: list[dict], user: Optional[dict] = None
- ) -> str:
- prompt = get_last_user_message(messages)
- template = replace_prompt_variable(template, prompt)
- template = replace_messages_variable(template, messages)
- template = prompt_template(
- template,
- **(
- {"user_name": user.get("name"), "user_location": user.get("location")}
- if user
- else {}
- ),
- )
- return template
- def moa_response_generation_template(
- template: str, prompt: str, responses: list[str]
- ) -> str:
- def replacement_function(match):
- full_match = match.group(0)
- start_length = match.group(1)
- end_length = match.group(2)
- middle_length = match.group(3)
- if full_match == "{{prompt}}":
- return prompt
- elif start_length is not None:
- return prompt[: int(start_length)]
- elif end_length is not None:
- return prompt[-int(end_length) :]
- elif middle_length is not None:
- middle_length = int(middle_length)
- if len(prompt) <= middle_length:
- return prompt
- start = prompt[: math.ceil(middle_length / 2)]
- end = prompt[-math.floor(middle_length / 2) :]
- return f"{start}...{end}"
- return ""
- template = re.sub(
- r"{{prompt}}|{{prompt:start:(\d+)}}|{{prompt:end:(\d+)}}|{{prompt:middletruncate:(\d+)}}",
- replacement_function,
- template,
- )
- responses = [f'"""{response}"""' for response in responses]
- responses = "\n\n".join(responses)
- template = template.replace("{{responses}}", responses)
- return template
- def tools_function_calling_generation_template(template: str, tools_specs: str) -> str:
- template = template.replace("{{TOOLS}}", tools_specs)
- return template
|