task.py 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345
  1. import logging
  2. import math
  3. import re
  4. from datetime import datetime
  5. from typing import Optional, Any
  6. import uuid
  7. from open_webui.utils.misc import get_last_user_message, get_messages_content
  8. from open_webui.env import SRC_LOG_LEVELS
  9. from open_webui.config import DEFAULT_RAG_TEMPLATE
# Module-level logger for this file; its level is taken from the "RAG" entry
# of SRC_LOG_LEVELS.
log = logging.getLogger(__name__)
log.setLevel(SRC_LOG_LEVELS["RAG"])
  12. def get_task_model_id(
  13. default_model_id: str, task_model: str, task_model_external: str, models
  14. ) -> str:
  15. # Set the task model
  16. task_model_id = default_model_id
  17. # Check if the user has a custom task model and use that model
  18. if models[task_model_id].get("connection_type") == "local":
  19. if task_model and task_model in models:
  20. task_model_id = task_model
  21. else:
  22. if task_model_external and task_model_external in models:
  23. task_model_id = task_model_external
  24. return task_model_id
  25. def prompt_variables_template(template: str, variables: dict[str, str]) -> str:
  26. for variable, value in variables.items():
  27. template = template.replace(variable, value)
  28. return template
  29. def prompt_template(template: str, user: Optional[Any] = None) -> str:
  30. if hasattr(user, "model_dump"):
  31. user = user.model_dump()
  32. USER_VARIABLES = {}
  33. if isinstance(user, dict):
  34. birth_date = user.get("date_of_birth")
  35. age = None
  36. if birth_date:
  37. try:
  38. # If birth_date is str, convert to datetime
  39. if isinstance(birth_date, str):
  40. birth_date = datetime.strptime(birth_date, "%Y-%m-%d")
  41. today = datetime.now()
  42. age = (
  43. today.year
  44. - birth_date.year
  45. - ((today.month, today.day) < (birth_date.month, birth_date.day))
  46. )
  47. except Exception as e:
  48. pass
  49. USER_VARIABLES = {
  50. "name": str(user.get("name")),
  51. "location": str(user.get("info", {}).get("location")),
  52. "bio": str(user.get("bio")),
  53. "gender": str(user.get("gender")),
  54. "birth_date": str(birth_date),
  55. "age": str(age),
  56. }
  57. print(USER_VARIABLES)
  58. # Get the current date
  59. current_date = datetime.now()
  60. # Format the date to YYYY-MM-DD
  61. formatted_date = current_date.strftime("%Y-%m-%d")
  62. formatted_time = current_date.strftime("%I:%M:%S %p")
  63. formatted_weekday = current_date.strftime("%A")
  64. template = template.replace("{{CURRENT_DATE}}", formatted_date)
  65. template = template.replace("{{CURRENT_TIME}}", formatted_time)
  66. template = template.replace(
  67. "{{CURRENT_DATETIME}}", f"{formatted_date} {formatted_time}"
  68. )
  69. template = template.replace("{{CURRENT_WEEKDAY}}", formatted_weekday)
  70. template = template.replace("{{USER_NAME}}", USER_VARIABLES.get("name", "Unknown"))
  71. template = template.replace("{{USER_BIO}}", USER_VARIABLES.get("bio", "Unknown"))
  72. template = template.replace(
  73. "{{USER_GENDER}}", USER_VARIABLES.get("gender", "Unknown")
  74. )
  75. template = template.replace(
  76. "{{USER_BIRTH_DATE}}", USER_VARIABLES.get("birth_date", "Unknown")
  77. )
  78. template = template.replace(
  79. "{{USER_AGE}}", str(USER_VARIABLES.get("age", "Unknown"))
  80. )
  81. template = template.replace(
  82. "{{USER_LOCATION}}", USER_VARIABLES.get("location", "Unknown")
  83. )
  84. return template
  85. def replace_prompt_variable(template: str, prompt: str) -> str:
  86. def replacement_function(match):
  87. full_match = match.group(
  88. 0
  89. ).lower() # Normalize to lowercase for consistent handling
  90. start_length = match.group(1)
  91. end_length = match.group(2)
  92. middle_length = match.group(3)
  93. if full_match == "{{prompt}}":
  94. return prompt
  95. elif start_length is not None:
  96. return prompt[: int(start_length)]
  97. elif end_length is not None:
  98. return prompt[-int(end_length) :]
  99. elif middle_length is not None:
  100. middle_length = int(middle_length)
  101. if len(prompt) <= middle_length:
  102. return prompt
  103. start = prompt[: math.ceil(middle_length / 2)]
  104. end = prompt[-math.floor(middle_length / 2) :]
  105. return f"{start}...{end}"
  106. return ""
  107. # Updated regex pattern to make it case-insensitive with the `(?i)` flag
  108. pattern = r"(?i){{prompt}}|{{prompt:start:(\d+)}}|{{prompt:end:(\d+)}}|{{prompt:middletruncate:(\d+)}}"
  109. template = re.sub(pattern, replacement_function, template)
  110. return template
  111. def replace_messages_variable(
  112. template: str, messages: Optional[list[dict]] = None
  113. ) -> str:
  114. def replacement_function(match):
  115. full_match = match.group(0)
  116. start_length = match.group(1)
  117. end_length = match.group(2)
  118. middle_length = match.group(3)
  119. # If messages is None, handle it as an empty list
  120. if messages is None:
  121. return ""
  122. # Process messages based on the number of messages required
  123. if full_match == "{{MESSAGES}}":
  124. return get_messages_content(messages)
  125. elif start_length is not None:
  126. return get_messages_content(messages[: int(start_length)])
  127. elif end_length is not None:
  128. return get_messages_content(messages[-int(end_length) :])
  129. elif middle_length is not None:
  130. mid = int(middle_length)
  131. if len(messages) <= mid:
  132. return get_messages_content(messages)
  133. # Handle middle truncation: split to get start and end portions of the messages list
  134. half = mid // 2
  135. start_msgs = messages[:half]
  136. end_msgs = messages[-half:] if mid % 2 == 0 else messages[-(half + 1) :]
  137. formatted_start = get_messages_content(start_msgs)
  138. formatted_end = get_messages_content(end_msgs)
  139. return f"{formatted_start}\n{formatted_end}"
  140. return ""
  141. template = re.sub(
  142. r"{{MESSAGES}}|{{MESSAGES:START:(\d+)}}|{{MESSAGES:END:(\d+)}}|{{MESSAGES:MIDDLETRUNCATE:(\d+)}}",
  143. replacement_function,
  144. template,
  145. )
  146. return template
  147. # {{prompt:middletruncate:8000}}
  148. def rag_template(template: str, context: str, query: str):
  149. if template.strip() == "":
  150. template = DEFAULT_RAG_TEMPLATE
  151. template = prompt_template(template)
  152. if "[context]" not in template and "{{CONTEXT}}" not in template:
  153. log.debug(
  154. "WARNING: The RAG template does not contain the '[context]' or '{{CONTEXT}}' placeholder."
  155. )
  156. if "<context>" in context and "</context>" in context:
  157. log.debug(
  158. "WARNING: Potential prompt injection attack: the RAG "
  159. "context contains '<context>' and '</context>'. This might be "
  160. "nothing, or the user might be trying to hack something."
  161. )
  162. query_placeholders = []
  163. if "[query]" in context:
  164. query_placeholder = "{{QUERY" + str(uuid.uuid4()) + "}}"
  165. template = template.replace("[query]", query_placeholder)
  166. query_placeholders.append(query_placeholder)
  167. if "{{QUERY}}" in context:
  168. query_placeholder = "{{QUERY" + str(uuid.uuid4()) + "}}"
  169. template = template.replace("{{QUERY}}", query_placeholder)
  170. query_placeholders.append(query_placeholder)
  171. template = template.replace("[context]", context)
  172. template = template.replace("{{CONTEXT}}", context)
  173. template = template.replace("[query]", query)
  174. template = template.replace("{{QUERY}}", query)
  175. for query_placeholder in query_placeholders:
  176. template = template.replace(query_placeholder, query)
  177. return template
  178. def title_generation_template(
  179. template: str, messages: list[dict], user: Optional[Any] = None
  180. ) -> str:
  181. prompt = get_last_user_message(messages)
  182. template = replace_prompt_variable(template, prompt)
  183. template = replace_messages_variable(template, messages)
  184. template = prompt_template(template, user)
  185. return template
  186. def follow_up_generation_template(
  187. template: str, messages: list[dict], user: Optional[Any] = None
  188. ) -> str:
  189. prompt = get_last_user_message(messages)
  190. template = replace_prompt_variable(template, prompt)
  191. template = replace_messages_variable(template, messages)
  192. template = prompt_template(template, user)
  193. return template
  194. def tags_generation_template(
  195. template: str, messages: list[dict], user: Optional[Any] = None
  196. ) -> str:
  197. prompt = get_last_user_message(messages)
  198. template = replace_prompt_variable(template, prompt)
  199. template = replace_messages_variable(template, messages)
  200. template = prompt_template(template, user)
  201. return template
  202. def image_prompt_generation_template(
  203. template: str, messages: list[dict], user: Optional[Any] = None
  204. ) -> str:
  205. prompt = get_last_user_message(messages)
  206. template = replace_prompt_variable(template, prompt)
  207. template = replace_messages_variable(template, messages)
  208. template = prompt_template(template, user)
  209. return template
  210. def emoji_generation_template(
  211. template: str, prompt: str, user: Optional[Any] = None
  212. ) -> str:
  213. template = replace_prompt_variable(template, prompt)
  214. template = prompt_template(template, user)
  215. return template
  216. def autocomplete_generation_template(
  217. template: str,
  218. prompt: str,
  219. messages: Optional[list[dict]] = None,
  220. type: Optional[str] = None,
  221. user: Optional[Any] = None,
  222. ) -> str:
  223. template = template.replace("{{TYPE}}", type if type else "")
  224. template = replace_prompt_variable(template, prompt)
  225. template = replace_messages_variable(template, messages)
  226. template = prompt_template(template, user)
  227. return template
  228. def query_generation_template(
  229. template: str, messages: list[dict], user: Optional[Any] = None
  230. ) -> str:
  231. prompt = get_last_user_message(messages)
  232. template = replace_prompt_variable(template, prompt)
  233. template = replace_messages_variable(template, messages)
  234. template = prompt_template(template, user)
  235. return template
  236. def moa_response_generation_template(
  237. template: str, prompt: str, responses: list[str]
  238. ) -> str:
  239. def replacement_function(match):
  240. full_match = match.group(0)
  241. start_length = match.group(1)
  242. end_length = match.group(2)
  243. middle_length = match.group(3)
  244. if full_match == "{{prompt}}":
  245. return prompt
  246. elif start_length is not None:
  247. return prompt[: int(start_length)]
  248. elif end_length is not None:
  249. return prompt[-int(end_length) :]
  250. elif middle_length is not None:
  251. middle_length = int(middle_length)
  252. if len(prompt) <= middle_length:
  253. return prompt
  254. start = prompt[: math.ceil(middle_length / 2)]
  255. end = prompt[-math.floor(middle_length / 2) :]
  256. return f"{start}...{end}"
  257. return ""
  258. template = re.sub(
  259. r"{{prompt}}|{{prompt:start:(\d+)}}|{{prompt:end:(\d+)}}|{{prompt:middletruncate:(\d+)}}",
  260. replacement_function,
  261. template,
  262. )
  263. responses = [f'"""{response}"""' for response in responses]
  264. responses = "\n\n".join(responses)
  265. template = template.replace("{{responses}}", responses)
  266. return template
  267. def tools_function_calling_generation_template(template: str, tools_specs: str) -> str:
  268. template = template.replace("{{TOOLS}}", tools_specs)
  269. return template