task.py 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348
  1. import logging
  2. import math
  3. import re
  4. from datetime import datetime
  5. from typing import Optional, Any
  6. import uuid
  7. from open_webui.utils.misc import get_last_user_message, get_messages_content
  8. from open_webui.env import SRC_LOG_LEVELS
  9. from open_webui.config import DEFAULT_RAG_TEMPLATE
# Module-level logger; its level is read from the "RAG" entry of SRC_LOG_LEVELS.
log = logging.getLogger(__name__)
log.setLevel(SRC_LOG_LEVELS["RAG"])
  12. def get_task_model_id(
  13. default_model_id: str, task_model: str, task_model_external: str, models
  14. ) -> str:
  15. # Set the task model
  16. task_model_id = default_model_id
  17. # Check if the user has a custom task model and use that model
  18. if models[task_model_id].get("connection_type") == "local":
  19. if task_model and task_model in models:
  20. task_model_id = task_model
  21. else:
  22. if task_model_external and task_model_external in models:
  23. task_model_id = task_model_external
  24. return task_model_id
  25. def prompt_variables_template(template: str, variables: dict[str, str]) -> str:
  26. for variable, value in variables.items():
  27. template = template.replace(variable, value)
  28. return template
  29. def prompt_template(template: str, user: Optional[Any] = None) -> str:
  30. USER_VARIABLES = {}
  31. if user:
  32. if hasattr(user, "model_dump"):
  33. user = user.model_dump()
  34. if isinstance(user, dict):
  35. birth_date = user.get("date_of_birth")
  36. age = None
  37. if birth_date:
  38. try:
  39. # If birth_date is str, convert to datetime
  40. if isinstance(birth_date, str):
  41. birth_date = datetime.strptime(birth_date, "%Y-%m-%d")
  42. today = datetime.now()
  43. age = (
  44. today.year
  45. - birth_date.year
  46. - (
  47. (today.month, today.day)
  48. < (birth_date.month, birth_date.day)
  49. )
  50. )
  51. except Exception as e:
  52. pass
  53. USER_VARIABLES = {
  54. "name": str(user.get("name")),
  55. "location": str(user.get("info", {}).get("location")),
  56. "bio": str(user.get("bio")),
  57. "gender": str(user.get("gender")),
  58. "birth_date": str(birth_date),
  59. "age": str(age),
  60. }
  61. # Get the current date
  62. current_date = datetime.now()
  63. # Format the date to YYYY-MM-DD
  64. formatted_date = current_date.strftime("%Y-%m-%d")
  65. formatted_time = current_date.strftime("%I:%M:%S %p")
  66. formatted_weekday = current_date.strftime("%A")
  67. template = template.replace("{{CURRENT_DATE}}", formatted_date)
  68. template = template.replace("{{CURRENT_TIME}}", formatted_time)
  69. template = template.replace(
  70. "{{CURRENT_DATETIME}}", f"{formatted_date} {formatted_time}"
  71. )
  72. template = template.replace("{{CURRENT_WEEKDAY}}", formatted_weekday)
  73. template = template.replace("{{USER_NAME}}", USER_VARIABLES.get("name", "Unknown"))
  74. template = template.replace("{{USER_BIO}}", USER_VARIABLES.get("bio", "Unknown"))
  75. template = template.replace(
  76. "{{USER_GENDER}}", USER_VARIABLES.get("gender", "Unknown")
  77. )
  78. template = template.replace(
  79. "{{USER_BIRTH_DATE}}", USER_VARIABLES.get("birth_date", "Unknown")
  80. )
  81. template = template.replace(
  82. "{{USER_AGE}}", str(USER_VARIABLES.get("age", "Unknown"))
  83. )
  84. template = template.replace(
  85. "{{USER_LOCATION}}", USER_VARIABLES.get("location", "Unknown")
  86. )
  87. return template
  88. def replace_prompt_variable(template: str, prompt: str) -> str:
  89. def replacement_function(match):
  90. full_match = match.group(
  91. 0
  92. ).lower() # Normalize to lowercase for consistent handling
  93. start_length = match.group(1)
  94. end_length = match.group(2)
  95. middle_length = match.group(3)
  96. if full_match == "{{prompt}}":
  97. return prompt
  98. elif start_length is not None:
  99. return prompt[: int(start_length)]
  100. elif end_length is not None:
  101. return prompt[-int(end_length) :]
  102. elif middle_length is not None:
  103. middle_length = int(middle_length)
  104. if len(prompt) <= middle_length:
  105. return prompt
  106. start = prompt[: math.ceil(middle_length / 2)]
  107. end = prompt[-math.floor(middle_length / 2) :]
  108. return f"{start}...{end}"
  109. return ""
  110. # Updated regex pattern to make it case-insensitive with the `(?i)` flag
  111. pattern = r"(?i){{prompt}}|{{prompt:start:(\d+)}}|{{prompt:end:(\d+)}}|{{prompt:middletruncate:(\d+)}}"
  112. template = re.sub(pattern, replacement_function, template)
  113. return template
  114. def replace_messages_variable(
  115. template: str, messages: Optional[list[dict]] = None
  116. ) -> str:
  117. def replacement_function(match):
  118. full_match = match.group(0)
  119. start_length = match.group(1)
  120. end_length = match.group(2)
  121. middle_length = match.group(3)
  122. # If messages is None, handle it as an empty list
  123. if messages is None:
  124. return ""
  125. # Process messages based on the number of messages required
  126. if full_match == "{{MESSAGES}}":
  127. return get_messages_content(messages)
  128. elif start_length is not None:
  129. return get_messages_content(messages[: int(start_length)])
  130. elif end_length is not None:
  131. return get_messages_content(messages[-int(end_length) :])
  132. elif middle_length is not None:
  133. mid = int(middle_length)
  134. if len(messages) <= mid:
  135. return get_messages_content(messages)
  136. # Handle middle truncation: split to get start and end portions of the messages list
  137. half = mid // 2
  138. start_msgs = messages[:half]
  139. end_msgs = messages[-half:] if mid % 2 == 0 else messages[-(half + 1) :]
  140. formatted_start = get_messages_content(start_msgs)
  141. formatted_end = get_messages_content(end_msgs)
  142. return f"{formatted_start}\n{formatted_end}"
  143. return ""
  144. template = re.sub(
  145. r"{{MESSAGES}}|{{MESSAGES:START:(\d+)}}|{{MESSAGES:END:(\d+)}}|{{MESSAGES:MIDDLETRUNCATE:(\d+)}}",
  146. replacement_function,
  147. template,
  148. )
  149. return template
  150. # {{prompt:middletruncate:8000}}
  151. def rag_template(template: str, context: str, query: str):
  152. if template.strip() == "":
  153. template = DEFAULT_RAG_TEMPLATE
  154. template = prompt_template(template)
  155. if "[context]" not in template and "{{CONTEXT}}" not in template:
  156. log.debug(
  157. "WARNING: The RAG template does not contain the '[context]' or '{{CONTEXT}}' placeholder."
  158. )
  159. if "<context>" in context and "</context>" in context:
  160. log.debug(
  161. "WARNING: Potential prompt injection attack: the RAG "
  162. "context contains '<context>' and '</context>'. This might be "
  163. "nothing, or the user might be trying to hack something."
  164. )
  165. query_placeholders = []
  166. if "[query]" in context:
  167. query_placeholder = "{{QUERY" + str(uuid.uuid4()) + "}}"
  168. template = template.replace("[query]", query_placeholder)
  169. query_placeholders.append(query_placeholder)
  170. if "{{QUERY}}" in context:
  171. query_placeholder = "{{QUERY" + str(uuid.uuid4()) + "}}"
  172. template = template.replace("{{QUERY}}", query_placeholder)
  173. query_placeholders.append(query_placeholder)
  174. template = template.replace("[context]", context)
  175. template = template.replace("{{CONTEXT}}", context)
  176. template = template.replace("[query]", query)
  177. template = template.replace("{{QUERY}}", query)
  178. for query_placeholder in query_placeholders:
  179. template = template.replace(query_placeholder, query)
  180. return template
  181. def title_generation_template(
  182. template: str, messages: list[dict], user: Optional[Any] = None
  183. ) -> str:
  184. prompt = get_last_user_message(messages)
  185. template = replace_prompt_variable(template, prompt)
  186. template = replace_messages_variable(template, messages)
  187. template = prompt_template(template, user)
  188. return template
  189. def follow_up_generation_template(
  190. template: str, messages: list[dict], user: Optional[Any] = None
  191. ) -> str:
  192. prompt = get_last_user_message(messages)
  193. template = replace_prompt_variable(template, prompt)
  194. template = replace_messages_variable(template, messages)
  195. template = prompt_template(template, user)
  196. return template
  197. def tags_generation_template(
  198. template: str, messages: list[dict], user: Optional[Any] = None
  199. ) -> str:
  200. prompt = get_last_user_message(messages)
  201. template = replace_prompt_variable(template, prompt)
  202. template = replace_messages_variable(template, messages)
  203. template = prompt_template(template, user)
  204. return template
  205. def image_prompt_generation_template(
  206. template: str, messages: list[dict], user: Optional[Any] = None
  207. ) -> str:
  208. prompt = get_last_user_message(messages)
  209. template = replace_prompt_variable(template, prompt)
  210. template = replace_messages_variable(template, messages)
  211. template = prompt_template(template, user)
  212. return template
  213. def emoji_generation_template(
  214. template: str, prompt: str, user: Optional[Any] = None
  215. ) -> str:
  216. template = replace_prompt_variable(template, prompt)
  217. template = prompt_template(template, user)
  218. return template
  219. def autocomplete_generation_template(
  220. template: str,
  221. prompt: str,
  222. messages: Optional[list[dict]] = None,
  223. type: Optional[str] = None,
  224. user: Optional[Any] = None,
  225. ) -> str:
  226. template = template.replace("{{TYPE}}", type if type else "")
  227. template = replace_prompt_variable(template, prompt)
  228. template = replace_messages_variable(template, messages)
  229. template = prompt_template(template, user)
  230. return template
  231. def query_generation_template(
  232. template: str, messages: list[dict], user: Optional[Any] = None
  233. ) -> str:
  234. prompt = get_last_user_message(messages)
  235. template = replace_prompt_variable(template, prompt)
  236. template = replace_messages_variable(template, messages)
  237. template = prompt_template(template, user)
  238. return template
  239. def moa_response_generation_template(
  240. template: str, prompt: str, responses: list[str]
  241. ) -> str:
  242. def replacement_function(match):
  243. full_match = match.group(0)
  244. start_length = match.group(1)
  245. end_length = match.group(2)
  246. middle_length = match.group(3)
  247. if full_match == "{{prompt}}":
  248. return prompt
  249. elif start_length is not None:
  250. return prompt[: int(start_length)]
  251. elif end_length is not None:
  252. return prompt[-int(end_length) :]
  253. elif middle_length is not None:
  254. middle_length = int(middle_length)
  255. if len(prompt) <= middle_length:
  256. return prompt
  257. start = prompt[: math.ceil(middle_length / 2)]
  258. end = prompt[-math.floor(middle_length / 2) :]
  259. return f"{start}...{end}"
  260. return ""
  261. template = re.sub(
  262. r"{{prompt}}|{{prompt:start:(\d+)}}|{{prompt:end:(\d+)}}|{{prompt:middletruncate:(\d+)}}",
  263. replacement_function,
  264. template,
  265. )
  266. responses = [f'"""{response}"""' for response in responses]
  267. responses = "\n\n".join(responses)
  268. template = template.replace("{{responses}}", responses)
  269. return template
  270. def tools_function_calling_generation_template(template: str, tools_specs: str) -> str:
  271. template = template.replace("{{TOOLS}}", tools_specs)
  272. return template