task.py 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349
  1. import logging
  2. import math
  3. import re
  4. from datetime import datetime
  5. from typing import Optional, Any
  6. import uuid
  7. from open_webui.utils.misc import get_last_user_message, get_messages_content
  8. from open_webui.env import SRC_LOG_LEVELS
  9. from open_webui.config import DEFAULT_RAG_TEMPLATE
  10. log = logging.getLogger(__name__)
  11. log.setLevel(SRC_LOG_LEVELS["RAG"])
  12. def get_task_model_id(
  13. default_model_id: str, task_model: str, task_model_external: str, models
  14. ) -> str:
  15. # Set the task model
  16. task_model_id = default_model_id
  17. # Check if the user has a custom task model and use that model
  18. if models[task_model_id].get("connection_type") == "local":
  19. if task_model and task_model in models:
  20. task_model_id = task_model
  21. else:
  22. if task_model_external and task_model_external in models:
  23. task_model_id = task_model_external
  24. return task_model_id
  25. def prompt_variables_template(template: str, variables: dict[str, str]) -> str:
  26. for variable, value in variables.items():
  27. template = template.replace(variable, value)
  28. return template
  29. def prompt_template(template: str, user: Optional[Any] = None) -> str:
  30. USER_VARIABLES = {}
  31. if user:
  32. if hasattr(user, "model_dump"):
  33. user = user.model_dump()
  34. if isinstance(user, dict):
  35. user_info = user.get("info", {}) or {}
  36. birth_date = user.get("date_of_birth")
  37. age = None
  38. if birth_date:
  39. try:
  40. # If birth_date is str, convert to datetime
  41. if isinstance(birth_date, str):
  42. birth_date = datetime.strptime(birth_date, "%Y-%m-%d")
  43. today = datetime.now()
  44. age = (
  45. today.year
  46. - birth_date.year
  47. - (
  48. (today.month, today.day)
  49. < (birth_date.month, birth_date.day)
  50. )
  51. )
  52. except Exception as e:
  53. pass
  54. USER_VARIABLES = {
  55. "name": str(user.get("name")),
  56. "location": str(user_info.get("location")),
  57. "bio": str(user.get("bio")),
  58. "gender": str(user.get("gender")),
  59. "birth_date": str(birth_date),
  60. "age": str(age),
  61. }
  62. # Get the current date
  63. current_date = datetime.now()
  64. # Format the date to YYYY-MM-DD
  65. formatted_date = current_date.strftime("%Y-%m-%d")
  66. formatted_time = current_date.strftime("%I:%M:%S %p")
  67. formatted_weekday = current_date.strftime("%A")
  68. template = template.replace("{{CURRENT_DATE}}", formatted_date)
  69. template = template.replace("{{CURRENT_TIME}}", formatted_time)
  70. template = template.replace(
  71. "{{CURRENT_DATETIME}}", f"{formatted_date} {formatted_time}"
  72. )
  73. template = template.replace("{{CURRENT_WEEKDAY}}", formatted_weekday)
  74. template = template.replace("{{USER_NAME}}", USER_VARIABLES.get("name", "Unknown"))
  75. template = template.replace("{{USER_BIO}}", USER_VARIABLES.get("bio", "Unknown"))
  76. template = template.replace(
  77. "{{USER_GENDER}}", USER_VARIABLES.get("gender", "Unknown")
  78. )
  79. template = template.replace(
  80. "{{USER_BIRTH_DATE}}", USER_VARIABLES.get("birth_date", "Unknown")
  81. )
  82. template = template.replace(
  83. "{{USER_AGE}}", str(USER_VARIABLES.get("age", "Unknown"))
  84. )
  85. template = template.replace(
  86. "{{USER_LOCATION}}", USER_VARIABLES.get("location", "Unknown")
  87. )
  88. return template
  89. def replace_prompt_variable(template: str, prompt: str) -> str:
  90. def replacement_function(match):
  91. full_match = match.group(
  92. 0
  93. ).lower() # Normalize to lowercase for consistent handling
  94. start_length = match.group(1)
  95. end_length = match.group(2)
  96. middle_length = match.group(3)
  97. if full_match == "{{prompt}}":
  98. return prompt
  99. elif start_length is not None:
  100. return prompt[: int(start_length)]
  101. elif end_length is not None:
  102. return prompt[-int(end_length) :]
  103. elif middle_length is not None:
  104. middle_length = int(middle_length)
  105. if len(prompt) <= middle_length:
  106. return prompt
  107. start = prompt[: math.ceil(middle_length / 2)]
  108. end = prompt[-math.floor(middle_length / 2) :]
  109. return f"{start}...{end}"
  110. return ""
  111. # Updated regex pattern to make it case-insensitive with the `(?i)` flag
  112. pattern = r"(?i){{prompt}}|{{prompt:start:(\d+)}}|{{prompt:end:(\d+)}}|{{prompt:middletruncate:(\d+)}}"
  113. template = re.sub(pattern, replacement_function, template)
  114. return template
  115. def replace_messages_variable(
  116. template: str, messages: Optional[list[dict]] = None
  117. ) -> str:
  118. def replacement_function(match):
  119. full_match = match.group(0)
  120. start_length = match.group(1)
  121. end_length = match.group(2)
  122. middle_length = match.group(3)
  123. # If messages is None, handle it as an empty list
  124. if messages is None:
  125. return ""
  126. # Process messages based on the number of messages required
  127. if full_match == "{{MESSAGES}}":
  128. return get_messages_content(messages)
  129. elif start_length is not None:
  130. return get_messages_content(messages[: int(start_length)])
  131. elif end_length is not None:
  132. return get_messages_content(messages[-int(end_length) :])
  133. elif middle_length is not None:
  134. mid = int(middle_length)
  135. if len(messages) <= mid:
  136. return get_messages_content(messages)
  137. # Handle middle truncation: split to get start and end portions of the messages list
  138. half = mid // 2
  139. start_msgs = messages[:half]
  140. end_msgs = messages[-half:] if mid % 2 == 0 else messages[-(half + 1) :]
  141. formatted_start = get_messages_content(start_msgs)
  142. formatted_end = get_messages_content(end_msgs)
  143. return f"{formatted_start}\n{formatted_end}"
  144. return ""
  145. template = re.sub(
  146. r"{{MESSAGES}}|{{MESSAGES:START:(\d+)}}|{{MESSAGES:END:(\d+)}}|{{MESSAGES:MIDDLETRUNCATE:(\d+)}}",
  147. replacement_function,
  148. template,
  149. )
  150. return template
  151. # {{prompt:middletruncate:8000}}
  152. def rag_template(template: str, context: str, query: str):
  153. if template.strip() == "":
  154. template = DEFAULT_RAG_TEMPLATE
  155. template = prompt_template(template)
  156. if "[context]" not in template and "{{CONTEXT}}" not in template:
  157. log.debug(
  158. "WARNING: The RAG template does not contain the '[context]' or '{{CONTEXT}}' placeholder."
  159. )
  160. if "<context>" in context and "</context>" in context:
  161. log.debug(
  162. "WARNING: Potential prompt injection attack: the RAG "
  163. "context contains '<context>' and '</context>'. This might be "
  164. "nothing, or the user might be trying to hack something."
  165. )
  166. query_placeholders = []
  167. if "[query]" in context:
  168. query_placeholder = "{{QUERY" + str(uuid.uuid4()) + "}}"
  169. template = template.replace("[query]", query_placeholder)
  170. query_placeholders.append(query_placeholder)
  171. if "{{QUERY}}" in context:
  172. query_placeholder = "{{QUERY" + str(uuid.uuid4()) + "}}"
  173. template = template.replace("{{QUERY}}", query_placeholder)
  174. query_placeholders.append(query_placeholder)
  175. template = template.replace("[context]", context)
  176. template = template.replace("{{CONTEXT}}", context)
  177. template = template.replace("[query]", query)
  178. template = template.replace("{{QUERY}}", query)
  179. for query_placeholder in query_placeholders:
  180. template = template.replace(query_placeholder, query)
  181. return template
  182. def title_generation_template(
  183. template: str, messages: list[dict], user: Optional[Any] = None
  184. ) -> str:
  185. prompt = get_last_user_message(messages)
  186. template = replace_prompt_variable(template, prompt)
  187. template = replace_messages_variable(template, messages)
  188. template = prompt_template(template, user)
  189. return template
  190. def follow_up_generation_template(
  191. template: str, messages: list[dict], user: Optional[Any] = None
  192. ) -> str:
  193. prompt = get_last_user_message(messages)
  194. template = replace_prompt_variable(template, prompt)
  195. template = replace_messages_variable(template, messages)
  196. template = prompt_template(template, user)
  197. return template
  198. def tags_generation_template(
  199. template: str, messages: list[dict], user: Optional[Any] = None
  200. ) -> str:
  201. prompt = get_last_user_message(messages)
  202. template = replace_prompt_variable(template, prompt)
  203. template = replace_messages_variable(template, messages)
  204. template = prompt_template(template, user)
  205. return template
  206. def image_prompt_generation_template(
  207. template: str, messages: list[dict], user: Optional[Any] = None
  208. ) -> str:
  209. prompt = get_last_user_message(messages)
  210. template = replace_prompt_variable(template, prompt)
  211. template = replace_messages_variable(template, messages)
  212. template = prompt_template(template, user)
  213. return template
  214. def emoji_generation_template(
  215. template: str, prompt: str, user: Optional[Any] = None
  216. ) -> str:
  217. template = replace_prompt_variable(template, prompt)
  218. template = prompt_template(template, user)
  219. return template
  220. def autocomplete_generation_template(
  221. template: str,
  222. prompt: str,
  223. messages: Optional[list[dict]] = None,
  224. type: Optional[str] = None,
  225. user: Optional[Any] = None,
  226. ) -> str:
  227. template = template.replace("{{TYPE}}", type if type else "")
  228. template = replace_prompt_variable(template, prompt)
  229. template = replace_messages_variable(template, messages)
  230. template = prompt_template(template, user)
  231. return template
  232. def query_generation_template(
  233. template: str, messages: list[dict], user: Optional[Any] = None
  234. ) -> str:
  235. prompt = get_last_user_message(messages)
  236. template = replace_prompt_variable(template, prompt)
  237. template = replace_messages_variable(template, messages)
  238. template = prompt_template(template, user)
  239. return template
  240. def moa_response_generation_template(
  241. template: str, prompt: str, responses: list[str]
  242. ) -> str:
  243. def replacement_function(match):
  244. full_match = match.group(0)
  245. start_length = match.group(1)
  246. end_length = match.group(2)
  247. middle_length = match.group(3)
  248. if full_match == "{{prompt}}":
  249. return prompt
  250. elif start_length is not None:
  251. return prompt[: int(start_length)]
  252. elif end_length is not None:
  253. return prompt[-int(end_length) :]
  254. elif middle_length is not None:
  255. middle_length = int(middle_length)
  256. if len(prompt) <= middle_length:
  257. return prompt
  258. start = prompt[: math.ceil(middle_length / 2)]
  259. end = prompt[-math.floor(middle_length / 2) :]
  260. return f"{start}...{end}"
  261. return ""
  262. template = re.sub(
  263. r"{{prompt}}|{{prompt:start:(\d+)}}|{{prompt:end:(\d+)}}|{{prompt:middletruncate:(\d+)}}",
  264. replacement_function,
  265. template,
  266. )
  267. responses = [f'"""{response}"""' for response in responses]
  268. responses = "\n\n".join(responses)
  269. template = template.replace("{{responses}}", responses)
  270. return template
  271. def tools_function_calling_generation_template(template: str, tools_specs: str) -> str:
  272. template = template.replace("{{TOOLS}}", tools_specs)
  273. return template