main.py 66 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971
  1. import asyncio
  2. import inspect
  3. import json
  4. import logging
  5. import mimetypes
  6. import os
  7. import shutil
  8. import sys
  9. import time
  10. import random
  11. from uuid import uuid4
  12. from contextlib import asynccontextmanager
  13. from urllib.parse import urlencode, parse_qs, urlparse
  14. from pydantic import BaseModel
  15. from sqlalchemy import text
  16. from typing import Optional
  17. from aiocache import cached
  18. import aiohttp
  19. import anyio.to_thread
  20. import requests
  21. from redis import Redis
  22. from fastapi import (
  23. Depends,
  24. FastAPI,
  25. File,
  26. Form,
  27. HTTPException,
  28. Request,
  29. UploadFile,
  30. status,
  31. applications,
  32. BackgroundTasks,
  33. )
  34. from fastapi.openapi.docs import get_swagger_ui_html
  35. from fastapi.middleware.cors import CORSMiddleware
  36. from fastapi.responses import FileResponse, JSONResponse, RedirectResponse
  37. from fastapi.staticfiles import StaticFiles
  38. from starlette_compress import CompressMiddleware
  39. from starlette.exceptions import HTTPException as StarletteHTTPException
  40. from starlette.middleware.base import BaseHTTPMiddleware
  41. from starlette.middleware.sessions import SessionMiddleware
  42. from starlette.responses import Response, StreamingResponse
  43. from starlette.datastructures import Headers
  44. from open_webui.utils import logger
  45. from open_webui.utils.audit import AuditLevel, AuditLoggingMiddleware
  46. from open_webui.utils.logger import start_logger
  47. from open_webui.socket.main import (
  48. app as socket_app,
  49. periodic_usage_pool_cleanup,
  50. get_event_emitter,
  51. get_models_in_use,
  52. get_active_user_ids,
  53. )
  54. from open_webui.routers import (
  55. audio,
  56. images,
  57. ollama,
  58. openai,
  59. retrieval,
  60. pipelines,
  61. tasks,
  62. auths,
  63. channels,
  64. chats,
  65. notes,
  66. folders,
  67. configs,
  68. groups,
  69. files,
  70. functions,
  71. memories,
  72. models,
  73. knowledge,
  74. prompts,
  75. evaluations,
  76. tools,
  77. users,
  78. utils,
  79. scim,
  80. )
  81. from open_webui.routers.retrieval import (
  82. get_embedding_function,
  83. get_reranking_function,
  84. get_ef,
  85. get_rf,
  86. )
  87. from open_webui.internal.db import Session, engine
  88. from open_webui.models.functions import Functions
  89. from open_webui.models.models import Models
  90. from open_webui.models.users import UserModel, Users
  91. from open_webui.models.chats import Chats
  92. from open_webui.config import (
  93. # Ollama
  94. ENABLE_OLLAMA_API,
  95. OLLAMA_BASE_URLS,
  96. OLLAMA_API_CONFIGS,
  97. # OpenAI
  98. ENABLE_OPENAI_API,
  99. ONEDRIVE_CLIENT_ID,
  100. ONEDRIVE_SHAREPOINT_URL,
  101. ONEDRIVE_SHAREPOINT_TENANT_ID,
  102. OPENAI_API_BASE_URLS,
  103. OPENAI_API_KEYS,
  104. OPENAI_API_CONFIGS,
  105. # Direct Connections
  106. ENABLE_DIRECT_CONNECTIONS,
  107. # Model list
  108. ENABLE_BASE_MODELS_CACHE,
  109. # Thread pool size for FastAPI/AnyIO
  110. THREAD_POOL_SIZE,
  111. # Tool Server Configs
  112. TOOL_SERVER_CONNECTIONS,
  113. # Code Execution
  114. ENABLE_CODE_EXECUTION,
  115. CODE_EXECUTION_ENGINE,
  116. CODE_EXECUTION_JUPYTER_URL,
  117. CODE_EXECUTION_JUPYTER_AUTH,
  118. CODE_EXECUTION_JUPYTER_AUTH_TOKEN,
  119. CODE_EXECUTION_JUPYTER_AUTH_PASSWORD,
  120. CODE_EXECUTION_JUPYTER_TIMEOUT,
  121. ENABLE_CODE_INTERPRETER,
  122. CODE_INTERPRETER_ENGINE,
  123. CODE_INTERPRETER_PROMPT_TEMPLATE,
  124. CODE_INTERPRETER_JUPYTER_URL,
  125. CODE_INTERPRETER_JUPYTER_AUTH,
  126. CODE_INTERPRETER_JUPYTER_AUTH_TOKEN,
  127. CODE_INTERPRETER_JUPYTER_AUTH_PASSWORD,
  128. CODE_INTERPRETER_JUPYTER_TIMEOUT,
  129. # Image
  130. AUTOMATIC1111_API_AUTH,
  131. AUTOMATIC1111_BASE_URL,
  132. AUTOMATIC1111_CFG_SCALE,
  133. AUTOMATIC1111_SAMPLER,
  134. AUTOMATIC1111_SCHEDULER,
  135. COMFYUI_BASE_URL,
  136. COMFYUI_API_KEY,
  137. COMFYUI_WORKFLOW,
  138. COMFYUI_WORKFLOW_NODES,
  139. ENABLE_IMAGE_GENERATION,
  140. ENABLE_IMAGE_PROMPT_GENERATION,
  141. IMAGE_GENERATION_ENGINE,
  142. IMAGE_GENERATION_MODEL,
  143. IMAGE_SIZE,
  144. IMAGE_STEPS,
  145. IMAGES_OPENAI_API_BASE_URL,
  146. IMAGES_OPENAI_API_KEY,
  147. IMAGES_GEMINI_API_BASE_URL,
  148. IMAGES_GEMINI_API_KEY,
  149. # Audio
  150. AUDIO_STT_ENGINE,
  151. AUDIO_STT_MODEL,
  152. AUDIO_STT_SUPPORTED_CONTENT_TYPES,
  153. AUDIO_STT_OPENAI_API_BASE_URL,
  154. AUDIO_STT_OPENAI_API_KEY,
  155. AUDIO_STT_AZURE_API_KEY,
  156. AUDIO_STT_AZURE_REGION,
  157. AUDIO_STT_AZURE_LOCALES,
  158. AUDIO_STT_AZURE_BASE_URL,
  159. AUDIO_STT_AZURE_MAX_SPEAKERS,
  160. AUDIO_TTS_API_KEY,
  161. AUDIO_TTS_ENGINE,
  162. AUDIO_TTS_MODEL,
  163. AUDIO_TTS_OPENAI_API_BASE_URL,
  164. AUDIO_TTS_OPENAI_API_KEY,
  165. AUDIO_TTS_SPLIT_ON,
  166. AUDIO_TTS_VOICE,
  167. AUDIO_TTS_AZURE_SPEECH_REGION,
  168. AUDIO_TTS_AZURE_SPEECH_BASE_URL,
  169. AUDIO_TTS_AZURE_SPEECH_OUTPUT_FORMAT,
  170. PLAYWRIGHT_WS_URL,
  171. PLAYWRIGHT_TIMEOUT,
  172. FIRECRAWL_API_BASE_URL,
  173. FIRECRAWL_API_KEY,
  174. WEB_LOADER_ENGINE,
  175. WEB_LOADER_CONCURRENT_REQUESTS,
  176. WHISPER_MODEL,
  177. WHISPER_VAD_FILTER,
  178. WHISPER_LANGUAGE,
  179. DEEPGRAM_API_KEY,
  180. WHISPER_MODEL_AUTO_UPDATE,
  181. WHISPER_MODEL_DIR,
  182. # Retrieval
  183. RAG_TEMPLATE,
  184. DEFAULT_RAG_TEMPLATE,
  185. RAG_FULL_CONTEXT,
  186. BYPASS_EMBEDDING_AND_RETRIEVAL,
  187. RAG_EMBEDDING_MODEL,
  188. RAG_EMBEDDING_MODEL_AUTO_UPDATE,
  189. RAG_EMBEDDING_MODEL_TRUST_REMOTE_CODE,
  190. RAG_RERANKING_ENGINE,
  191. RAG_RERANKING_MODEL,
  192. RAG_EXTERNAL_RERANKER_URL,
  193. RAG_EXTERNAL_RERANKER_API_KEY,
  194. RAG_RERANKING_MODEL_AUTO_UPDATE,
  195. RAG_RERANKING_MODEL_TRUST_REMOTE_CODE,
  196. RAG_EMBEDDING_ENGINE,
  197. RAG_EMBEDDING_BATCH_SIZE,
  198. RAG_TOP_K,
  199. RAG_TOP_K_RERANKER,
  200. RAG_RELEVANCE_THRESHOLD,
  201. RAG_HYBRID_BM25_WEIGHT,
  202. RAG_ALLOWED_FILE_EXTENSIONS,
  203. RAG_FILE_MAX_COUNT,
  204. RAG_FILE_MAX_SIZE,
  205. FILE_IMAGE_COMPRESSION_WIDTH,
  206. FILE_IMAGE_COMPRESSION_HEIGHT,
  207. RAG_OPENAI_API_BASE_URL,
  208. RAG_OPENAI_API_KEY,
  209. RAG_AZURE_OPENAI_BASE_URL,
  210. RAG_AZURE_OPENAI_API_KEY,
  211. RAG_AZURE_OPENAI_API_VERSION,
  212. RAG_OLLAMA_BASE_URL,
  213. RAG_OLLAMA_API_KEY,
  214. CHUNK_OVERLAP,
  215. CHUNK_SIZE,
  216. CONTENT_EXTRACTION_ENGINE,
  217. DATALAB_MARKER_API_KEY,
  218. DATALAB_MARKER_API_BASE_URL,
  219. DATALAB_MARKER_ADDITIONAL_CONFIG,
  220. DATALAB_MARKER_SKIP_CACHE,
  221. DATALAB_MARKER_FORCE_OCR,
  222. DATALAB_MARKER_PAGINATE,
  223. DATALAB_MARKER_STRIP_EXISTING_OCR,
  224. DATALAB_MARKER_DISABLE_IMAGE_EXTRACTION,
  225. DATALAB_MARKER_FORMAT_LINES,
  226. DATALAB_MARKER_OUTPUT_FORMAT,
  227. DATALAB_MARKER_USE_LLM,
  228. EXTERNAL_DOCUMENT_LOADER_URL,
  229. EXTERNAL_DOCUMENT_LOADER_API_KEY,
  230. TIKA_SERVER_URL,
  231. DOCLING_SERVER_URL,
  232. DOCLING_OCR_ENGINE,
  233. DOCLING_OCR_LANG,
  234. DOCLING_DO_PICTURE_DESCRIPTION,
  235. DOCLING_PICTURE_DESCRIPTION_MODE,
  236. DOCLING_PICTURE_DESCRIPTION_LOCAL,
  237. DOCLING_PICTURE_DESCRIPTION_API,
  238. DOCUMENT_INTELLIGENCE_ENDPOINT,
  239. DOCUMENT_INTELLIGENCE_KEY,
  240. MISTRAL_OCR_API_KEY,
  241. RAG_TEXT_SPLITTER,
  242. TIKTOKEN_ENCODING_NAME,
  243. PDF_EXTRACT_IMAGES,
  244. YOUTUBE_LOADER_LANGUAGE,
  245. YOUTUBE_LOADER_PROXY_URL,
  246. # Retrieval (Web Search)
  247. ENABLE_WEB_SEARCH,
  248. WEB_SEARCH_ENGINE,
  249. BYPASS_WEB_SEARCH_EMBEDDING_AND_RETRIEVAL,
  250. BYPASS_WEB_SEARCH_WEB_LOADER,
  251. WEB_SEARCH_RESULT_COUNT,
  252. WEB_SEARCH_CONCURRENT_REQUESTS,
  253. WEB_SEARCH_TRUST_ENV,
  254. WEB_SEARCH_DOMAIN_FILTER_LIST,
  255. JINA_API_KEY,
  256. SEARCHAPI_API_KEY,
  257. SEARCHAPI_ENGINE,
  258. SERPAPI_API_KEY,
  259. SERPAPI_ENGINE,
  260. SEARXNG_QUERY_URL,
  261. YACY_QUERY_URL,
  262. YACY_USERNAME,
  263. YACY_PASSWORD,
  264. SERPER_API_KEY,
  265. SERPLY_API_KEY,
  266. SERPSTACK_API_KEY,
  267. SERPSTACK_HTTPS,
  268. TAVILY_API_KEY,
  269. TAVILY_EXTRACT_DEPTH,
  270. BING_SEARCH_V7_ENDPOINT,
  271. BING_SEARCH_V7_SUBSCRIPTION_KEY,
  272. BRAVE_SEARCH_API_KEY,
  273. EXA_API_KEY,
  274. PERPLEXITY_API_KEY,
  275. PERPLEXITY_MODEL,
  276. PERPLEXITY_SEARCH_CONTEXT_USAGE,
  277. SOUGOU_API_SID,
  278. SOUGOU_API_SK,
  279. KAGI_SEARCH_API_KEY,
  280. MOJEEK_SEARCH_API_KEY,
  281. BOCHA_SEARCH_API_KEY,
  282. GOOGLE_PSE_API_KEY,
  283. GOOGLE_PSE_ENGINE_ID,
  284. GOOGLE_DRIVE_CLIENT_ID,
  285. GOOGLE_DRIVE_API_KEY,
  286. ONEDRIVE_CLIENT_ID,
  287. ONEDRIVE_SHAREPOINT_URL,
  288. ONEDRIVE_SHAREPOINT_TENANT_ID,
  289. ENABLE_RAG_HYBRID_SEARCH,
  290. ENABLE_RAG_LOCAL_WEB_FETCH,
  291. ENABLE_WEB_LOADER_SSL_VERIFICATION,
  292. ENABLE_GOOGLE_DRIVE_INTEGRATION,
  293. ENABLE_ONEDRIVE_INTEGRATION,
  294. UPLOAD_DIR,
  295. EXTERNAL_WEB_SEARCH_URL,
  296. EXTERNAL_WEB_SEARCH_API_KEY,
  297. EXTERNAL_WEB_LOADER_URL,
  298. EXTERNAL_WEB_LOADER_API_KEY,
  299. # WebUI
  300. WEBUI_AUTH,
  301. WEBUI_NAME,
  302. WEBUI_BANNERS,
  303. WEBHOOK_URL,
  304. ADMIN_EMAIL,
  305. SHOW_ADMIN_DETAILS,
  306. JWT_EXPIRES_IN,
  307. ENABLE_SIGNUP,
  308. ENABLE_LOGIN_FORM,
  309. ENABLE_API_KEY,
  310. ENABLE_API_KEY_ENDPOINT_RESTRICTIONS,
  311. API_KEY_ALLOWED_ENDPOINTS,
  312. ENABLE_CHANNELS,
  313. ENABLE_NOTES,
  314. ENABLE_COMMUNITY_SHARING,
  315. ENABLE_MESSAGE_RATING,
  316. ENABLE_USER_WEBHOOKS,
  317. ENABLE_EVALUATION_ARENA_MODELS,
  318. ENABLE_ADMIN_WORKSPACE_CONTENT_ACCESS,
  319. USER_PERMISSIONS,
  320. DEFAULT_USER_ROLE,
  321. PENDING_USER_OVERLAY_CONTENT,
  322. PENDING_USER_OVERLAY_TITLE,
  323. DEFAULT_PROMPT_SUGGESTIONS,
  324. DEFAULT_MODELS,
  325. DEFAULT_ARENA_MODEL,
  326. MODEL_ORDER_LIST,
  327. EVALUATION_ARENA_MODELS,
  328. # WebUI (OAuth)
  329. ENABLE_OAUTH_ROLE_MANAGEMENT,
  330. OAUTH_ROLES_CLAIM,
  331. OAUTH_EMAIL_CLAIM,
  332. OAUTH_PICTURE_CLAIM,
  333. OAUTH_USERNAME_CLAIM,
  334. OAUTH_ALLOWED_ROLES,
  335. OAUTH_ADMIN_ROLES,
  336. # WebUI (LDAP)
  337. ENABLE_LDAP,
  338. LDAP_SERVER_LABEL,
  339. LDAP_SERVER_HOST,
  340. LDAP_SERVER_PORT,
  341. LDAP_ATTRIBUTE_FOR_MAIL,
  342. LDAP_ATTRIBUTE_FOR_USERNAME,
  343. LDAP_SEARCH_FILTERS,
  344. LDAP_SEARCH_BASE,
  345. LDAP_APP_DN,
  346. LDAP_APP_PASSWORD,
  347. LDAP_USE_TLS,
  348. LDAP_CA_CERT_FILE,
  349. LDAP_VALIDATE_CERT,
  350. LDAP_CIPHERS,
  351. # LDAP Group Management
  352. ENABLE_LDAP_GROUP_MANAGEMENT,
  353. ENABLE_LDAP_GROUP_CREATION,
  354. LDAP_ATTRIBUTE_FOR_GROUPS,
  355. # Misc
  356. ENV,
  357. CACHE_DIR,
  358. STATIC_DIR,
  359. FRONTEND_BUILD_DIR,
  360. CORS_ALLOW_ORIGIN,
  361. DEFAULT_LOCALE,
  362. OAUTH_PROVIDERS,
  363. WEBUI_URL,
  364. RESPONSE_WATERMARK,
  365. # Admin
  366. ENABLE_ADMIN_CHAT_ACCESS,
  367. ENABLE_ADMIN_WORKSPACE_CONTENT_ACCESS,
  368. ENABLE_ADMIN_EXPORT,
  369. # Tasks
  370. TASK_MODEL,
  371. TASK_MODEL_EXTERNAL,
  372. ENABLE_TAGS_GENERATION,
  373. ENABLE_TITLE_GENERATION,
  374. ENABLE_FOLLOW_UP_GENERATION,
  375. ENABLE_SEARCH_QUERY_GENERATION,
  376. ENABLE_RETRIEVAL_QUERY_GENERATION,
  377. ENABLE_AUTOCOMPLETE_GENERATION,
  378. TITLE_GENERATION_PROMPT_TEMPLATE,
  379. FOLLOW_UP_GENERATION_PROMPT_TEMPLATE,
  380. TAGS_GENERATION_PROMPT_TEMPLATE,
  381. IMAGE_PROMPT_GENERATION_PROMPT_TEMPLATE,
  382. TOOLS_FUNCTION_CALLING_PROMPT_TEMPLATE,
  383. QUERY_GENERATION_PROMPT_TEMPLATE,
  384. AUTOCOMPLETE_GENERATION_PROMPT_TEMPLATE,
  385. AUTOCOMPLETE_GENERATION_INPUT_MAX_LENGTH,
  386. AppConfig,
  387. reset_config,
  388. )
  389. from open_webui.env import (
  390. LICENSE_KEY,
  391. AUDIT_EXCLUDED_PATHS,
  392. AUDIT_LOG_LEVEL,
  393. CHANGELOG,
  394. REDIS_URL,
  395. REDIS_CLUSTER,
  396. REDIS_KEY_PREFIX,
  397. REDIS_SENTINEL_HOSTS,
  398. REDIS_SENTINEL_PORT,
  399. GLOBAL_LOG_LEVEL,
  400. MAX_BODY_LOG_SIZE,
  401. SAFE_MODE,
  402. SRC_LOG_LEVELS,
  403. VERSION,
  404. INSTANCE_ID,
  405. WEBUI_BUILD_HASH,
  406. WEBUI_SECRET_KEY,
  407. WEBUI_SESSION_COOKIE_SAME_SITE,
  408. WEBUI_SESSION_COOKIE_SECURE,
  409. ENABLE_SIGNUP_PASSWORD_CONFIRMATION,
  410. WEBUI_AUTH_TRUSTED_EMAIL_HEADER,
  411. WEBUI_AUTH_TRUSTED_NAME_HEADER,
  412. WEBUI_AUTH_SIGNOUT_REDIRECT_URL,
  413. # SCIM
  414. SCIM_ENABLED,
  415. SCIM_TOKEN,
  416. ENABLE_COMPRESSION_MIDDLEWARE,
  417. ENABLE_WEBSOCKET_SUPPORT,
  418. BYPASS_MODEL_ACCESS_CONTROL,
  419. RESET_CONFIG_ON_START,
  420. ENABLE_VERSION_UPDATE_CHECK,
  421. ENABLE_OTEL,
  422. EXTERNAL_PWA_MANIFEST_URL,
  423. AIOHTTP_CLIENT_SESSION_SSL,
  424. )
  425. from open_webui.utils.models import (
  426. get_all_models,
  427. get_all_base_models,
  428. check_model_access,
  429. )
  430. from open_webui.utils.chat import (
  431. generate_chat_completion as chat_completion_handler,
  432. chat_completed as chat_completed_handler,
  433. chat_action as chat_action_handler,
  434. )
  435. from open_webui.utils.embeddings import generate_embeddings
  436. from open_webui.utils.middleware import process_chat_payload, process_chat_response
  437. from open_webui.utils.access_control import has_access
  438. from open_webui.utils.auth import (
  439. get_license_data,
  440. get_http_authorization_cred,
  441. decode_token,
  442. get_admin_user,
  443. get_verified_user,
  444. )
  445. from open_webui.utils.plugin import install_tool_and_function_dependencies
  446. from open_webui.utils.oauth import OAuthManager
  447. from open_webui.utils.security_headers import SecurityHeadersMiddleware
  448. from open_webui.utils.redis import get_redis_connection
  449. from open_webui.tasks import (
  450. redis_task_command_listener,
  451. list_task_ids_by_item_id,
  452. create_task,
  453. stop_task,
  454. list_tasks,
  455. ) # Import from tasks.py
  456. from open_webui.utils.redis import get_sentinels_from_env
  457. from open_webui.constants import ERROR_MESSAGES
# Safe mode: announce it on stdout and deactivate every stored function
# before the rest of the module is set up.
if SAFE_MODE:
    print("SAFE MODE ENABLED")
    Functions.deactivate_all_functions()

# Root logging goes to stdout at GLOBAL_LOG_LEVEL; this module's own logger
# then takes its level from the "MAIN" entry of SRC_LOG_LEVELS.
logging.basicConfig(stream=sys.stdout, level=GLOBAL_LOG_LEVEL)
log = logging.getLogger(__name__)
log.setLevel(SRC_LOG_LEVELS["MAIN"])
  464. class SPAStaticFiles(StaticFiles):
  465. async def get_response(self, path: str, scope):
  466. try:
  467. return await super().get_response(path, scope)
  468. except (HTTPException, StarletteHTTPException) as ex:
  469. if ex.status_code == 404:
  470. if path.endswith(".js"):
  471. # Return 404 for javascript files
  472. raise ex
  473. else:
  474. return await super().get_response("index.html", scope)
  475. else:
  476. raise ex
# Startup banner printed to stdout at import time. The "Commit:" line renders
# as an empty string when WEBUI_BUILD_HASH equals "dev-build".
print(
    rf"""
██████╗ ██████╗ ███████╗███╗ ██╗ ██╗ ██╗███████╗██████╗ ██╗ ██╗██╗
██╔═══██╗██╔══██╗██╔════╝████╗ ██║ ██║ ██║██╔════╝██╔══██╗██║ ██║██║
██║ ██║██████╔╝█████╗ ██╔██╗ ██║ ██║ █╗ ██║█████╗ ██████╔╝██║ ██║██║
██║ ██║██╔═══╝ ██╔══╝ ██║╚██╗██║ ██║███╗██║██╔══╝ ██╔══██╗██║ ██║██║
╚██████╔╝██║ ███████╗██║ ╚████║ ╚███╔███╔╝███████╗██████╔╝╚██████╔╝██║
╚═════╝ ╚═╝ ╚══════╝╚═╝ ╚═══╝ ╚══╝╚══╝ ╚══════╝╚═════╝ ╚═════╝ ╚═╝
v{VERSION} - building the best AI user interface.
{f"Commit: {WEBUI_BUILD_HASH}" if WEBUI_BUILD_HASH != "dev-build" else ""}
https://github.com/open-webui/open-webui
"""
)
  490. @asynccontextmanager
  491. async def lifespan(app: FastAPI):
  492. app.state.instance_id = INSTANCE_ID
  493. start_logger()
  494. if RESET_CONFIG_ON_START:
  495. reset_config()
  496. if LICENSE_KEY:
  497. get_license_data(app, LICENSE_KEY)
  498. # This should be blocking (sync) so functions are not deactivated on first /get_models calls
  499. # when the first user lands on the / route.
  500. log.info("Installing external dependencies of functions and tools...")
  501. install_tool_and_function_dependencies()
  502. app.state.redis = get_redis_connection(
  503. redis_url=REDIS_URL,
  504. redis_sentinels=get_sentinels_from_env(
  505. REDIS_SENTINEL_HOSTS, REDIS_SENTINEL_PORT
  506. ),
  507. redis_cluster=REDIS_CLUSTER,
  508. async_mode=True,
  509. )
  510. if app.state.redis is not None:
  511. app.state.redis_task_command_listener = asyncio.create_task(
  512. redis_task_command_listener(app)
  513. )
  514. if THREAD_POOL_SIZE and THREAD_POOL_SIZE > 0:
  515. limiter = anyio.to_thread.current_default_thread_limiter()
  516. limiter.total_tokens = THREAD_POOL_SIZE
  517. asyncio.create_task(periodic_usage_pool_cleanup())
  518. if app.state.config.ENABLE_BASE_MODELS_CACHE:
  519. await get_all_models(
  520. Request(
  521. # Creating a mock request object to pass to get_all_models
  522. {
  523. "type": "http",
  524. "asgi.version": "3.0",
  525. "asgi.spec_version": "2.0",
  526. "method": "GET",
  527. "path": "/internal",
  528. "query_string": b"",
  529. "headers": Headers({}).raw,
  530. "client": ("127.0.0.1", 12345),
  531. "server": ("127.0.0.1", 80),
  532. "scheme": "http",
  533. "app": app,
  534. }
  535. ),
  536. None,
  537. )
  538. yield
  539. if hasattr(app.state, "redis_task_command_listener"):
  540. app.state.redis_task_command_listener.cancel()
# Build the ASGI application. The interactive docs and the OpenAPI schema are
# only exposed when ENV == "dev"; ReDoc is always disabled.
app = FastAPI(
    title="Open WebUI",
    docs_url="/docs" if ENV == "dev" else None,
    openapi_url="/openapi.json" if ENV == "dev" else None,
    redoc_url=None,
    lifespan=lifespan,
)

oauth_manager = OAuthManager(app)

# Placeholder until lifespan() assigns INSTANCE_ID at startup.
app.state.instance_id = None

# Shared configuration object; the sections below attach their settings to it.
app.state.config = AppConfig(
    redis_url=REDIS_URL,
    redis_sentinels=get_sentinels_from_env(REDIS_SENTINEL_HOSTS, REDIS_SENTINEL_PORT),
    redis_cluster=REDIS_CLUSTER,
    redis_key_prefix=REDIS_KEY_PREFIX,
)
# Placeholder until lifespan() stores the result of get_redis_connection().
app.state.redis = None

app.state.WEBUI_NAME = WEBUI_NAME
app.state.LICENSE_METADATA = None
########################################
#
# OPENTELEMETRY
#
########################################

# The telemetry setup module is imported only when ENABLE_OTEL is set; it is
# handed both the app and the database engine.
if ENABLE_OTEL:
    from open_webui.utils.telemetry.setup import setup as setup_opentelemetry

    setup_opentelemetry(app=app, db_engine=engine)
########################################
#
# OLLAMA
#
########################################

# Seed the Ollama settings on the shared config object from the values
# imported from open_webui.config.
app.state.config.ENABLE_OLLAMA_API = ENABLE_OLLAMA_API
app.state.config.OLLAMA_BASE_URLS = OLLAMA_BASE_URLS
app.state.config.OLLAMA_API_CONFIGS = OLLAMA_API_CONFIGS

# Starts empty; nothing in this section populates it.
app.state.OLLAMA_MODELS = {}
########################################
#
# OPENAI
#
########################################

# Seed the OpenAI settings on the shared config object from the values
# imported from open_webui.config.
app.state.config.ENABLE_OPENAI_API = ENABLE_OPENAI_API
app.state.config.OPENAI_API_BASE_URLS = OPENAI_API_BASE_URLS
app.state.config.OPENAI_API_KEYS = OPENAI_API_KEYS
app.state.config.OPENAI_API_CONFIGS = OPENAI_API_CONFIGS

# Starts empty; nothing in this section populates it.
app.state.OPENAI_MODELS = {}
########################################
#
# TOOL SERVERS
#
########################################

# The connection list is stored on the config object.
app.state.config.TOOL_SERVER_CONNECTIONS = TOOL_SERVER_CONNECTIONS
# Starts as an empty list on app.state itself, not on the config object.
app.state.TOOL_SERVERS = []
########################################
#
# DIRECT CONNECTIONS
#
########################################

# Single flag, taken from the value imported from open_webui.config.
app.state.config.ENABLE_DIRECT_CONNECTIONS = ENABLE_DIRECT_CONNECTIONS
########################################
#
# SCIM
#
########################################

# Both values are imported from open_webui.env and are stored on app.state
# directly rather than on app.state.config.
app.state.SCIM_ENABLED = SCIM_ENABLED
app.state.SCIM_TOKEN = SCIM_TOKEN
########################################
#
# MODELS
#
########################################

# lifespan() reads this flag at startup to decide whether to call
# get_all_models() once before serving.
app.state.config.ENABLE_BASE_MODELS_CACHE = ENABLE_BASE_MODELS_CACHE
# Starts empty; nothing in this section populates it.
app.state.BASE_MODELS = []
########################################
#
# WEBUI
#
########################################

# General WebUI settings, copied onto the shared config object from the
# values imported from open_webui.config.
app.state.config.WEBUI_URL = WEBUI_URL
app.state.config.ENABLE_SIGNUP = ENABLE_SIGNUP
app.state.config.ENABLE_LOGIN_FORM = ENABLE_LOGIN_FORM

# API key settings.
app.state.config.ENABLE_API_KEY = ENABLE_API_KEY
app.state.config.ENABLE_API_KEY_ENDPOINT_RESTRICTIONS = (
    ENABLE_API_KEY_ENDPOINT_RESTRICTIONS
)
app.state.config.API_KEY_ALLOWED_ENDPOINTS = API_KEY_ALLOWED_ENDPOINTS

app.state.config.JWT_EXPIRES_IN = JWT_EXPIRES_IN

app.state.config.SHOW_ADMIN_DETAILS = SHOW_ADMIN_DETAILS
app.state.config.ADMIN_EMAIL = ADMIN_EMAIL

app.state.config.DEFAULT_MODELS = DEFAULT_MODELS
app.state.config.DEFAULT_PROMPT_SUGGESTIONS = DEFAULT_PROMPT_SUGGESTIONS
app.state.config.DEFAULT_USER_ROLE = DEFAULT_USER_ROLE

app.state.config.PENDING_USER_OVERLAY_CONTENT = PENDING_USER_OVERLAY_CONTENT
app.state.config.PENDING_USER_OVERLAY_TITLE = PENDING_USER_OVERLAY_TITLE

app.state.config.RESPONSE_WATERMARK = RESPONSE_WATERMARK

app.state.config.USER_PERMISSIONS = USER_PERMISSIONS
app.state.config.WEBHOOK_URL = WEBHOOK_URL
# Note the key name: the config attribute is BANNERS, seeded from WEBUI_BANNERS.
app.state.config.BANNERS = WEBUI_BANNERS
app.state.config.MODEL_ORDER_LIST = MODEL_ORDER_LIST

# Feature toggles.
app.state.config.ENABLE_CHANNELS = ENABLE_CHANNELS
app.state.config.ENABLE_NOTES = ENABLE_NOTES
app.state.config.ENABLE_COMMUNITY_SHARING = ENABLE_COMMUNITY_SHARING
app.state.config.ENABLE_MESSAGE_RATING = ENABLE_MESSAGE_RATING
app.state.config.ENABLE_USER_WEBHOOKS = ENABLE_USER_WEBHOOKS

app.state.config.ENABLE_EVALUATION_ARENA_MODELS = ENABLE_EVALUATION_ARENA_MODELS
app.state.config.EVALUATION_ARENA_MODELS = EVALUATION_ARENA_MODELS

# OAuth claim names and role settings.
app.state.config.OAUTH_USERNAME_CLAIM = OAUTH_USERNAME_CLAIM
app.state.config.OAUTH_PICTURE_CLAIM = OAUTH_PICTURE_CLAIM
app.state.config.OAUTH_EMAIL_CLAIM = OAUTH_EMAIL_CLAIM

app.state.config.ENABLE_OAUTH_ROLE_MANAGEMENT = ENABLE_OAUTH_ROLE_MANAGEMENT
app.state.config.OAUTH_ROLES_CLAIM = OAUTH_ROLES_CLAIM
app.state.config.OAUTH_ALLOWED_ROLES = OAUTH_ALLOWED_ROLES
app.state.config.OAUTH_ADMIN_ROLES = OAUTH_ADMIN_ROLES

# LDAP settings.
app.state.config.ENABLE_LDAP = ENABLE_LDAP
app.state.config.LDAP_SERVER_LABEL = LDAP_SERVER_LABEL
app.state.config.LDAP_SERVER_HOST = LDAP_SERVER_HOST
app.state.config.LDAP_SERVER_PORT = LDAP_SERVER_PORT
app.state.config.LDAP_ATTRIBUTE_FOR_MAIL = LDAP_ATTRIBUTE_FOR_MAIL
app.state.config.LDAP_ATTRIBUTE_FOR_USERNAME = LDAP_ATTRIBUTE_FOR_USERNAME
app.state.config.LDAP_APP_DN = LDAP_APP_DN
app.state.config.LDAP_APP_PASSWORD = LDAP_APP_PASSWORD
app.state.config.LDAP_SEARCH_BASE = LDAP_SEARCH_BASE
app.state.config.LDAP_SEARCH_FILTERS = LDAP_SEARCH_FILTERS
app.state.config.LDAP_USE_TLS = LDAP_USE_TLS
app.state.config.LDAP_CA_CERT_FILE = LDAP_CA_CERT_FILE
app.state.config.LDAP_VALIDATE_CERT = LDAP_VALIDATE_CERT
app.state.config.LDAP_CIPHERS = LDAP_CIPHERS

# For LDAP Group Management
app.state.config.ENABLE_LDAP_GROUP_MANAGEMENT = ENABLE_LDAP_GROUP_MANAGEMENT
app.state.config.ENABLE_LDAP_GROUP_CREATION = ENABLE_LDAP_GROUP_CREATION
app.state.config.LDAP_ATTRIBUTE_FOR_GROUPS = LDAP_ATTRIBUTE_FOR_GROUPS

# These four values are imported from open_webui.env and are stored on
# app.state directly rather than on app.state.config.
app.state.AUTH_TRUSTED_EMAIL_HEADER = WEBUI_AUTH_TRUSTED_EMAIL_HEADER
app.state.AUTH_TRUSTED_NAME_HEADER = WEBUI_AUTH_TRUSTED_NAME_HEADER
app.state.WEBUI_AUTH_SIGNOUT_REDIRECT_URL = WEBUI_AUTH_SIGNOUT_REDIRECT_URL
app.state.EXTERNAL_PWA_MANIFEST_URL = EXTERNAL_PWA_MANIFEST_URL

# Unset / empty at import time; nothing in this section fills them.
app.state.USER_COUNT = None

app.state.TOOLS = {}
app.state.TOOL_CONTENTS = {}

app.state.FUNCTIONS = {}
app.state.FUNCTION_CONTENTS = {}
########################################
#
# RETRIEVAL
#
########################################

# Retrieval settings, copied onto the shared config object from the values
# imported from open_webui.config. Several config keys drop the RAG_ prefix of
# the constant they are seeded from (e.g. TOP_K is seeded from RAG_TOP_K).
app.state.config.TOP_K = RAG_TOP_K
app.state.config.TOP_K_RERANKER = RAG_TOP_K_RERANKER
app.state.config.RELEVANCE_THRESHOLD = RAG_RELEVANCE_THRESHOLD
app.state.config.HYBRID_BM25_WEIGHT = RAG_HYBRID_BM25_WEIGHT

# File upload limits and image compression dimensions.
app.state.config.ALLOWED_FILE_EXTENSIONS = RAG_ALLOWED_FILE_EXTENSIONS
app.state.config.FILE_MAX_SIZE = RAG_FILE_MAX_SIZE
app.state.config.FILE_MAX_COUNT = RAG_FILE_MAX_COUNT
app.state.config.FILE_IMAGE_COMPRESSION_WIDTH = FILE_IMAGE_COMPRESSION_WIDTH
app.state.config.FILE_IMAGE_COMPRESSION_HEIGHT = FILE_IMAGE_COMPRESSION_HEIGHT

app.state.config.RAG_FULL_CONTEXT = RAG_FULL_CONTEXT
app.state.config.BYPASS_EMBEDDING_AND_RETRIEVAL = BYPASS_EMBEDDING_AND_RETRIEVAL
app.state.config.ENABLE_RAG_HYBRID_SEARCH = ENABLE_RAG_HYBRID_SEARCH
app.state.config.ENABLE_WEB_LOADER_SSL_VERIFICATION = ENABLE_WEB_LOADER_SSL_VERIFICATION

# Content extraction engine selection and the per-engine settings
# (Datalab Marker, external loader, Tika, Docling, Document Intelligence,
# Mistral OCR).
app.state.config.CONTENT_EXTRACTION_ENGINE = CONTENT_EXTRACTION_ENGINE
app.state.config.DATALAB_MARKER_API_KEY = DATALAB_MARKER_API_KEY
app.state.config.DATALAB_MARKER_API_BASE_URL = DATALAB_MARKER_API_BASE_URL
app.state.config.DATALAB_MARKER_ADDITIONAL_CONFIG = DATALAB_MARKER_ADDITIONAL_CONFIG
app.state.config.DATALAB_MARKER_SKIP_CACHE = DATALAB_MARKER_SKIP_CACHE
app.state.config.DATALAB_MARKER_FORCE_OCR = DATALAB_MARKER_FORCE_OCR
app.state.config.DATALAB_MARKER_PAGINATE = DATALAB_MARKER_PAGINATE
app.state.config.DATALAB_MARKER_STRIP_EXISTING_OCR = DATALAB_MARKER_STRIP_EXISTING_OCR
app.state.config.DATALAB_MARKER_DISABLE_IMAGE_EXTRACTION = (
    DATALAB_MARKER_DISABLE_IMAGE_EXTRACTION
)
app.state.config.DATALAB_MARKER_FORMAT_LINES = DATALAB_MARKER_FORMAT_LINES
app.state.config.DATALAB_MARKER_USE_LLM = DATALAB_MARKER_USE_LLM
app.state.config.DATALAB_MARKER_OUTPUT_FORMAT = DATALAB_MARKER_OUTPUT_FORMAT
app.state.config.EXTERNAL_DOCUMENT_LOADER_URL = EXTERNAL_DOCUMENT_LOADER_URL
app.state.config.EXTERNAL_DOCUMENT_LOADER_API_KEY = EXTERNAL_DOCUMENT_LOADER_API_KEY
app.state.config.TIKA_SERVER_URL = TIKA_SERVER_URL
app.state.config.DOCLING_SERVER_URL = DOCLING_SERVER_URL
app.state.config.DOCLING_OCR_ENGINE = DOCLING_OCR_ENGINE
app.state.config.DOCLING_OCR_LANG = DOCLING_OCR_LANG
app.state.config.DOCLING_DO_PICTURE_DESCRIPTION = DOCLING_DO_PICTURE_DESCRIPTION
app.state.config.DOCLING_PICTURE_DESCRIPTION_MODE = DOCLING_PICTURE_DESCRIPTION_MODE
app.state.config.DOCLING_PICTURE_DESCRIPTION_LOCAL = DOCLING_PICTURE_DESCRIPTION_LOCAL
app.state.config.DOCLING_PICTURE_DESCRIPTION_API = DOCLING_PICTURE_DESCRIPTION_API
app.state.config.DOCUMENT_INTELLIGENCE_ENDPOINT = DOCUMENT_INTELLIGENCE_ENDPOINT
app.state.config.DOCUMENT_INTELLIGENCE_KEY = DOCUMENT_INTELLIGENCE_KEY
app.state.config.MISTRAL_OCR_API_KEY = MISTRAL_OCR_API_KEY

# Text splitting settings.
app.state.config.TEXT_SPLITTER = RAG_TEXT_SPLITTER
app.state.config.TIKTOKEN_ENCODING_NAME = TIKTOKEN_ENCODING_NAME

app.state.config.CHUNK_SIZE = CHUNK_SIZE
app.state.config.CHUNK_OVERLAP = CHUNK_OVERLAP

# Embedding and reranking engine/model selection.
app.state.config.RAG_EMBEDDING_ENGINE = RAG_EMBEDDING_ENGINE
app.state.config.RAG_EMBEDDING_MODEL = RAG_EMBEDDING_MODEL
app.state.config.RAG_EMBEDDING_BATCH_SIZE = RAG_EMBEDDING_BATCH_SIZE

app.state.config.RAG_RERANKING_ENGINE = RAG_RERANKING_ENGINE
app.state.config.RAG_RERANKING_MODEL = RAG_RERANKING_MODEL
  734. app.state.config.RAG_EXTERNAL_RERANKER_URL = RAG_EXTERNAL_RERANKER_URL
  735. app.state.config.RAG_EXTERNAL_RERANKER_API_KEY = RAG_EXTERNAL_RERANKER_API_KEY
  736. app.state.config.RAG_TEMPLATE = RAG_TEMPLATE
  737. app.state.config.RAG_OPENAI_API_BASE_URL = RAG_OPENAI_API_BASE_URL
  738. app.state.config.RAG_OPENAI_API_KEY = RAG_OPENAI_API_KEY
  739. app.state.config.RAG_AZURE_OPENAI_BASE_URL = RAG_AZURE_OPENAI_BASE_URL
  740. app.state.config.RAG_AZURE_OPENAI_API_KEY = RAG_AZURE_OPENAI_API_KEY
  741. app.state.config.RAG_AZURE_OPENAI_API_VERSION = RAG_AZURE_OPENAI_API_VERSION
  742. app.state.config.RAG_OLLAMA_BASE_URL = RAG_OLLAMA_BASE_URL
  743. app.state.config.RAG_OLLAMA_API_KEY = RAG_OLLAMA_API_KEY
  744. app.state.config.PDF_EXTRACT_IMAGES = PDF_EXTRACT_IMAGES
  745. app.state.config.YOUTUBE_LOADER_LANGUAGE = YOUTUBE_LOADER_LANGUAGE
  746. app.state.config.YOUTUBE_LOADER_PROXY_URL = YOUTUBE_LOADER_PROXY_URL
  747. app.state.config.ENABLE_WEB_SEARCH = ENABLE_WEB_SEARCH
  748. app.state.config.WEB_SEARCH_ENGINE = WEB_SEARCH_ENGINE
  749. app.state.config.WEB_SEARCH_DOMAIN_FILTER_LIST = WEB_SEARCH_DOMAIN_FILTER_LIST
  750. app.state.config.WEB_SEARCH_RESULT_COUNT = WEB_SEARCH_RESULT_COUNT
  751. app.state.config.WEB_SEARCH_CONCURRENT_REQUESTS = WEB_SEARCH_CONCURRENT_REQUESTS
  752. app.state.config.WEB_LOADER_ENGINE = WEB_LOADER_ENGINE
  753. app.state.config.WEB_LOADER_CONCURRENT_REQUESTS = WEB_LOADER_CONCURRENT_REQUESTS
  754. app.state.config.WEB_SEARCH_TRUST_ENV = WEB_SEARCH_TRUST_ENV
  755. app.state.config.BYPASS_WEB_SEARCH_EMBEDDING_AND_RETRIEVAL = (
  756. BYPASS_WEB_SEARCH_EMBEDDING_AND_RETRIEVAL
  757. )
  758. app.state.config.BYPASS_WEB_SEARCH_WEB_LOADER = BYPASS_WEB_SEARCH_WEB_LOADER
  759. app.state.config.ENABLE_GOOGLE_DRIVE_INTEGRATION = ENABLE_GOOGLE_DRIVE_INTEGRATION
  760. app.state.config.ENABLE_ONEDRIVE_INTEGRATION = ENABLE_ONEDRIVE_INTEGRATION
  761. app.state.config.SEARXNG_QUERY_URL = SEARXNG_QUERY_URL
  762. app.state.config.YACY_QUERY_URL = YACY_QUERY_URL
  763. app.state.config.YACY_USERNAME = YACY_USERNAME
  764. app.state.config.YACY_PASSWORD = YACY_PASSWORD
  765. app.state.config.GOOGLE_PSE_API_KEY = GOOGLE_PSE_API_KEY
  766. app.state.config.GOOGLE_PSE_ENGINE_ID = GOOGLE_PSE_ENGINE_ID
  767. app.state.config.BRAVE_SEARCH_API_KEY = BRAVE_SEARCH_API_KEY
  768. app.state.config.KAGI_SEARCH_API_KEY = KAGI_SEARCH_API_KEY
  769. app.state.config.MOJEEK_SEARCH_API_KEY = MOJEEK_SEARCH_API_KEY
  770. app.state.config.BOCHA_SEARCH_API_KEY = BOCHA_SEARCH_API_KEY
  771. app.state.config.SERPSTACK_API_KEY = SERPSTACK_API_KEY
  772. app.state.config.SERPSTACK_HTTPS = SERPSTACK_HTTPS
  773. app.state.config.SERPER_API_KEY = SERPER_API_KEY
  774. app.state.config.SERPLY_API_KEY = SERPLY_API_KEY
  775. app.state.config.TAVILY_API_KEY = TAVILY_API_KEY
  776. app.state.config.SEARCHAPI_API_KEY = SEARCHAPI_API_KEY
  777. app.state.config.SEARCHAPI_ENGINE = SEARCHAPI_ENGINE
  778. app.state.config.SERPAPI_API_KEY = SERPAPI_API_KEY
  779. app.state.config.SERPAPI_ENGINE = SERPAPI_ENGINE
  780. app.state.config.JINA_API_KEY = JINA_API_KEY
  781. app.state.config.BING_SEARCH_V7_ENDPOINT = BING_SEARCH_V7_ENDPOINT
  782. app.state.config.BING_SEARCH_V7_SUBSCRIPTION_KEY = BING_SEARCH_V7_SUBSCRIPTION_KEY
  783. app.state.config.EXA_API_KEY = EXA_API_KEY
  784. app.state.config.PERPLEXITY_API_KEY = PERPLEXITY_API_KEY
  785. app.state.config.PERPLEXITY_MODEL = PERPLEXITY_MODEL
  786. app.state.config.PERPLEXITY_SEARCH_CONTEXT_USAGE = PERPLEXITY_SEARCH_CONTEXT_USAGE
  787. app.state.config.SOUGOU_API_SID = SOUGOU_API_SID
  788. app.state.config.SOUGOU_API_SK = SOUGOU_API_SK
  789. app.state.config.EXTERNAL_WEB_SEARCH_URL = EXTERNAL_WEB_SEARCH_URL
  790. app.state.config.EXTERNAL_WEB_SEARCH_API_KEY = EXTERNAL_WEB_SEARCH_API_KEY
  791. app.state.config.EXTERNAL_WEB_LOADER_URL = EXTERNAL_WEB_LOADER_URL
  792. app.state.config.EXTERNAL_WEB_LOADER_API_KEY = EXTERNAL_WEB_LOADER_API_KEY
  793. app.state.config.PLAYWRIGHT_WS_URL = PLAYWRIGHT_WS_URL
  794. app.state.config.PLAYWRIGHT_TIMEOUT = PLAYWRIGHT_TIMEOUT
  795. app.state.config.FIRECRAWL_API_BASE_URL = FIRECRAWL_API_BASE_URL
  796. app.state.config.FIRECRAWL_API_KEY = FIRECRAWL_API_KEY
  797. app.state.config.TAVILY_EXTRACT_DEPTH = TAVILY_EXTRACT_DEPTH
  798. app.state.EMBEDDING_FUNCTION = None
  799. app.state.RERANKING_FUNCTION = None
  800. app.state.ef = None
  801. app.state.rf = None
  802. app.state.YOUTUBE_LOADER_TRANSLATION = None
  803. try:
  804. app.state.ef = get_ef(
  805. app.state.config.RAG_EMBEDDING_ENGINE,
  806. app.state.config.RAG_EMBEDDING_MODEL,
  807. RAG_EMBEDDING_MODEL_AUTO_UPDATE,
  808. )
  809. app.state.rf = get_rf(
  810. app.state.config.RAG_RERANKING_ENGINE,
  811. app.state.config.RAG_RERANKING_MODEL,
  812. app.state.config.RAG_EXTERNAL_RERANKER_URL,
  813. app.state.config.RAG_EXTERNAL_RERANKER_API_KEY,
  814. RAG_RERANKING_MODEL_AUTO_UPDATE,
  815. )
  816. except Exception as e:
  817. log.error(f"Error updating models: {e}")
  818. pass
  819. app.state.EMBEDDING_FUNCTION = get_embedding_function(
  820. app.state.config.RAG_EMBEDDING_ENGINE,
  821. app.state.config.RAG_EMBEDDING_MODEL,
  822. embedding_function=app.state.ef,
  823. url=(
  824. app.state.config.RAG_OPENAI_API_BASE_URL
  825. if app.state.config.RAG_EMBEDDING_ENGINE == "openai"
  826. else (
  827. app.state.config.RAG_OLLAMA_BASE_URL
  828. if app.state.config.RAG_EMBEDDING_ENGINE == "ollama"
  829. else app.state.config.RAG_AZURE_OPENAI_BASE_URL
  830. )
  831. ),
  832. key=(
  833. app.state.config.RAG_OPENAI_API_KEY
  834. if app.state.config.RAG_EMBEDDING_ENGINE == "openai"
  835. else (
  836. app.state.config.RAG_OLLAMA_API_KEY
  837. if app.state.config.RAG_EMBEDDING_ENGINE == "ollama"
  838. else app.state.config.RAG_AZURE_OPENAI_API_KEY
  839. )
  840. ),
  841. embedding_batch_size=app.state.config.RAG_EMBEDDING_BATCH_SIZE,
  842. azure_api_version=(
  843. app.state.config.RAG_AZURE_OPENAI_API_VERSION
  844. if app.state.config.RAG_EMBEDDING_ENGINE == "azure_openai"
  845. else None
  846. ),
  847. )
  848. app.state.RERANKING_FUNCTION = get_reranking_function(
  849. app.state.config.RAG_RERANKING_ENGINE,
  850. app.state.config.RAG_RERANKING_MODEL,
  851. reranking_function=app.state.rf,
  852. )
  853. ########################################
  854. #
  855. # CODE EXECUTION
  856. #
  857. ########################################
  858. app.state.config.ENABLE_CODE_EXECUTION = ENABLE_CODE_EXECUTION
  859. app.state.config.CODE_EXECUTION_ENGINE = CODE_EXECUTION_ENGINE
  860. app.state.config.CODE_EXECUTION_JUPYTER_URL = CODE_EXECUTION_JUPYTER_URL
  861. app.state.config.CODE_EXECUTION_JUPYTER_AUTH = CODE_EXECUTION_JUPYTER_AUTH
  862. app.state.config.CODE_EXECUTION_JUPYTER_AUTH_TOKEN = CODE_EXECUTION_JUPYTER_AUTH_TOKEN
  863. app.state.config.CODE_EXECUTION_JUPYTER_AUTH_PASSWORD = (
  864. CODE_EXECUTION_JUPYTER_AUTH_PASSWORD
  865. )
  866. app.state.config.CODE_EXECUTION_JUPYTER_TIMEOUT = CODE_EXECUTION_JUPYTER_TIMEOUT
  867. app.state.config.ENABLE_CODE_INTERPRETER = ENABLE_CODE_INTERPRETER
  868. app.state.config.CODE_INTERPRETER_ENGINE = CODE_INTERPRETER_ENGINE
  869. app.state.config.CODE_INTERPRETER_PROMPT_TEMPLATE = CODE_INTERPRETER_PROMPT_TEMPLATE
  870. app.state.config.CODE_INTERPRETER_JUPYTER_URL = CODE_INTERPRETER_JUPYTER_URL
  871. app.state.config.CODE_INTERPRETER_JUPYTER_AUTH = CODE_INTERPRETER_JUPYTER_AUTH
  872. app.state.config.CODE_INTERPRETER_JUPYTER_AUTH_TOKEN = (
  873. CODE_INTERPRETER_JUPYTER_AUTH_TOKEN
  874. )
  875. app.state.config.CODE_INTERPRETER_JUPYTER_AUTH_PASSWORD = (
  876. CODE_INTERPRETER_JUPYTER_AUTH_PASSWORD
  877. )
  878. app.state.config.CODE_INTERPRETER_JUPYTER_TIMEOUT = CODE_INTERPRETER_JUPYTER_TIMEOUT
  879. ########################################
  880. #
  881. # IMAGES
  882. #
  883. ########################################
  884. app.state.config.IMAGE_GENERATION_ENGINE = IMAGE_GENERATION_ENGINE
  885. app.state.config.ENABLE_IMAGE_GENERATION = ENABLE_IMAGE_GENERATION
  886. app.state.config.ENABLE_IMAGE_PROMPT_GENERATION = ENABLE_IMAGE_PROMPT_GENERATION
  887. app.state.config.IMAGES_OPENAI_API_BASE_URL = IMAGES_OPENAI_API_BASE_URL
  888. app.state.config.IMAGES_OPENAI_API_KEY = IMAGES_OPENAI_API_KEY
  889. app.state.config.IMAGES_GEMINI_API_BASE_URL = IMAGES_GEMINI_API_BASE_URL
  890. app.state.config.IMAGES_GEMINI_API_KEY = IMAGES_GEMINI_API_KEY
  891. app.state.config.IMAGE_GENERATION_MODEL = IMAGE_GENERATION_MODEL
  892. app.state.config.AUTOMATIC1111_BASE_URL = AUTOMATIC1111_BASE_URL
  893. app.state.config.AUTOMATIC1111_API_AUTH = AUTOMATIC1111_API_AUTH
  894. app.state.config.AUTOMATIC1111_CFG_SCALE = AUTOMATIC1111_CFG_SCALE
  895. app.state.config.AUTOMATIC1111_SAMPLER = AUTOMATIC1111_SAMPLER
  896. app.state.config.AUTOMATIC1111_SCHEDULER = AUTOMATIC1111_SCHEDULER
  897. app.state.config.COMFYUI_BASE_URL = COMFYUI_BASE_URL
  898. app.state.config.COMFYUI_API_KEY = COMFYUI_API_KEY
  899. app.state.config.COMFYUI_WORKFLOW = COMFYUI_WORKFLOW
  900. app.state.config.COMFYUI_WORKFLOW_NODES = COMFYUI_WORKFLOW_NODES
  901. app.state.config.IMAGE_SIZE = IMAGE_SIZE
  902. app.state.config.IMAGE_STEPS = IMAGE_STEPS
  903. ########################################
  904. #
  905. # AUDIO
  906. #
  907. ########################################
  908. app.state.config.STT_ENGINE = AUDIO_STT_ENGINE
  909. app.state.config.STT_MODEL = AUDIO_STT_MODEL
  910. app.state.config.STT_SUPPORTED_CONTENT_TYPES = AUDIO_STT_SUPPORTED_CONTENT_TYPES
  911. app.state.config.STT_OPENAI_API_BASE_URL = AUDIO_STT_OPENAI_API_BASE_URL
  912. app.state.config.STT_OPENAI_API_KEY = AUDIO_STT_OPENAI_API_KEY
  913. app.state.config.WHISPER_MODEL = WHISPER_MODEL
  914. app.state.config.WHISPER_VAD_FILTER = WHISPER_VAD_FILTER
  915. app.state.config.DEEPGRAM_API_KEY = DEEPGRAM_API_KEY
  916. app.state.config.AUDIO_STT_AZURE_API_KEY = AUDIO_STT_AZURE_API_KEY
  917. app.state.config.AUDIO_STT_AZURE_REGION = AUDIO_STT_AZURE_REGION
  918. app.state.config.AUDIO_STT_AZURE_LOCALES = AUDIO_STT_AZURE_LOCALES
  919. app.state.config.AUDIO_STT_AZURE_BASE_URL = AUDIO_STT_AZURE_BASE_URL
  920. app.state.config.AUDIO_STT_AZURE_MAX_SPEAKERS = AUDIO_STT_AZURE_MAX_SPEAKERS
  921. app.state.config.TTS_OPENAI_API_BASE_URL = AUDIO_TTS_OPENAI_API_BASE_URL
  922. app.state.config.TTS_OPENAI_API_KEY = AUDIO_TTS_OPENAI_API_KEY
  923. app.state.config.TTS_ENGINE = AUDIO_TTS_ENGINE
  924. app.state.config.TTS_MODEL = AUDIO_TTS_MODEL
  925. app.state.config.TTS_VOICE = AUDIO_TTS_VOICE
  926. app.state.config.TTS_API_KEY = AUDIO_TTS_API_KEY
  927. app.state.config.TTS_SPLIT_ON = AUDIO_TTS_SPLIT_ON
  928. app.state.config.TTS_AZURE_SPEECH_REGION = AUDIO_TTS_AZURE_SPEECH_REGION
  929. app.state.config.TTS_AZURE_SPEECH_BASE_URL = AUDIO_TTS_AZURE_SPEECH_BASE_URL
  930. app.state.config.TTS_AZURE_SPEECH_OUTPUT_FORMAT = AUDIO_TTS_AZURE_SPEECH_OUTPUT_FORMAT
  931. app.state.faster_whisper_model = None
  932. app.state.speech_synthesiser = None
  933. app.state.speech_speaker_embeddings_dataset = None
  934. ########################################
  935. #
  936. # TASKS
  937. #
  938. ########################################
  939. app.state.config.TASK_MODEL = TASK_MODEL
  940. app.state.config.TASK_MODEL_EXTERNAL = TASK_MODEL_EXTERNAL
  941. app.state.config.ENABLE_SEARCH_QUERY_GENERATION = ENABLE_SEARCH_QUERY_GENERATION
  942. app.state.config.ENABLE_RETRIEVAL_QUERY_GENERATION = ENABLE_RETRIEVAL_QUERY_GENERATION
  943. app.state.config.ENABLE_AUTOCOMPLETE_GENERATION = ENABLE_AUTOCOMPLETE_GENERATION
  944. app.state.config.ENABLE_TAGS_GENERATION = ENABLE_TAGS_GENERATION
  945. app.state.config.ENABLE_TITLE_GENERATION = ENABLE_TITLE_GENERATION
  946. app.state.config.ENABLE_FOLLOW_UP_GENERATION = ENABLE_FOLLOW_UP_GENERATION
  947. app.state.config.TITLE_GENERATION_PROMPT_TEMPLATE = TITLE_GENERATION_PROMPT_TEMPLATE
  948. app.state.config.TAGS_GENERATION_PROMPT_TEMPLATE = TAGS_GENERATION_PROMPT_TEMPLATE
  949. app.state.config.IMAGE_PROMPT_GENERATION_PROMPT_TEMPLATE = (
  950. IMAGE_PROMPT_GENERATION_PROMPT_TEMPLATE
  951. )
  952. app.state.config.FOLLOW_UP_GENERATION_PROMPT_TEMPLATE = (
  953. FOLLOW_UP_GENERATION_PROMPT_TEMPLATE
  954. )
  955. app.state.config.TOOLS_FUNCTION_CALLING_PROMPT_TEMPLATE = (
  956. TOOLS_FUNCTION_CALLING_PROMPT_TEMPLATE
  957. )
  958. app.state.config.QUERY_GENERATION_PROMPT_TEMPLATE = QUERY_GENERATION_PROMPT_TEMPLATE
  959. app.state.config.AUTOCOMPLETE_GENERATION_PROMPT_TEMPLATE = (
  960. AUTOCOMPLETE_GENERATION_PROMPT_TEMPLATE
  961. )
  962. app.state.config.AUTOCOMPLETE_GENERATION_INPUT_MAX_LENGTH = (
  963. AUTOCOMPLETE_GENERATION_INPUT_MAX_LENGTH
  964. )
  965. ########################################
  966. #
  967. # WEBUI
  968. #
  969. ########################################
  970. app.state.MODELS = {}
  971. class RedirectMiddleware(BaseHTTPMiddleware):
  972. async def dispatch(self, request: Request, call_next):
  973. # Check if the request is a GET request
  974. if request.method == "GET":
  975. path = request.url.path
  976. query_params = dict(parse_qs(urlparse(str(request.url)).query))
  977. # Check for the specific watch path and the presence of 'v' parameter
  978. if path.endswith("/watch") and "v" in query_params:
  979. # Extract the first 'v' parameter
  980. video_id = query_params["v"][0]
  981. encoded_video_id = urlencode({"youtube": video_id})
  982. redirect_url = f"/?{encoded_video_id}"
  983. return RedirectResponse(url=redirect_url)
  984. # Proceed with the normal flow of other requests
  985. response = await call_next(request)
  986. return response
  987. # Add the middleware to the app
  988. if ENABLE_COMPRESSION_MIDDLEWARE:
  989. app.add_middleware(CompressMiddleware)
  990. app.add_middleware(RedirectMiddleware)
  991. app.add_middleware(SecurityHeadersMiddleware)
  992. @app.middleware("http")
  993. async def commit_session_after_request(request: Request, call_next):
  994. response = await call_next(request)
  995. # log.debug("Commit session after request")
  996. Session.commit()
  997. return response
  998. @app.middleware("http")
  999. async def check_url(request: Request, call_next):
  1000. start_time = int(time.time())
  1001. request.state.token = get_http_authorization_cred(
  1002. request.headers.get("Authorization")
  1003. )
  1004. request.state.enable_api_key = app.state.config.ENABLE_API_KEY
  1005. response = await call_next(request)
  1006. process_time = int(time.time()) - start_time
  1007. response.headers["X-Process-Time"] = str(process_time)
  1008. return response
  1009. @app.middleware("http")
  1010. async def inspect_websocket(request: Request, call_next):
  1011. if (
  1012. "/ws/socket.io" in request.url.path
  1013. and request.query_params.get("transport") == "websocket"
  1014. ):
  1015. upgrade = (request.headers.get("Upgrade") or "").lower()
  1016. connection = (request.headers.get("Connection") or "").lower().split(",")
  1017. # Check that there's the correct headers for an upgrade, else reject the connection
  1018. # This is to work around this upstream issue: https://github.com/miguelgrinberg/python-engineio/issues/367
  1019. if upgrade != "websocket" or "upgrade" not in connection:
  1020. return JSONResponse(
  1021. status_code=status.HTTP_400_BAD_REQUEST,
  1022. content={"detail": "Invalid WebSocket upgrade request"},
  1023. )
  1024. return await call_next(request)
  1025. app.add_middleware(
  1026. CORSMiddleware,
  1027. allow_origins=CORS_ALLOW_ORIGIN,
  1028. allow_credentials=True,
  1029. allow_methods=["*"],
  1030. allow_headers=["*"],
  1031. )
  1032. app.mount("/ws", socket_app)
  1033. app.include_router(ollama.router, prefix="/ollama", tags=["ollama"])
  1034. app.include_router(openai.router, prefix="/openai", tags=["openai"])
  1035. app.include_router(pipelines.router, prefix="/api/v1/pipelines", tags=["pipelines"])
  1036. app.include_router(tasks.router, prefix="/api/v1/tasks", tags=["tasks"])
  1037. app.include_router(images.router, prefix="/api/v1/images", tags=["images"])
  1038. app.include_router(audio.router, prefix="/api/v1/audio", tags=["audio"])
  1039. app.include_router(retrieval.router, prefix="/api/v1/retrieval", tags=["retrieval"])
  1040. app.include_router(configs.router, prefix="/api/v1/configs", tags=["configs"])
  1041. app.include_router(auths.router, prefix="/api/v1/auths", tags=["auths"])
  1042. app.include_router(users.router, prefix="/api/v1/users", tags=["users"])
  1043. app.include_router(channels.router, prefix="/api/v1/channels", tags=["channels"])
  1044. app.include_router(chats.router, prefix="/api/v1/chats", tags=["chats"])
  1045. app.include_router(notes.router, prefix="/api/v1/notes", tags=["notes"])
  1046. app.include_router(models.router, prefix="/api/v1/models", tags=["models"])
  1047. app.include_router(knowledge.router, prefix="/api/v1/knowledge", tags=["knowledge"])
  1048. app.include_router(prompts.router, prefix="/api/v1/prompts", tags=["prompts"])
  1049. app.include_router(tools.router, prefix="/api/v1/tools", tags=["tools"])
  1050. app.include_router(memories.router, prefix="/api/v1/memories", tags=["memories"])
  1051. app.include_router(folders.router, prefix="/api/v1/folders", tags=["folders"])
  1052. app.include_router(groups.router, prefix="/api/v1/groups", tags=["groups"])
  1053. app.include_router(files.router, prefix="/api/v1/files", tags=["files"])
  1054. app.include_router(functions.router, prefix="/api/v1/functions", tags=["functions"])
  1055. app.include_router(
  1056. evaluations.router, prefix="/api/v1/evaluations", tags=["evaluations"]
  1057. )
  1058. app.include_router(utils.router, prefix="/api/v1/utils", tags=["utils"])
  1059. # SCIM 2.0 API for identity management
  1060. if SCIM_ENABLED:
  1061. app.include_router(scim.router, prefix="/api/v1/scim/v2", tags=["scim"])
  1062. try:
  1063. audit_level = AuditLevel(AUDIT_LOG_LEVEL)
  1064. except ValueError as e:
  1065. logger.error(f"Invalid audit level: {AUDIT_LOG_LEVEL}. Error: {e}")
  1066. audit_level = AuditLevel.NONE
  1067. if audit_level != AuditLevel.NONE:
  1068. app.add_middleware(
  1069. AuditLoggingMiddleware,
  1070. audit_level=audit_level,
  1071. excluded_paths=AUDIT_EXCLUDED_PATHS,
  1072. max_body_size=MAX_BODY_LOG_SIZE,
  1073. )
  1074. ##################################
  1075. #
  1076. # Chat Endpoints
  1077. #
  1078. ##################################
  1079. @app.get("/api/models")
  1080. @app.get("/api/v1/models") # Experimental: Compatibility with OpenAI API
  1081. async def get_models(
  1082. request: Request, refresh: bool = False, user=Depends(get_verified_user)
  1083. ):
  1084. def get_filtered_models(models, user):
  1085. filtered_models = []
  1086. for model in models:
  1087. if model.get("arena"):
  1088. if has_access(
  1089. user.id,
  1090. type="read",
  1091. access_control=model.get("info", {})
  1092. .get("meta", {})
  1093. .get("access_control", {}),
  1094. ):
  1095. filtered_models.append(model)
  1096. continue
  1097. model_info = Models.get_model_by_id(model["id"])
  1098. if model_info:
  1099. if (
  1100. (user.role == "admin" and ENABLE_ADMIN_WORKSPACE_CONTENT_ACCESS)
  1101. or user.id == model_info.user_id
  1102. or has_access(
  1103. user.id, type="read", access_control=model_info.access_control
  1104. )
  1105. ):
  1106. filtered_models.append(model)
  1107. return filtered_models
  1108. all_models = await get_all_models(request, refresh=refresh, user=user)
  1109. models = []
  1110. for model in all_models:
  1111. # Filter out filter pipelines
  1112. if "pipeline" in model and model["pipeline"].get("type", None) == "filter":
  1113. continue
  1114. try:
  1115. model_tags = [
  1116. tag.get("name")
  1117. for tag in model.get("info", {}).get("meta", {}).get("tags", [])
  1118. ]
  1119. tags = [tag.get("name") for tag in model.get("tags", [])]
  1120. tags = list(set(model_tags + tags))
  1121. model["tags"] = [{"name": tag} for tag in tags]
  1122. except Exception as e:
  1123. log.debug(f"Error processing model tags: {e}")
  1124. model["tags"] = []
  1125. pass
  1126. models.append(model)
  1127. model_order_list = request.app.state.config.MODEL_ORDER_LIST
  1128. if model_order_list:
  1129. model_order_dict = {model_id: i for i, model_id in enumerate(model_order_list)}
  1130. # Sort models by order list priority, with fallback for those not in the list
  1131. models.sort(
  1132. key=lambda model: (
  1133. model_order_dict.get(model.get("id", ""), float("inf")),
  1134. (model.get("name", "") or ""),
  1135. )
  1136. )
  1137. # Filter out models that the user does not have access to
  1138. if (
  1139. user.role == "user"
  1140. or (user.role == "admin" and not ENABLE_ADMIN_WORKSPACE_CONTENT_ACCESS)
  1141. ) and not BYPASS_MODEL_ACCESS_CONTROL:
  1142. models = get_filtered_models(models, user)
  1143. log.debug(
  1144. f"/api/models returned filtered models accessible to the user: {json.dumps([model.get('id') for model in models])}"
  1145. )
  1146. return {"data": models}
  1147. @app.get("/api/models/base")
  1148. async def get_base_models(request: Request, user=Depends(get_admin_user)):
  1149. models = await get_all_base_models(request, user=user)
  1150. return {"data": models}
  1151. ##################################
  1152. # Embeddings
  1153. ##################################
  1154. @app.post("/api/embeddings")
  1155. @app.post("/api/v1/embeddings") # Experimental: Compatibility with OpenAI API
  1156. async def embeddings(
  1157. request: Request, form_data: dict, user=Depends(get_verified_user)
  1158. ):
  1159. """
  1160. OpenAI-compatible embeddings endpoint.
  1161. This handler:
  1162. - Performs user/model checks and dispatches to the correct backend.
  1163. - Supports OpenAI, Ollama, arena models, pipelines, and any compatible provider.
  1164. Args:
  1165. request (Request): Request context.
  1166. form_data (dict): OpenAI-like payload (e.g., {"model": "...", "input": [...]})
  1167. user (UserModel): Authenticated user.
  1168. Returns:
  1169. dict: OpenAI-compatible embeddings response.
  1170. """
  1171. # Make sure models are loaded in app state
  1172. if not request.app.state.MODELS:
  1173. await get_all_models(request, user=user)
  1174. # Use generic dispatcher in utils.embeddings
  1175. return await generate_embeddings(request, form_data, user)
  1176. @app.post("/api/chat/completions")
  1177. @app.post("/api/v1/chat/completions") # Experimental: Compatibility with OpenAI API
  1178. async def chat_completion(
  1179. request: Request,
  1180. form_data: dict,
  1181. user=Depends(get_verified_user),
  1182. ):
  1183. if not request.app.state.MODELS:
  1184. await get_all_models(request, user=user)
  1185. model_id = form_data.get("model", None)
  1186. model_item = form_data.pop("model_item", {})
  1187. tasks = form_data.pop("background_tasks", None)
  1188. metadata = {}
  1189. try:
  1190. if not model_item.get("direct", False):
  1191. if model_id not in request.app.state.MODELS:
  1192. raise Exception("Model not found")
  1193. model = request.app.state.MODELS[model_id]
  1194. model_info = Models.get_model_by_id(model_id)
  1195. # Check if user has access to the model
  1196. if not BYPASS_MODEL_ACCESS_CONTROL and (
  1197. user.role != "admin" or not ENABLE_ADMIN_WORKSPACE_CONTENT_ACCESS
  1198. ):
  1199. try:
  1200. check_model_access(user, model)
  1201. except Exception as e:
  1202. raise e
  1203. else:
  1204. model = model_item
  1205. model_info = None
  1206. request.state.direct = True
  1207. request.state.model = model
  1208. model_info_params = (
  1209. model_info.params.model_dump() if model_info and model_info.params else {}
  1210. )
  1211. # Chat Params
  1212. stream_delta_chunk_size = form_data.get("params", {}).get(
  1213. "stream_delta_chunk_size"
  1214. )
  1215. # Model Params
  1216. if model_info_params.get("stream_delta_chunk_size"):
  1217. stream_delta_chunk_size = model_info_params.get("stream_delta_chunk_size")
  1218. metadata = {
  1219. "user_id": user.id,
  1220. "chat_id": form_data.pop("chat_id", None),
  1221. "message_id": form_data.pop("id", None),
  1222. "session_id": form_data.pop("session_id", None),
  1223. "filter_ids": form_data.pop("filter_ids", []),
  1224. "tool_ids": form_data.get("tool_ids", None),
  1225. "tool_servers": form_data.pop("tool_servers", None),
  1226. "files": form_data.get("files", None),
  1227. "features": form_data.get("features", {}),
  1228. "variables": form_data.get("variables", {}),
  1229. "model": model,
  1230. "direct": model_item.get("direct", False),
  1231. "params": {
  1232. "stream_delta_chunk_size": stream_delta_chunk_size,
  1233. "function_calling": (
  1234. "native"
  1235. if (
  1236. form_data.get("params", {}).get("function_calling") == "native"
  1237. or model_info_params.get("function_calling") == "native"
  1238. )
  1239. else "default"
  1240. ),
  1241. },
  1242. }
  1243. if metadata.get("chat_id") and (user and user.role != "admin"):
  1244. if metadata["chat_id"] != "local":
  1245. chat = Chats.get_chat_by_id_and_user_id(metadata["chat_id"], user.id)
  1246. if chat is None:
  1247. raise HTTPException(
  1248. status_code=status.HTTP_404_NOT_FOUND,
  1249. detail=ERROR_MESSAGES.DEFAULT(),
  1250. )
  1251. request.state.metadata = metadata
  1252. form_data["metadata"] = metadata
  1253. except Exception as e:
  1254. log.debug(f"Error processing chat metadata: {e}")
  1255. raise HTTPException(
  1256. status_code=status.HTTP_400_BAD_REQUEST,
  1257. detail=str(e),
  1258. )
  1259. async def process_chat(request, form_data, user, metadata, model):
  1260. try:
  1261. form_data, metadata, events = await process_chat_payload(
  1262. request, form_data, user, metadata, model
  1263. )
  1264. response = await chat_completion_handler(request, form_data, user)
  1265. if metadata.get("chat_id") and metadata.get("message_id"):
  1266. try:
  1267. Chats.upsert_message_to_chat_by_id_and_message_id(
  1268. metadata["chat_id"],
  1269. metadata["message_id"],
  1270. {
  1271. "model": model_id,
  1272. },
  1273. )
  1274. except:
  1275. pass
  1276. return await process_chat_response(
  1277. request, response, form_data, user, metadata, model, events, tasks
  1278. )
  1279. except asyncio.CancelledError:
  1280. log.info("Chat processing was cancelled")
  1281. try:
  1282. event_emitter = get_event_emitter(metadata)
  1283. await event_emitter(
  1284. {"type": "task-cancelled"},
  1285. )
  1286. except Exception as e:
  1287. pass
  1288. except Exception as e:
  1289. log.debug(f"Error processing chat payload: {e}")
  1290. if metadata.get("chat_id") and metadata.get("message_id"):
  1291. # Update the chat message with the error
  1292. try:
  1293. Chats.upsert_message_to_chat_by_id_and_message_id(
  1294. metadata["chat_id"],
  1295. metadata["message_id"],
  1296. {
  1297. "error": {"content": str(e)},
  1298. },
  1299. )
  1300. except:
  1301. pass
  1302. raise HTTPException(
  1303. status_code=status.HTTP_400_BAD_REQUEST,
  1304. detail=str(e),
  1305. )
  1306. if (
  1307. metadata.get("session_id")
  1308. and metadata.get("chat_id")
  1309. and metadata.get("message_id")
  1310. ):
  1311. # Asynchronous Chat Processing
  1312. task_id, _ = await create_task(
  1313. request.app.state.redis,
  1314. process_chat(request, form_data, user, metadata, model),
  1315. id=metadata["chat_id"],
  1316. )
  1317. return {"status": True, "task_id": task_id}
  1318. else:
  1319. return await process_chat(request, form_data, user, metadata, model)
  1320. # Alias for chat_completion (Legacy)
  1321. generate_chat_completions = chat_completion
  1322. generate_chat_completion = chat_completion
  1323. @app.post("/api/chat/completed")
  1324. async def chat_completed(
  1325. request: Request, form_data: dict, user=Depends(get_verified_user)
  1326. ):
  1327. try:
  1328. model_item = form_data.pop("model_item", {})
  1329. if model_item.get("direct", False):
  1330. request.state.direct = True
  1331. request.state.model = model_item
  1332. return await chat_completed_handler(request, form_data, user)
  1333. except Exception as e:
  1334. raise HTTPException(
  1335. status_code=status.HTTP_400_BAD_REQUEST,
  1336. detail=str(e),
  1337. )
  1338. @app.post("/api/chat/actions/{action_id}")
  1339. async def chat_action(
  1340. request: Request, action_id: str, form_data: dict, user=Depends(get_verified_user)
  1341. ):
  1342. try:
  1343. model_item = form_data.pop("model_item", {})
  1344. if model_item.get("direct", False):
  1345. request.state.direct = True
  1346. request.state.model = model_item
  1347. return await chat_action_handler(request, action_id, form_data, user)
  1348. except Exception as e:
  1349. raise HTTPException(
  1350. status_code=status.HTTP_400_BAD_REQUEST,
  1351. detail=str(e),
  1352. )
  1353. @app.post("/api/tasks/stop/{task_id}")
  1354. async def stop_task_endpoint(
  1355. request: Request, task_id: str, user=Depends(get_verified_user)
  1356. ):
  1357. try:
  1358. result = await stop_task(request.app.state.redis, task_id)
  1359. return result
  1360. except ValueError as e:
  1361. raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail=str(e))
  1362. @app.get("/api/tasks")
  1363. async def list_tasks_endpoint(request: Request, user=Depends(get_verified_user)):
  1364. return {"tasks": await list_tasks(request.app.state.redis)}
  @app.get("/api/tasks/chat/{chat_id}")
  async def list_tasks_by_chat_id_endpoint(
      request: Request, chat_id: str, user=Depends(get_verified_user)
  ):
      """Return the task ids registered for ``chat_id``.

      A chat that does not exist or that belongs to another user produces an
      empty list instead of an error.
      """
      chat = Chats.get_chat_by_id(chat_id)
      owned_by_caller = chat is not None and chat.user_id == user.id
      if not owned_by_caller:
          return {"task_ids": []}

      redis = request.app.state.redis
      task_ids = await list_task_ids_by_item_id(redis, chat_id)
      log.debug(f"Task IDs for chat {chat_id}: {task_ids}")
      return {"task_ids": task_ids}
  1375. ##################################
  1376. #
  1377. # Config Endpoints
  1378. #
  1379. ##################################
  @app.get("/api/config")
  async def get_app_config(request: Request):
      """Return the client-facing application configuration.

      The payload always contains the status, name, version, default locale,
      OAuth provider names and the base feature flags. What else is included
      depends on the user resolved from the ``token`` cookie:

      * any resolved user: the extended feature flags;
      * role ``admin`` or ``user``: the full settings block (``admin`` also
        receives ``active_entries``);
      * everyone else: the pending-user overlay texts (role ``pending`` only)
        and, when license metadata is set, the login-page metadata.

      ``onboarding`` is included only when no user was resolved and the user
      count is zero.

      Raises:
          HTTPException: 401 when a ``token`` cookie is present but
              ``decode_token`` raises.
      """
      user = None
      if "token" in request.cookies:
          raw_token = request.cookies.get("token")
          try:
              claims = decode_token(raw_token)
          except Exception as e:
              log.debug(e)
              raise HTTPException(
                  status_code=status.HTTP_401_UNAUTHORIZED,
                  detail="Invalid token",
              )
          if claims is not None and "id" in claims:
              user = Users.get_user_by_id(claims["id"])

      user_count = Users.get_num_users()
      onboarding = user is None and user_count == 0

      settings = app.state.config

      # Flags every caller may see, authenticated or not.
      features = {
          "auth": WEBUI_AUTH,
          "auth_trusted_header": bool(app.state.AUTH_TRUSTED_EMAIL_HEADER),
          "enable_signup_password_confirmation": ENABLE_SIGNUP_PASSWORD_CONFIRMATION,
          "enable_ldap": settings.ENABLE_LDAP,
          "enable_api_key": settings.ENABLE_API_KEY,
          "enable_signup": settings.ENABLE_SIGNUP,
          "enable_login_form": settings.ENABLE_LOGIN_FORM,
          "enable_websocket": ENABLE_WEBSOCKET_SUPPORT,
          "enable_version_update_check": ENABLE_VERSION_UPDATE_CHECK,
      }
      # Flags that are only disclosed once a user has been resolved.
      if user is not None:
          features["enable_direct_connections"] = settings.ENABLE_DIRECT_CONNECTIONS
          features["enable_channels"] = settings.ENABLE_CHANNELS
          features["enable_notes"] = settings.ENABLE_NOTES
          features["enable_web_search"] = settings.ENABLE_WEB_SEARCH
          features["enable_code_execution"] = settings.ENABLE_CODE_EXECUTION
          features["enable_code_interpreter"] = settings.ENABLE_CODE_INTERPRETER
          features["enable_image_generation"] = settings.ENABLE_IMAGE_GENERATION
          features["enable_autocomplete_generation"] = (
              settings.ENABLE_AUTOCOMPLETE_GENERATION
          )
          features["enable_community_sharing"] = settings.ENABLE_COMMUNITY_SHARING
          features["enable_message_rating"] = settings.ENABLE_MESSAGE_RATING
          features["enable_user_webhooks"] = settings.ENABLE_USER_WEBHOOKS
          features["enable_admin_export"] = ENABLE_ADMIN_EXPORT
          features["enable_admin_chat_access"] = ENABLE_ADMIN_CHAT_ACCESS
          features["enable_google_drive_integration"] = (
              settings.ENABLE_GOOGLE_DRIVE_INTEGRATION
          )
          features["enable_onedrive_integration"] = (
              settings.ENABLE_ONEDRIVE_INTEGRATION
          )

      # "onboarding" must stay the first key when present, so seed the payload with it.
      payload = {"onboarding": True} if onboarding else {}
      payload["status"] = True
      payload["name"] = app.state.WEBUI_NAME
      payload["version"] = VERSION
      payload["default_locale"] = str(DEFAULT_LOCALE)
      payload["oauth"] = {
          "providers": {
              provider: details.get("name", provider)
              for provider, details in OAUTH_PROVIDERS.items()
          }
      }
      payload["features"] = features

      if user is not None and user.role in ("admin", "user"):
          payload["default_models"] = settings.DEFAULT_MODELS
          payload["default_prompt_suggestions"] = settings.DEFAULT_PROMPT_SUGGESTIONS
          payload["user_count"] = user_count
          payload["code"] = {"engine": settings.CODE_EXECUTION_ENGINE}
          payload["audio"] = {
              "tts": {
                  "engine": settings.TTS_ENGINE,
                  "voice": settings.TTS_VOICE,
                  "split_on": settings.TTS_SPLIT_ON,
              },
              "stt": {"engine": settings.STT_ENGINE},
          }
          payload["file"] = {
              "max_size": settings.FILE_MAX_SIZE,
              "max_count": settings.FILE_MAX_COUNT,
              "image_compression": {
                  "width": settings.FILE_IMAGE_COMPRESSION_WIDTH,
                  "height": settings.FILE_IMAGE_COMPRESSION_HEIGHT,
              },
          }
          payload["permissions"] = {**settings.USER_PERMISSIONS}
          payload["google_drive"] = {
              "client_id": GOOGLE_DRIVE_CLIENT_ID.value,
              "api_key": GOOGLE_DRIVE_API_KEY.value,
          }
          payload["onedrive"] = {
              "client_id": ONEDRIVE_CLIENT_ID.value,
              "sharepoint_url": ONEDRIVE_SHAREPOINT_URL.value,
              "sharepoint_tenant_id": ONEDRIVE_SHAREPOINT_TENANT_ID.value,
          }
          payload["ui"] = {
              "pending_user_overlay_title": settings.PENDING_USER_OVERLAY_TITLE,
              "pending_user_overlay_content": settings.PENDING_USER_OVERLAY_CONTENT,
              "response_watermark": settings.RESPONSE_WATERMARK,
          }
          payload["license_metadata"] = app.state.LICENSE_METADATA
          if user.role == "admin":
              payload["active_entries"] = app.state.USER_COUNT
      else:
          if user and user.role == "pending":
              payload["ui"] = {
                  "pending_user_overlay_title": settings.PENDING_USER_OVERLAY_TITLE,
                  "pending_user_overlay_content": settings.PENDING_USER_OVERLAY_CONTENT,
              }
          if app.state.LICENSE_METADATA:
              payload["metadata"] = {
                  "login_footer": app.state.LICENSE_METADATA.get("login_footer", ""),
                  "auth_logo_position": app.state.LICENSE_METADATA.get(
                      "auth_logo_position", ""
                  ),
              }

      return payload
  # Request body carrying a single URL; used as the payload type of the
  # POST /api/webhook endpoint.
  class UrlForm(BaseModel):
      url: str  # the URL value submitted by the client
  @app.get("/api/webhook")
  async def get_webhook_url(user=Depends(get_admin_user)):
      """Return the configured webhook URL (guarded by the ``get_admin_user`` dependency)."""
      webhook_url = app.state.config.WEBHOOK_URL
      return {"url": webhook_url}
  @app.post("/api/webhook")
  async def update_webhook_url(form_data: UrlForm, user=Depends(get_admin_user)):
      """Store a new webhook URL and return the value now held in the config.

      The URL is written to ``app.state.config.WEBHOOK_URL`` and then copied
      from there to ``app.state.WEBHOOK_URL`` so both locations agree.
      """
      settings = app.state.config
      settings.WEBHOOK_URL = form_data.url
      # Copy from the config object (not from the form) so the mirror holds
      # exactly what the config reports after the assignment.
      app.state.WEBHOOK_URL = settings.WEBHOOK_URL
      return {"url": settings.WEBHOOK_URL}
  @app.get("/api/version")
  async def get_app_version():
      """Return the running application version as ``{"version": VERSION}``."""
      return {"version": VERSION}
  @app.get("/api/version/updates")
  async def get_app_latest_release_version(user=Depends(get_verified_user)):
      """Return the current version and the latest released version.

      When ``ENABLE_VERSION_UPDATE_CHECK`` is false no request is made and the
      current version is reported as the latest. Otherwise the latest release
      is fetched from the GitHub API with a one-second total timeout. Any
      failure (network, HTTP status, unexpected payload) is logged at debug
      level and answered with the current version, so this endpoint never
      fails because of the upstream lookup.

      Returns:
          dict: ``{"current": <running version>, "latest": <latest version>}``.
      """
      if not ENABLE_VERSION_UPDATE_CHECK:
          log.debug(
              "Version update check is disabled, returning current version as latest version"
          )
          return {"current": VERSION, "latest": VERSION}
      try:
          timeout = aiohttp.ClientTimeout(total=1)
          async with aiohttp.ClientSession(timeout=timeout, trust_env=True) as session:
              async with session.get(
                  "https://api.github.com/repos/open-webui/open-webui/releases/latest",
                  ssl=AIOHTTP_CLIENT_SESSION_SSL,
              ) as response:
                  response.raise_for_status()
                  data = await response.json()
                  tag_name = data["tag_name"]
                  # Strip the leading "v" only when it is actually there, so a
                  # tag published without the prefix is not truncated.
                  latest_version = (
                      tag_name[1:] if tag_name.startswith("v") else tag_name
                  )
                  return {"current": VERSION, "latest": latest_version}
      except Exception as e:
          log.debug(e)
          return {"current": VERSION, "latest": VERSION}
  @app.get("/api/changelog")
  async def get_app_changelog():
      """Return the first five entries of ``CHANGELOG`` in iteration order."""
      leading_keys = list(CHANGELOG)[:5]
      return {key: CHANGELOG[key] for key in leading_keys}
  @app.get("/api/usage")
  async def get_current_usage(user=Depends(get_verified_user)):
      """
      Get current usage statistics for Open WebUI.
      This is an experimental endpoint and subject to change.

      Returns the results of ``get_models_in_use()`` and
      ``get_active_user_ids()`` under ``model_ids`` and ``user_ids``. Any
      failure is logged and reported as a generic HTTP 500.
      """
      try:
          models_in_use = get_models_in_use()
          active_user_ids = get_active_user_ids()
          return {"model_ids": models_in_use, "user_ids": active_user_ids}
      except Exception as e:
          log.error(f"Error getting usage statistics: {e}")
          raise HTTPException(status_code=500, detail="Internal Server Error")
  1574. ############################
  1575. # OAuth Login & Callback
  1576. ############################
  1577. # SessionMiddleware is used by authlib for oauth
  # Register the session middleware only when at least one OAuth provider is
  # configured; without providers no session cookie is needed.
  if OAUTH_PROVIDERS:
      app.add_middleware(
          SessionMiddleware,
          secret_key=WEBUI_SECRET_KEY,
          session_cookie="oui-session",
          same_site=WEBUI_SESSION_COOKIE_SAME_SITE,
          https_only=WEBUI_SESSION_COOKIE_SECURE,
      )
  @app.get("/oauth/{provider}/login")
  async def oauth_login(provider: str, request: Request):
      """Hand the login request for ``provider`` to ``oauth_manager.handle_login``."""
      login_response = await oauth_manager.handle_login(request, provider)
      return login_response
  1589. # OAuth login logic is as follows:
  1590. # 1. Attempt to find a user with matching subject ID, tied to the provider
  1591. # 2. If OAUTH_MERGE_ACCOUNTS_BY_EMAIL is true, find a user with the email address provided via OAuth
  1592. # - This is considered insecure in general, as OAuth providers do not always verify email addresses
  1593. # 3. If there is no user, and ENABLE_OAUTH_SIGNUP is true, create a user
  1594. # - Email addresses are considered unique, so we fail registration if the email address is already taken
  @app.get("/oauth/{provider}/callback")
  async def oauth_callback(provider: str, request: Request, response: Response):
      """Hand the callback for ``provider`` to ``oauth_manager.handle_callback``."""
      callback_result = await oauth_manager.handle_callback(request, provider, response)
      return callback_result
  @app.get("/manifest.json")
  async def get_manifest_json():
      """Return the PWA manifest.

      When ``app.state.EXTERNAL_PWA_MANIFEST_URL`` is set, the manifest is
      downloaded from that URL and its JSON body is returned as-is. Otherwise
      a built-in manifest derived from ``app.state.WEBUI_NAME`` is returned.

      The download uses the synchronous ``requests`` client, so it is run in
      the default executor to keep the event loop free, and it carries a
      timeout so an unresponsive host cannot hang the request forever.
      Download or JSON decoding errors propagate to the caller.
      """
      external_manifest_url = app.state.EXTERNAL_PWA_MANIFEST_URL
      if external_manifest_url:
          import asyncio
          from functools import partial

          # Seconds allowed for connecting to and reading from the external host.
          fetch_timeout = 10
          fetch_manifest = partial(
              requests.get, external_manifest_url, timeout=fetch_timeout
          )
          loop = asyncio.get_running_loop()
          upstream = await loop.run_in_executor(None, fetch_manifest)
          return upstream.json()

      return {
          "name": app.state.WEBUI_NAME,
          "short_name": app.state.WEBUI_NAME,
          "description": f"{app.state.WEBUI_NAME} is an open, extensible, user-friendly interface for AI that adapts to your workflow.",
          "start_url": "/",
          "display": "standalone",
          "background_color": "#343541",
          "icons": [
              {
                  "src": "/static/logo.png",
                  "type": "image/png",
                  "sizes": "500x500",
                  "purpose": "any",
              },
              {
                  "src": "/static/logo.png",
                  "type": "image/png",
                  "sizes": "500x500",
                  "purpose": "maskable",
              },
          ],
      }
  @app.get("/opensearch.xml")
  async def get_opensearch_xml():
      """Return the OpenSearch description document for this instance.

      The document is built from ``app.state.WEBUI_NAME`` and
      ``app.state.config.WEBUI_URL``. Both values are XML-escaped before
      interpolation so that characters such as ``&``, ``<`` or ``"`` in the
      configured name or URL cannot produce a malformed document.

      Returns:
          Response: the XML text with media type ``application/xml``.
      """
      from xml.sax.saxutils import escape

      name = escape(str(app.state.WEBUI_NAME))
      # The URL is also placed inside a double-quoted attribute, so quotes
      # are escaped in addition to the default &, < and >.
      base_url = escape(str(app.state.config.WEBUI_URL), {'"': "&quot;"})

      # "{{searchTerms}}" renders as the literal OpenSearch placeholder {searchTerms}.
      xml_content = f"""
      <OpenSearchDescription xmlns="http://a9.com/-/spec/opensearch/1.1/" xmlns:moz="http://www.mozilla.org/2006/browser/search/">
      <ShortName>{name}</ShortName>
      <Description>Search {name}</Description>
      <InputEncoding>UTF-8</InputEncoding>
      <Image width="16" height="16" type="image/x-icon">{base_url}/static/favicon.png</Image>
      <Url type="text/html" method="get" template="{base_url}/?q={{searchTerms}}"/>
      <moz:SearchForm>{base_url}</moz:SearchForm>
      </OpenSearchDescription>
      """
      return Response(content=xml_content, media_type="application/xml")
  @app.get("/health")
  async def healthcheck():
      """Return a constant ``{"status": True}`` without checking any dependency."""
      return {"status": True}
  @app.get("/health/db")
  async def healthcheck_with_db():
      """Run ``SELECT 1;`` through ``Session`` and report success.

      Any error raised by the query propagates, so a ``{"status": True}``
      answer means the statement executed and its rows were fetched.
      """
      probe = Session.execute(text("SELECT 1;"))
      probe.all()
      return {"status": True}
  # Serve the files under STATIC_DIR at the /static URL prefix.
  app.mount("/static", StaticFiles(directory=STATIC_DIR), name="static")
  @app.get("/cache/{path:path}")
  async def serve_cache_file(
      path: str,
      user=Depends(get_verified_user),
  ):
      """Serve a file stored under ``CACHE_DIR``.

      Args:
          path: location of the file relative to ``CACHE_DIR``.

      Returns:
          FileResponse: the requested file.

      Raises:
          HTTPException: 404 when the resolved path falls outside
              ``CACHE_DIR`` or does not point to a regular file.
      """
      cache_root = os.path.abspath(CACHE_DIR)
      file_path = os.path.abspath(os.path.join(cache_root, path))

      # Prevent path traversal. Compare whole path components: a plain string
      # prefix test would also accept sibling directories whose name merely
      # starts with the cache directory's name (e.g. "<cache>_backup").
      try:
          inside_cache = os.path.commonpath([cache_root, file_path]) == cache_root
      except ValueError:
          # Raised when the two paths cannot share a root (e.g. different drives).
          inside_cache = False

      if not inside_cache or not os.path.isfile(file_path):
          raise HTTPException(status_code=404, detail="File not found")

      return FileResponse(file_path)
  def swagger_ui_html(*args, **kwargs):
      """Call ``get_swagger_ui_html`` with the asset URLs under ``/static/swagger-ui``.

      All positional and keyword arguments are forwarded unchanged; the
      script, stylesheet and favicon URLs are added as keyword arguments.
      """
      local_assets = {
          "swagger_js_url": "/static/swagger-ui/swagger-ui-bundle.js",
          "swagger_css_url": "/static/swagger-ui/swagger-ui.css",
          "swagger_favicon_url": "/static/swagger-ui/favicon.png",
      }
      return get_swagger_ui_html(*args, **kwargs, **local_assets)


  # Replace the helper on the `applications` module with the wrapper above.
  applications.get_swagger_ui_html = swagger_ui_html
  # Mount the built frontend at "/" when it exists; otherwise only the API is served.
  if not os.path.exists(FRONTEND_BUILD_DIR):
      log.warning(
          f"Frontend build directory not found at '{FRONTEND_BUILD_DIR}'. Serving API only."
      )
  else:
      # Register .js as text/javascript before the static app starts serving files.
      mimetypes.add_type("text/javascript", ".js")
      app.mount(
          "/",
          SPAStaticFiles(directory=FRONTEND_BUILD_DIR, html=True),
          name="spa-static-files",
      )