# openai.py - Open WebUI router for OpenAI-compatible API backends.
  1. import asyncio
  2. import hashlib
  3. import json
  4. import logging
  5. from typing import Optional
  6. import aiohttp
  7. from aiocache import cached
  8. import requests
  9. from urllib.parse import quote
  10. from azure.identity import DefaultAzureCredential, get_bearer_token_provider
  11. from fastapi import Depends, HTTPException, Request, APIRouter
  12. from fastapi.responses import (
  13. FileResponse,
  14. StreamingResponse,
  15. JSONResponse,
  16. PlainTextResponse,
  17. )
  18. from pydantic import BaseModel
  19. from starlette.background import BackgroundTask
  20. from open_webui.models.models import Models
  21. from open_webui.config import (
  22. CACHE_DIR,
  23. )
  24. from open_webui.env import (
  25. MODELS_CACHE_TTL,
  26. AIOHTTP_CLIENT_SESSION_SSL,
  27. AIOHTTP_CLIENT_TIMEOUT,
  28. AIOHTTP_CLIENT_TIMEOUT_MODEL_LIST,
  29. ENABLE_FORWARD_USER_INFO_HEADERS,
  30. BYPASS_MODEL_ACCESS_CONTROL,
  31. )
  32. from open_webui.models.users import UserModel
  33. from open_webui.constants import ERROR_MESSAGES
  34. from open_webui.env import SRC_LOG_LEVELS
  35. from open_webui.utils.payload import (
  36. apply_model_params_to_body_openai,
  37. apply_system_prompt_to_body,
  38. )
  39. from open_webui.utils.misc import (
  40. convert_logit_bias_input_to_json,
  41. )
  42. from open_webui.utils.auth import get_admin_user, get_verified_user
  43. from open_webui.utils.access_control import has_access
# Module-level logger; its level is taken from the "OPENAI" entry of SRC_LOG_LEVELS.
log = logging.getLogger(__name__)
log.setLevel(SRC_LOG_LEVELS["OPENAI"])
  46. ##########################################
  47. #
  48. # Utility functions
  49. #
  50. ##########################################
  51. async def send_get_request(url, key=None, user: UserModel = None):
  52. timeout = aiohttp.ClientTimeout(total=AIOHTTP_CLIENT_TIMEOUT_MODEL_LIST)
  53. try:
  54. async with aiohttp.ClientSession(timeout=timeout, trust_env=True) as session:
  55. async with session.get(
  56. url,
  57. headers={
  58. **({"Authorization": f"Bearer {key}"} if key else {}),
  59. **(
  60. {
  61. "X-OpenWebUI-User-Name": quote(user.name, safe=" "),
  62. "X-OpenWebUI-User-Id": user.id,
  63. "X-OpenWebUI-User-Email": user.email,
  64. "X-OpenWebUI-User-Role": user.role,
  65. }
  66. if ENABLE_FORWARD_USER_INFO_HEADERS and user
  67. else {}
  68. ),
  69. },
  70. ssl=AIOHTTP_CLIENT_SESSION_SSL,
  71. ) as response:
  72. return await response.json()
  73. except Exception as e:
  74. # Handle connection error here
  75. log.error(f"Connection error: {e}")
  76. return None
  77. async def cleanup_response(
  78. response: Optional[aiohttp.ClientResponse],
  79. session: Optional[aiohttp.ClientSession],
  80. ):
  81. if response:
  82. response.close()
  83. if session:
  84. await session.close()
  85. def openai_reasoning_model_handler(payload):
  86. """
  87. Handle reasoning model specific parameters
  88. """
  89. if "max_tokens" in payload:
  90. # Convert "max_tokens" to "max_completion_tokens" for all reasoning models
  91. payload["max_completion_tokens"] = payload["max_tokens"]
  92. del payload["max_tokens"]
  93. # Handle system role conversion based on model type
  94. if payload["messages"][0]["role"] == "system":
  95. model_lower = payload["model"].lower()
  96. # Legacy models use "user" role instead of "system"
  97. if model_lower.startswith("o1-mini") or model_lower.startswith("o1-preview"):
  98. payload["messages"][0]["role"] = "user"
  99. else:
  100. payload["messages"][0]["role"] = "developer"
  101. return payload
  102. async def get_headers_and_cookies(
  103. request: Request,
  104. url,
  105. key=None,
  106. config=None,
  107. metadata: Optional[dict] = None,
  108. user: UserModel = None,
  109. ):
  110. cookies = {}
  111. headers = {
  112. "Content-Type": "application/json",
  113. **(
  114. {
  115. "HTTP-Referer": "https://openwebui.com/",
  116. "X-Title": "Open WebUI",
  117. }
  118. if "openrouter.ai" in url
  119. else {}
  120. ),
  121. **(
  122. {
  123. "X-OpenWebUI-User-Name": quote(user.name, safe=" "),
  124. "X-OpenWebUI-User-Id": user.id,
  125. "X-OpenWebUI-User-Email": user.email,
  126. "X-OpenWebUI-User-Role": user.role,
  127. **(
  128. {"X-OpenWebUI-Chat-Id": metadata.get("chat_id")}
  129. if metadata and metadata.get("chat_id")
  130. else {}
  131. ),
  132. }
  133. if ENABLE_FORWARD_USER_INFO_HEADERS
  134. else {}
  135. ),
  136. }
  137. token = None
  138. auth_type = config.get("auth_type")
  139. if auth_type == "bearer" or auth_type is None:
  140. # Default to bearer if not specified
  141. token = f"{key}"
  142. elif auth_type == "none":
  143. token = None
  144. elif auth_type == "session":
  145. cookies = request.cookies
  146. token = request.state.token.credentials
  147. elif auth_type == "system_oauth":
  148. cookies = request.cookies
  149. oauth_token = None
  150. try:
  151. if request.cookies.get("oauth_session_id", None):
  152. oauth_token = await request.app.state.oauth_manager.get_oauth_token(
  153. user.id,
  154. request.cookies.get("oauth_session_id", None),
  155. )
  156. except Exception as e:
  157. log.error(f"Error getting OAuth token: {e}")
  158. if oauth_token:
  159. token = f"{oauth_token.get('access_token', '')}"
  160. elif auth_type in ("azure_ad", "microsoft_entra_id"):
  161. token = get_microsoft_entra_id_access_token()
  162. if token:
  163. headers["Authorization"] = f"Bearer {token}"
  164. if config.get("headers") and isinstance(config.get("headers"), dict):
  165. headers = {**headers, **config.get("headers")}
  166. return headers, cookies
  167. def get_microsoft_entra_id_access_token():
  168. """
  169. Get Microsoft Entra ID access token using DefaultAzureCredential for Azure OpenAI.
  170. Returns the token string or None if authentication fails.
  171. """
  172. try:
  173. token_provider = get_bearer_token_provider(
  174. DefaultAzureCredential(), "https://cognitiveservices.azure.com/.default"
  175. )
  176. return token_provider()
  177. except Exception as e:
  178. log.error(f"Error getting Microsoft Entra ID access token: {e}")
  179. return None
  180. ##########################################
  181. #
  182. # API routes
  183. #
  184. ##########################################
# Router that every endpoint in this module is registered on.
router = APIRouter()
  186. @router.get("/config")
  187. async def get_config(request: Request, user=Depends(get_admin_user)):
  188. return {
  189. "ENABLE_OPENAI_API": request.app.state.config.ENABLE_OPENAI_API,
  190. "OPENAI_API_BASE_URLS": request.app.state.config.OPENAI_API_BASE_URLS,
  191. "OPENAI_API_KEYS": request.app.state.config.OPENAI_API_KEYS,
  192. "OPENAI_API_CONFIGS": request.app.state.config.OPENAI_API_CONFIGS,
  193. }
class OpenAIConfigForm(BaseModel):
    """Request body accepted by the ``/config/update`` endpoint."""

    # Stored as-is by update_config (None is written through unchanged).
    ENABLE_OPENAI_API: Optional[bool] = None
    # Base URLs; a connection is identified by its position in this list.
    OPENAI_API_BASE_URLS: list[str]
    # API keys, matched to the URLs by position.
    OPENAI_API_KEYS: list[str]
    # Per-connection settings; update_config keeps only keys that are the
    # string form of a valid URL index.
    OPENAI_API_CONFIGS: dict
  199. @router.post("/config/update")
  200. async def update_config(
  201. request: Request, form_data: OpenAIConfigForm, user=Depends(get_admin_user)
  202. ):
  203. request.app.state.config.ENABLE_OPENAI_API = form_data.ENABLE_OPENAI_API
  204. request.app.state.config.OPENAI_API_BASE_URLS = form_data.OPENAI_API_BASE_URLS
  205. request.app.state.config.OPENAI_API_KEYS = form_data.OPENAI_API_KEYS
  206. # Check if API KEYS length is same than API URLS length
  207. if len(request.app.state.config.OPENAI_API_KEYS) != len(
  208. request.app.state.config.OPENAI_API_BASE_URLS
  209. ):
  210. if len(request.app.state.config.OPENAI_API_KEYS) > len(
  211. request.app.state.config.OPENAI_API_BASE_URLS
  212. ):
  213. request.app.state.config.OPENAI_API_KEYS = (
  214. request.app.state.config.OPENAI_API_KEYS[
  215. : len(request.app.state.config.OPENAI_API_BASE_URLS)
  216. ]
  217. )
  218. else:
  219. request.app.state.config.OPENAI_API_KEYS += [""] * (
  220. len(request.app.state.config.OPENAI_API_BASE_URLS)
  221. - len(request.app.state.config.OPENAI_API_KEYS)
  222. )
  223. request.app.state.config.OPENAI_API_CONFIGS = form_data.OPENAI_API_CONFIGS
  224. # Remove the API configs that are not in the API URLS
  225. keys = list(map(str, range(len(request.app.state.config.OPENAI_API_BASE_URLS))))
  226. request.app.state.config.OPENAI_API_CONFIGS = {
  227. key: value
  228. for key, value in request.app.state.config.OPENAI_API_CONFIGS.items()
  229. if key in keys
  230. }
  231. return {
  232. "ENABLE_OPENAI_API": request.app.state.config.ENABLE_OPENAI_API,
  233. "OPENAI_API_BASE_URLS": request.app.state.config.OPENAI_API_BASE_URLS,
  234. "OPENAI_API_KEYS": request.app.state.config.OPENAI_API_KEYS,
  235. "OPENAI_API_CONFIGS": request.app.state.config.OPENAI_API_CONFIGS,
  236. }
  237. @router.post("/audio/speech")
  238. async def speech(request: Request, user=Depends(get_verified_user)):
  239. idx = None
  240. try:
  241. idx = request.app.state.config.OPENAI_API_BASE_URLS.index(
  242. "https://api.openai.com/v1"
  243. )
  244. body = await request.body()
  245. name = hashlib.sha256(body).hexdigest()
  246. SPEECH_CACHE_DIR = CACHE_DIR / "audio" / "speech"
  247. SPEECH_CACHE_DIR.mkdir(parents=True, exist_ok=True)
  248. file_path = SPEECH_CACHE_DIR.joinpath(f"{name}.mp3")
  249. file_body_path = SPEECH_CACHE_DIR.joinpath(f"{name}.json")
  250. # Check if the file already exists in the cache
  251. if file_path.is_file():
  252. return FileResponse(file_path)
  253. url = request.app.state.config.OPENAI_API_BASE_URLS[idx]
  254. key = request.app.state.config.OPENAI_API_KEYS[idx]
  255. api_config = request.app.state.config.OPENAI_API_CONFIGS.get(
  256. str(idx),
  257. request.app.state.config.OPENAI_API_CONFIGS.get(url, {}), # Legacy support
  258. )
  259. headers, cookies = await get_headers_and_cookies(
  260. request, url, key, api_config, user=user
  261. )
  262. r = None
  263. try:
  264. r = requests.post(
  265. url=f"{url}/audio/speech",
  266. data=body,
  267. headers=headers,
  268. cookies=cookies,
  269. stream=True,
  270. )
  271. r.raise_for_status()
  272. # Save the streaming content to a file
  273. with open(file_path, "wb") as f:
  274. for chunk in r.iter_content(chunk_size=8192):
  275. f.write(chunk)
  276. with open(file_body_path, "w") as f:
  277. json.dump(json.loads(body.decode("utf-8")), f)
  278. # Return the saved file
  279. return FileResponse(file_path)
  280. except Exception as e:
  281. log.exception(e)
  282. detail = None
  283. if r is not None:
  284. try:
  285. res = r.json()
  286. if "error" in res:
  287. detail = f"External: {res['error']}"
  288. except Exception:
  289. detail = f"External: {e}"
  290. raise HTTPException(
  291. status_code=r.status_code if r else 500,
  292. detail=detail if detail else "Open WebUI: Server Connection Error",
  293. )
  294. except ValueError:
  295. raise HTTPException(status_code=401, detail=ERROR_MESSAGES.OPENAI_NOT_FOUND)
  296. async def get_all_models_responses(request: Request, user: UserModel) -> list:
  297. if not request.app.state.config.ENABLE_OPENAI_API:
  298. return []
  299. # Check if API KEYS length is same than API URLS length
  300. num_urls = len(request.app.state.config.OPENAI_API_BASE_URLS)
  301. num_keys = len(request.app.state.config.OPENAI_API_KEYS)
  302. if num_keys != num_urls:
  303. # if there are more keys than urls, remove the extra keys
  304. if num_keys > num_urls:
  305. new_keys = request.app.state.config.OPENAI_API_KEYS[:num_urls]
  306. request.app.state.config.OPENAI_API_KEYS = new_keys
  307. # if there are more urls than keys, add empty keys
  308. else:
  309. request.app.state.config.OPENAI_API_KEYS += [""] * (num_urls - num_keys)
  310. request_tasks = []
  311. for idx, url in enumerate(request.app.state.config.OPENAI_API_BASE_URLS):
  312. if (str(idx) not in request.app.state.config.OPENAI_API_CONFIGS) and (
  313. url not in request.app.state.config.OPENAI_API_CONFIGS # Legacy support
  314. ):
  315. request_tasks.append(
  316. send_get_request(
  317. f"{url}/models",
  318. request.app.state.config.OPENAI_API_KEYS[idx],
  319. user=user,
  320. )
  321. )
  322. else:
  323. api_config = request.app.state.config.OPENAI_API_CONFIGS.get(
  324. str(idx),
  325. request.app.state.config.OPENAI_API_CONFIGS.get(
  326. url, {}
  327. ), # Legacy support
  328. )
  329. enable = api_config.get("enable", True)
  330. model_ids = api_config.get("model_ids", [])
  331. if enable:
  332. if len(model_ids) == 0:
  333. request_tasks.append(
  334. send_get_request(
  335. f"{url}/models",
  336. request.app.state.config.OPENAI_API_KEYS[idx],
  337. user=user,
  338. )
  339. )
  340. else:
  341. model_list = {
  342. "object": "list",
  343. "data": [
  344. {
  345. "id": model_id,
  346. "name": model_id,
  347. "owned_by": "openai",
  348. "openai": {"id": model_id},
  349. "urlIdx": idx,
  350. }
  351. for model_id in model_ids
  352. ],
  353. }
  354. request_tasks.append(
  355. asyncio.ensure_future(asyncio.sleep(0, model_list))
  356. )
  357. else:
  358. request_tasks.append(asyncio.ensure_future(asyncio.sleep(0, None)))
  359. responses = await asyncio.gather(*request_tasks)
  360. for idx, response in enumerate(responses):
  361. if response:
  362. url = request.app.state.config.OPENAI_API_BASE_URLS[idx]
  363. api_config = request.app.state.config.OPENAI_API_CONFIGS.get(
  364. str(idx),
  365. request.app.state.config.OPENAI_API_CONFIGS.get(
  366. url, {}
  367. ), # Legacy support
  368. )
  369. connection_type = api_config.get("connection_type", "external")
  370. prefix_id = api_config.get("prefix_id", None)
  371. tags = api_config.get("tags", [])
  372. model_list = (
  373. response if isinstance(response, list) else response.get("data", [])
  374. )
  375. if not isinstance(model_list, list):
  376. # Catch non-list responses
  377. model_list = []
  378. for model in model_list:
  379. # Remove name key if its value is None #16689
  380. if "name" in model and model["name"] is None:
  381. del model["name"]
  382. if prefix_id:
  383. model["id"] = (
  384. f"{prefix_id}.{model.get('id', model.get('name', ''))}"
  385. )
  386. if tags:
  387. model["tags"] = tags
  388. if connection_type:
  389. model["connection_type"] = connection_type
  390. log.debug(f"get_all_models:responses() {responses}")
  391. return responses
  392. async def get_filtered_models(models, user):
  393. # Filter models based on user access control
  394. filtered_models = []
  395. for model in models.get("data", []):
  396. model_info = Models.get_model_by_id(model["id"])
  397. if model_info:
  398. if user.id == model_info.user_id or has_access(
  399. user.id, type="read", access_control=model_info.access_control
  400. ):
  401. filtered_models.append(model)
  402. return filtered_models
  403. @cached(
  404. ttl=MODELS_CACHE_TTL,
  405. key=lambda _, user: f"openai_all_models_{user.id}" if user else "openai_all_models",
  406. )
  407. async def get_all_models(request: Request, user: UserModel) -> dict[str, list]:
  408. log.info("get_all_models()")
  409. if not request.app.state.config.ENABLE_OPENAI_API:
  410. return {"data": []}
  411. responses = await get_all_models_responses(request, user=user)
  412. def extract_data(response):
  413. if response and "data" in response:
  414. return response["data"]
  415. if isinstance(response, list):
  416. return response
  417. return None
  418. def is_supported_openai_models(model_id):
  419. if any(
  420. name in model_id
  421. for name in [
  422. "babbage",
  423. "dall-e",
  424. "davinci",
  425. "embedding",
  426. "tts",
  427. "whisper",
  428. ]
  429. ):
  430. return False
  431. return True
  432. def get_merged_models(model_lists):
  433. log.debug(f"merge_models_lists {model_lists}")
  434. models = {}
  435. for idx, model_list in enumerate(model_lists):
  436. if model_list is not None and "error" not in model_list:
  437. for model in model_list:
  438. model_id = model.get("id") or model.get("name")
  439. if (
  440. "api.openai.com"
  441. in request.app.state.config.OPENAI_API_BASE_URLS[idx]
  442. and not is_supported_openai_models(model_id)
  443. ):
  444. # Skip unwanted OpenAI models
  445. continue
  446. if model_id and model_id not in models:
  447. models[model_id] = {
  448. **model,
  449. "name": model.get("name", model_id),
  450. "owned_by": "openai",
  451. "openai": model,
  452. "connection_type": model.get("connection_type", "external"),
  453. "urlIdx": idx,
  454. }
  455. return models
  456. models = get_merged_models(map(extract_data, responses))
  457. log.debug(f"models: {models}")
  458. request.app.state.OPENAI_MODELS = models
  459. return {"data": list(models.values())}
  460. @router.get("/models")
  461. @router.get("/models/{url_idx}")
  462. async def get_models(
  463. request: Request, url_idx: Optional[int] = None, user=Depends(get_verified_user)
  464. ):
  465. models = {
  466. "data": [],
  467. }
  468. if url_idx is None:
  469. models = await get_all_models(request, user=user)
  470. else:
  471. url = request.app.state.config.OPENAI_API_BASE_URLS[url_idx]
  472. key = request.app.state.config.OPENAI_API_KEYS[url_idx]
  473. api_config = request.app.state.config.OPENAI_API_CONFIGS.get(
  474. str(url_idx),
  475. request.app.state.config.OPENAI_API_CONFIGS.get(url, {}), # Legacy support
  476. )
  477. r = None
  478. async with aiohttp.ClientSession(
  479. trust_env=True,
  480. timeout=aiohttp.ClientTimeout(total=AIOHTTP_CLIENT_TIMEOUT_MODEL_LIST),
  481. ) as session:
  482. try:
  483. headers, cookies = await get_headers_and_cookies(
  484. request, url, key, api_config, user=user
  485. )
  486. if api_config.get("azure", False):
  487. models = {
  488. "data": api_config.get("model_ids", []) or [],
  489. "object": "list",
  490. }
  491. else:
  492. async with session.get(
  493. f"{url}/models",
  494. headers=headers,
  495. cookies=cookies,
  496. ssl=AIOHTTP_CLIENT_SESSION_SSL,
  497. ) as r:
  498. if r.status != 200:
  499. # Extract response error details if available
  500. error_detail = f"HTTP Error: {r.status}"
  501. res = await r.json()
  502. if "error" in res:
  503. error_detail = f"External Error: {res['error']}"
  504. raise Exception(error_detail)
  505. response_data = await r.json()
  506. # Check if we're calling OpenAI API based on the URL
  507. if "api.openai.com" in url:
  508. # Filter models according to the specified conditions
  509. response_data["data"] = [
  510. model
  511. for model in response_data.get("data", [])
  512. if not any(
  513. name in model["id"]
  514. for name in [
  515. "babbage",
  516. "dall-e",
  517. "davinci",
  518. "embedding",
  519. "tts",
  520. "whisper",
  521. ]
  522. )
  523. ]
  524. models = response_data
  525. except aiohttp.ClientError as e:
  526. # ClientError covers all aiohttp requests issues
  527. log.exception(f"Client error: {str(e)}")
  528. raise HTTPException(
  529. status_code=500, detail="Open WebUI: Server Connection Error"
  530. )
  531. except Exception as e:
  532. log.exception(f"Unexpected error: {e}")
  533. error_detail = f"Unexpected error: {str(e)}"
  534. raise HTTPException(status_code=500, detail=error_detail)
  535. if user.role == "user" and not BYPASS_MODEL_ACCESS_CONTROL:
  536. models["data"] = await get_filtered_models(models, user)
  537. return models
class ConnectionVerificationForm(BaseModel):
    """Request body accepted by the ``/verify`` endpoint."""

    # Base URL of the connection to probe.
    url: str
    # API key passed on to the header builder (and used as ``api-key`` for Azure).
    key: str
    # Optional connection settings; verify_connection treats None as {}.
    config: Optional[dict] = None
  542. @router.post("/verify")
  543. async def verify_connection(
  544. request: Request,
  545. form_data: ConnectionVerificationForm,
  546. user=Depends(get_admin_user),
  547. ):
  548. url = form_data.url
  549. key = form_data.key
  550. api_config = form_data.config or {}
  551. async with aiohttp.ClientSession(
  552. trust_env=True,
  553. timeout=aiohttp.ClientTimeout(total=AIOHTTP_CLIENT_TIMEOUT_MODEL_LIST),
  554. ) as session:
  555. try:
  556. headers, cookies = await get_headers_and_cookies(
  557. request, url, key, api_config, user=user
  558. )
  559. if api_config.get("azure", False):
  560. # Only set api-key header if not using Azure Entra ID authentication
  561. auth_type = api_config.get("auth_type", "bearer")
  562. if auth_type not in ("azure_ad", "microsoft_entra_id"):
  563. headers["api-key"] = key
  564. api_version = api_config.get("api_version", "") or "2023-03-15-preview"
  565. async with session.get(
  566. url=f"{url}/openai/models?api-version={api_version}",
  567. headers=headers,
  568. cookies=cookies,
  569. ssl=AIOHTTP_CLIENT_SESSION_SSL,
  570. ) as r:
  571. try:
  572. response_data = await r.json()
  573. except Exception:
  574. response_data = await r.text()
  575. if r.status != 200:
  576. if isinstance(response_data, (dict, list)):
  577. return JSONResponse(
  578. status_code=r.status, content=response_data
  579. )
  580. else:
  581. return PlainTextResponse(
  582. status_code=r.status, content=response_data
  583. )
  584. return response_data
  585. else:
  586. async with session.get(
  587. f"{url}/models",
  588. headers=headers,
  589. cookies=cookies,
  590. ssl=AIOHTTP_CLIENT_SESSION_SSL,
  591. ) as r:
  592. try:
  593. response_data = await r.json()
  594. except Exception:
  595. response_data = await r.text()
  596. if r.status != 200:
  597. if isinstance(response_data, (dict, list)):
  598. return JSONResponse(
  599. status_code=r.status, content=response_data
  600. )
  601. else:
  602. return PlainTextResponse(
  603. status_code=r.status, content=response_data
  604. )
  605. return response_data
  606. except aiohttp.ClientError as e:
  607. # ClientError covers all aiohttp requests issues
  608. log.exception(f"Client error: {str(e)}")
  609. raise HTTPException(
  610. status_code=500, detail="Open WebUI: Server Connection Error"
  611. )
  612. except Exception as e:
  613. log.exception(f"Unexpected error: {e}")
  614. raise HTTPException(
  615. status_code=500, detail="Open WebUI: Server Connection Error"
  616. )
  617. def get_azure_allowed_params(api_version: str) -> set[str]:
  618. allowed_params = {
  619. "messages",
  620. "temperature",
  621. "role",
  622. "content",
  623. "contentPart",
  624. "contentPartImage",
  625. "enhancements",
  626. "dataSources",
  627. "n",
  628. "stream",
  629. "stop",
  630. "max_tokens",
  631. "presence_penalty",
  632. "frequency_penalty",
  633. "logit_bias",
  634. "user",
  635. "function_call",
  636. "functions",
  637. "tools",
  638. "tool_choice",
  639. "top_p",
  640. "log_probs",
  641. "top_logprobs",
  642. "response_format",
  643. "seed",
  644. "max_completion_tokens",
  645. }
  646. try:
  647. if api_version >= "2024-09-01-preview":
  648. allowed_params.add("stream_options")
  649. except ValueError:
  650. log.debug(
  651. f"Invalid API version {api_version} for Azure OpenAI. Defaulting to allowed parameters."
  652. )
  653. return allowed_params
  654. def is_openai_reasoning_model(model: str) -> bool:
  655. return model.lower().startswith(("o1", "o3", "o4", "gpt-5"))
  656. def convert_to_azure_payload(url, payload: dict, api_version: str):
  657. model = payload.get("model", "")
  658. # Filter allowed parameters based on Azure OpenAI API
  659. allowed_params = get_azure_allowed_params(api_version)
  660. # Special handling for o-series models
  661. if is_openai_reasoning_model(model):
  662. # Convert max_tokens to max_completion_tokens for o-series models
  663. if "max_tokens" in payload:
  664. payload["max_completion_tokens"] = payload["max_tokens"]
  665. del payload["max_tokens"]
  666. # Remove temperature if not 1 for o-series models
  667. if "temperature" in payload and payload["temperature"] != 1:
  668. log.debug(
  669. f"Removing temperature parameter for o-series model {model} as only default value (1) is supported"
  670. )
  671. del payload["temperature"]
  672. # Filter out unsupported parameters
  673. payload = {k: v for k, v in payload.items() if k in allowed_params}
  674. url = f"{url}/openai/deployments/{model}"
  675. return url, payload
  676. @router.post("/chat/completions")
  677. async def generate_chat_completion(
  678. request: Request,
  679. form_data: dict,
  680. user=Depends(get_verified_user),
  681. bypass_filter: Optional[bool] = False,
  682. ):
  683. if BYPASS_MODEL_ACCESS_CONTROL:
  684. bypass_filter = True
  685. idx = 0
  686. payload = {**form_data}
  687. metadata = payload.pop("metadata", None)
  688. model_id = form_data.get("model")
  689. model_info = Models.get_model_by_id(model_id)
  690. # Check model info and override the payload
  691. if model_info:
  692. if model_info.base_model_id:
  693. payload["model"] = model_info.base_model_id
  694. model_id = model_info.base_model_id
  695. params = model_info.params.model_dump()
  696. if params:
  697. system = params.pop("system", None)
  698. payload = apply_model_params_to_body_openai(params, payload)
  699. payload = apply_system_prompt_to_body(system, payload, metadata, user)
  700. # Check if user has access to the model
  701. if not bypass_filter and user.role == "user":
  702. if not (
  703. user.id == model_info.user_id
  704. or has_access(
  705. user.id, type="read", access_control=model_info.access_control
  706. )
  707. ):
  708. raise HTTPException(
  709. status_code=403,
  710. detail="Model not found",
  711. )
  712. elif not bypass_filter:
  713. if user.role != "admin":
  714. raise HTTPException(
  715. status_code=403,
  716. detail="Model not found",
  717. )
  718. await get_all_models(request, user=user)
  719. model = request.app.state.OPENAI_MODELS.get(model_id)
  720. if model:
  721. idx = model["urlIdx"]
  722. else:
  723. raise HTTPException(
  724. status_code=404,
  725. detail="Model not found",
  726. )
  727. # Get the API config for the model
  728. api_config = request.app.state.config.OPENAI_API_CONFIGS.get(
  729. str(idx),
  730. request.app.state.config.OPENAI_API_CONFIGS.get(
  731. request.app.state.config.OPENAI_API_BASE_URLS[idx], {}
  732. ), # Legacy support
  733. )
  734. prefix_id = api_config.get("prefix_id", None)
  735. if prefix_id:
  736. payload["model"] = payload["model"].replace(f"{prefix_id}.", "")
  737. # Add user info to the payload if the model is a pipeline
  738. if "pipeline" in model and model.get("pipeline"):
  739. payload["user"] = {
  740. "name": user.name,
  741. "id": user.id,
  742. "email": user.email,
  743. "role": user.role,
  744. }
  745. url = request.app.state.config.OPENAI_API_BASE_URLS[idx]
  746. key = request.app.state.config.OPENAI_API_KEYS[idx]
  747. # Check if model is a reasoning model that needs special handling
  748. if is_openai_reasoning_model(payload["model"]):
  749. payload = openai_reasoning_model_handler(payload)
  750. elif "api.openai.com" not in url:
  751. # Remove "max_completion_tokens" from the payload for backward compatibility
  752. if "max_completion_tokens" in payload:
  753. payload["max_tokens"] = payload["max_completion_tokens"]
  754. del payload["max_completion_tokens"]
  755. if "max_tokens" in payload and "max_completion_tokens" in payload:
  756. del payload["max_tokens"]
  757. # Convert the modified body back to JSON
  758. if "logit_bias" in payload:
  759. payload["logit_bias"] = json.loads(
  760. convert_logit_bias_input_to_json(payload["logit_bias"])
  761. )
  762. headers, cookies = await get_headers_and_cookies(
  763. request, url, key, api_config, metadata, user=user
  764. )
  765. if api_config.get("azure", False):
  766. api_version = api_config.get("api_version", "2023-03-15-preview")
  767. request_url, payload = convert_to_azure_payload(url, payload, api_version)
  768. # Only set api-key header if not using Azure Entra ID authentication
  769. auth_type = api_config.get("auth_type", "bearer")
  770. if auth_type not in ("azure_ad", "microsoft_entra_id"):
  771. headers["api-key"] = key
  772. headers["api-version"] = api_version
  773. request_url = f"{request_url}/chat/completions?api-version={api_version}"
  774. else:
  775. request_url = f"{url}/chat/completions"
  776. payload = json.dumps(payload)
  777. r = None
  778. session = None
  779. streaming = False
  780. response = None
  781. try:
  782. session = aiohttp.ClientSession(
  783. trust_env=True, timeout=aiohttp.ClientTimeout(total=AIOHTTP_CLIENT_TIMEOUT)
  784. )
  785. r = await session.request(
  786. method="POST",
  787. url=request_url,
  788. data=payload,
  789. headers=headers,
  790. cookies=cookies,
  791. ssl=AIOHTTP_CLIENT_SESSION_SSL,
  792. )
  793. # Check if response is SSE
  794. if "text/event-stream" in r.headers.get("Content-Type", ""):
  795. streaming = True
  796. return StreamingResponse(
  797. r.content,
  798. status_code=r.status,
  799. headers=dict(r.headers),
  800. background=BackgroundTask(
  801. cleanup_response, response=r, session=session
  802. ),
  803. )
  804. else:
  805. try:
  806. response = await r.json()
  807. except Exception as e:
  808. log.error(e)
  809. response = await r.text()
  810. if r.status >= 400:
  811. if isinstance(response, (dict, list)):
  812. return JSONResponse(status_code=r.status, content=response)
  813. else:
  814. return PlainTextResponse(status_code=r.status, content=response)
  815. return response
  816. except Exception as e:
  817. log.exception(e)
  818. raise HTTPException(
  819. status_code=r.status if r else 500,
  820. detail="Open WebUI: Server Connection Error",
  821. )
  822. finally:
  823. if not streaming:
  824. await cleanup_response(r, session)
  825. async def embeddings(request: Request, form_data: dict, user):
  826. """
  827. Calls the embeddings endpoint for OpenAI-compatible providers.
  828. Args:
  829. request (Request): The FastAPI request context.
  830. form_data (dict): OpenAI-compatible embeddings payload.
  831. user (UserModel): The authenticated user.
  832. Returns:
  833. dict: OpenAI-compatible embeddings response.
  834. """
  835. idx = 0
  836. # Prepare payload/body
  837. body = json.dumps(form_data)
  838. # Find correct backend url/key based on model
  839. await get_all_models(request, user=user)
  840. model_id = form_data.get("model")
  841. models = request.app.state.OPENAI_MODELS
  842. if model_id in models:
  843. idx = models[model_id]["urlIdx"]
  844. url = request.app.state.config.OPENAI_API_BASE_URLS[idx]
  845. key = request.app.state.config.OPENAI_API_KEYS[idx]
  846. api_config = request.app.state.config.OPENAI_API_CONFIGS.get(
  847. str(idx),
  848. request.app.state.config.OPENAI_API_CONFIGS.get(url, {}), # Legacy support
  849. )
  850. r = None
  851. session = None
  852. streaming = False
  853. headers, cookies = await get_headers_and_cookies(
  854. request, url, key, api_config, user=user
  855. )
  856. try:
  857. session = aiohttp.ClientSession(trust_env=True)
  858. r = await session.request(
  859. method="POST",
  860. url=f"{url}/embeddings",
  861. data=body,
  862. headers=headers,
  863. cookies=cookies,
  864. )
  865. if "text/event-stream" in r.headers.get("Content-Type", ""):
  866. streaming = True
  867. return StreamingResponse(
  868. r.content,
  869. status_code=r.status,
  870. headers=dict(r.headers),
  871. background=BackgroundTask(
  872. cleanup_response, response=r, session=session
  873. ),
  874. )
  875. else:
  876. try:
  877. response_data = await r.json()
  878. except Exception:
  879. response_data = await r.text()
  880. if r.status >= 400:
  881. if isinstance(response_data, (dict, list)):
  882. return JSONResponse(status_code=r.status, content=response_data)
  883. else:
  884. return PlainTextResponse(
  885. status_code=r.status, content=response_data
  886. )
  887. return response_data
  888. except Exception as e:
  889. log.exception(e)
  890. raise HTTPException(
  891. status_code=r.status if r else 500,
  892. detail="Open WebUI: Server Connection Error",
  893. )
  894. finally:
  895. if not streaming:
  896. await cleanup_response(r, session)
  897. @router.api_route("/{path:path}", methods=["GET", "POST", "PUT", "DELETE"])
  898. async def proxy(path: str, request: Request, user=Depends(get_verified_user)):
  899. """
  900. Deprecated: proxy all requests to OpenAI API
  901. """
  902. body = await request.body()
  903. idx = 0
  904. url = request.app.state.config.OPENAI_API_BASE_URLS[idx]
  905. key = request.app.state.config.OPENAI_API_KEYS[idx]
  906. api_config = request.app.state.config.OPENAI_API_CONFIGS.get(
  907. str(idx),
  908. request.app.state.config.OPENAI_API_CONFIGS.get(
  909. request.app.state.config.OPENAI_API_BASE_URLS[idx], {}
  910. ), # Legacy support
  911. )
  912. r = None
  913. session = None
  914. streaming = False
  915. try:
  916. headers, cookies = await get_headers_and_cookies(
  917. request, url, key, api_config, user=user
  918. )
  919. if api_config.get("azure", False):
  920. api_version = api_config.get("api_version", "2023-03-15-preview")
  921. # Only set api-key header if not using Azure Entra ID authentication
  922. auth_type = api_config.get("auth_type", "bearer")
  923. if auth_type not in ("azure_ad", "microsoft_entra_id"):
  924. headers["api-key"] = key
  925. headers["api-version"] = api_version
  926. payload = json.loads(body)
  927. url, payload = convert_to_azure_payload(url, payload, api_version)
  928. body = json.dumps(payload).encode()
  929. request_url = f"{url}/{path}?api-version={api_version}"
  930. else:
  931. request_url = f"{url}/{path}"
  932. session = aiohttp.ClientSession(trust_env=True)
  933. r = await session.request(
  934. method=request.method,
  935. url=request_url,
  936. data=body,
  937. headers=headers,
  938. cookies=cookies,
  939. ssl=AIOHTTP_CLIENT_SESSION_SSL,
  940. )
  941. # Check if response is SSE
  942. if "text/event-stream" in r.headers.get("Content-Type", ""):
  943. streaming = True
  944. return StreamingResponse(
  945. r.content,
  946. status_code=r.status,
  947. headers=dict(r.headers),
  948. background=BackgroundTask(
  949. cleanup_response, response=r, session=session
  950. ),
  951. )
  952. else:
  953. try:
  954. response_data = await r.json()
  955. except Exception:
  956. response_data = await r.text()
  957. if r.status >= 400:
  958. if isinstance(response_data, (dict, list)):
  959. return JSONResponse(status_code=r.status, content=response_data)
  960. else:
  961. return PlainTextResponse(
  962. status_code=r.status, content=response_data
  963. )
  964. return response_data
  965. except Exception as e:
  966. log.exception(e)
  967. raise HTTPException(
  968. status_code=r.status if r else 500,
  969. detail="Open WebUI: Server Connection Error",
  970. )
  971. finally:
  972. if not streaming:
  973. await cleanup_response(r, session)