openai.py 37 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100
  1. import asyncio
  2. import hashlib
  3. import json
  4. import logging
  5. from typing import Optional
  6. import aiohttp
  7. from aiocache import cached
  8. import requests
  9. from urllib.parse import quote
  10. from fastapi import Depends, HTTPException, Request, APIRouter
  11. from fastapi.responses import (
  12. FileResponse,
  13. StreamingResponse,
  14. JSONResponse,
  15. PlainTextResponse,
  16. )
  17. from pydantic import BaseModel
  18. from starlette.background import BackgroundTask
  19. from open_webui.models.models import Models
  20. from open_webui.config import (
  21. CACHE_DIR,
  22. )
  23. from open_webui.env import (
  24. MODELS_CACHE_TTL,
  25. AIOHTTP_CLIENT_SESSION_SSL,
  26. AIOHTTP_CLIENT_TIMEOUT,
  27. AIOHTTP_CLIENT_TIMEOUT_MODEL_LIST,
  28. ENABLE_FORWARD_USER_INFO_HEADERS,
  29. BYPASS_MODEL_ACCESS_CONTROL,
  30. )
  31. from open_webui.models.users import UserModel
  32. from open_webui.constants import ERROR_MESSAGES
  33. from open_webui.env import SRC_LOG_LEVELS
  34. from open_webui.utils.payload import (
  35. apply_model_params_to_body_openai,
  36. apply_model_system_prompt_to_body,
  37. )
  38. from open_webui.utils.misc import (
  39. convert_logit_bias_input_to_json,
  40. )
  41. from open_webui.utils.auth import get_admin_user, get_verified_user
  42. from open_webui.utils.access_control import has_access
# Module-level logger; its level comes from the "OPENAI" entry of SRC_LOG_LEVELS.
log = logging.getLogger(__name__)
log.setLevel(SRC_LOG_LEVELS["OPENAI"])
  45. ##########################################
  46. #
  47. # Utility functions
  48. #
  49. ##########################################
  50. async def send_get_request(url, key=None, user: UserModel = None):
  51. timeout = aiohttp.ClientTimeout(total=AIOHTTP_CLIENT_TIMEOUT_MODEL_LIST)
  52. try:
  53. async with aiohttp.ClientSession(timeout=timeout, trust_env=True) as session:
  54. async with session.get(
  55. url,
  56. headers={
  57. **({"Authorization": f"Bearer {key}"} if key else {}),
  58. **(
  59. {
  60. "X-OpenWebUI-User-Name": quote(user.name, safe=" "),
  61. "X-OpenWebUI-User-Id": user.id,
  62. "X-OpenWebUI-User-Email": user.email,
  63. "X-OpenWebUI-User-Role": user.role,
  64. }
  65. if ENABLE_FORWARD_USER_INFO_HEADERS and user
  66. else {}
  67. ),
  68. },
  69. ssl=AIOHTTP_CLIENT_SESSION_SSL,
  70. ) as response:
  71. return await response.json()
  72. except Exception as e:
  73. # Handle connection error here
  74. log.error(f"Connection error: {e}")
  75. return None
  76. async def cleanup_response(
  77. response: Optional[aiohttp.ClientResponse],
  78. session: Optional[aiohttp.ClientSession],
  79. ):
  80. if response:
  81. response.close()
  82. if session:
  83. await session.close()
  84. def openai_o_series_handler(payload):
  85. """
  86. Handle "o" series specific parameters
  87. """
  88. if "max_tokens" in payload:
  89. # Convert "max_tokens" to "max_completion_tokens" for all o-series models
  90. payload["max_completion_tokens"] = payload["max_tokens"]
  91. del payload["max_tokens"]
  92. # Handle system role conversion based on model type
  93. if payload["messages"][0]["role"] == "system":
  94. model_lower = payload["model"].lower()
  95. # Legacy models use "user" role instead of "system"
  96. if model_lower.startswith("o1-mini") or model_lower.startswith("o1-preview"):
  97. payload["messages"][0]["role"] = "user"
  98. else:
  99. payload["messages"][0]["role"] = "developer"
  100. return payload
  101. ##########################################
  102. #
  103. # API routes
  104. #
  105. ##########################################
# Router on which the endpoint decorators in this module register their routes.
router = APIRouter()
  107. @router.get("/config")
  108. async def get_config(request: Request, user=Depends(get_admin_user)):
  109. return {
  110. "ENABLE_OPENAI_API": request.app.state.config.ENABLE_OPENAI_API,
  111. "OPENAI_API_BASE_URLS": request.app.state.config.OPENAI_API_BASE_URLS,
  112. "OPENAI_API_KEYS": request.app.state.config.OPENAI_API_KEYS,
  113. "OPENAI_API_CONFIGS": request.app.state.config.OPENAI_API_CONFIGS,
  114. }
class OpenAIConfigForm(BaseModel):
    # Request body accepted by the "/config/update" endpoint.

    # Optional toggle; None when the client does not send it.
    ENABLE_OPENAI_API: Optional[bool] = None
    # Base URLs of the configured connections.
    OPENAI_API_BASE_URLS: list[str]
    # API keys; update_config trims or pads this list to the URL list's length.
    OPENAI_API_KEYS: list[str]
    # Per-connection settings; update_config keeps only entries whose key is
    # the string form of a valid index into OPENAI_API_BASE_URLS.
    OPENAI_API_CONFIGS: dict
  120. @router.post("/config/update")
  121. async def update_config(
  122. request: Request, form_data: OpenAIConfigForm, user=Depends(get_admin_user)
  123. ):
  124. request.app.state.config.ENABLE_OPENAI_API = form_data.ENABLE_OPENAI_API
  125. request.app.state.config.OPENAI_API_BASE_URLS = form_data.OPENAI_API_BASE_URLS
  126. request.app.state.config.OPENAI_API_KEYS = form_data.OPENAI_API_KEYS
  127. # Check if API KEYS length is same than API URLS length
  128. if len(request.app.state.config.OPENAI_API_KEYS) != len(
  129. request.app.state.config.OPENAI_API_BASE_URLS
  130. ):
  131. if len(request.app.state.config.OPENAI_API_KEYS) > len(
  132. request.app.state.config.OPENAI_API_BASE_URLS
  133. ):
  134. request.app.state.config.OPENAI_API_KEYS = (
  135. request.app.state.config.OPENAI_API_KEYS[
  136. : len(request.app.state.config.OPENAI_API_BASE_URLS)
  137. ]
  138. )
  139. else:
  140. request.app.state.config.OPENAI_API_KEYS += [""] * (
  141. len(request.app.state.config.OPENAI_API_BASE_URLS)
  142. - len(request.app.state.config.OPENAI_API_KEYS)
  143. )
  144. request.app.state.config.OPENAI_API_CONFIGS = form_data.OPENAI_API_CONFIGS
  145. # Remove the API configs that are not in the API URLS
  146. keys = list(map(str, range(len(request.app.state.config.OPENAI_API_BASE_URLS))))
  147. request.app.state.config.OPENAI_API_CONFIGS = {
  148. key: value
  149. for key, value in request.app.state.config.OPENAI_API_CONFIGS.items()
  150. if key in keys
  151. }
  152. return {
  153. "ENABLE_OPENAI_API": request.app.state.config.ENABLE_OPENAI_API,
  154. "OPENAI_API_BASE_URLS": request.app.state.config.OPENAI_API_BASE_URLS,
  155. "OPENAI_API_KEYS": request.app.state.config.OPENAI_API_KEYS,
  156. "OPENAI_API_CONFIGS": request.app.state.config.OPENAI_API_CONFIGS,
  157. }
  158. @router.post("/audio/speech")
  159. async def speech(request: Request, user=Depends(get_verified_user)):
  160. idx = None
  161. try:
  162. idx = request.app.state.config.OPENAI_API_BASE_URLS.index(
  163. "https://api.openai.com/v1"
  164. )
  165. body = await request.body()
  166. name = hashlib.sha256(body).hexdigest()
  167. SPEECH_CACHE_DIR = CACHE_DIR / "audio" / "speech"
  168. SPEECH_CACHE_DIR.mkdir(parents=True, exist_ok=True)
  169. file_path = SPEECH_CACHE_DIR.joinpath(f"{name}.mp3")
  170. file_body_path = SPEECH_CACHE_DIR.joinpath(f"{name}.json")
  171. # Check if the file already exists in the cache
  172. if file_path.is_file():
  173. return FileResponse(file_path)
  174. url = request.app.state.config.OPENAI_API_BASE_URLS[idx]
  175. r = None
  176. try:
  177. r = requests.post(
  178. url=f"{url}/audio/speech",
  179. data=body,
  180. headers={
  181. "Content-Type": "application/json",
  182. "Authorization": f"Bearer {request.app.state.config.OPENAI_API_KEYS[idx]}",
  183. **(
  184. {
  185. "HTTP-Referer": "https://openwebui.com/",
  186. "X-Title": "Open WebUI",
  187. }
  188. if "openrouter.ai" in url
  189. else {}
  190. ),
  191. **(
  192. {
  193. "X-OpenWebUI-User-Name": quote(user.name, safe=" "),
  194. "X-OpenWebUI-User-Id": user.id,
  195. "X-OpenWebUI-User-Email": user.email,
  196. "X-OpenWebUI-User-Role": user.role,
  197. }
  198. if ENABLE_FORWARD_USER_INFO_HEADERS
  199. else {}
  200. ),
  201. },
  202. stream=True,
  203. )
  204. r.raise_for_status()
  205. # Save the streaming content to a file
  206. with open(file_path, "wb") as f:
  207. for chunk in r.iter_content(chunk_size=8192):
  208. f.write(chunk)
  209. with open(file_body_path, "w") as f:
  210. json.dump(json.loads(body.decode("utf-8")), f)
  211. # Return the saved file
  212. return FileResponse(file_path)
  213. except Exception as e:
  214. log.exception(e)
  215. detail = None
  216. if r is not None:
  217. try:
  218. res = r.json()
  219. if "error" in res:
  220. detail = f"External: {res['error']}"
  221. except Exception:
  222. detail = f"External: {e}"
  223. raise HTTPException(
  224. status_code=r.status_code if r else 500,
  225. detail=detail if detail else "Open WebUI: Server Connection Error",
  226. )
  227. except ValueError:
  228. raise HTTPException(status_code=401, detail=ERROR_MESSAGES.OPENAI_NOT_FOUND)
  229. async def get_all_models_responses(request: Request, user: UserModel) -> list:
  230. if not request.app.state.config.ENABLE_OPENAI_API:
  231. return []
  232. # Check if API KEYS length is same than API URLS length
  233. num_urls = len(request.app.state.config.OPENAI_API_BASE_URLS)
  234. num_keys = len(request.app.state.config.OPENAI_API_KEYS)
  235. if num_keys != num_urls:
  236. # if there are more keys than urls, remove the extra keys
  237. if num_keys > num_urls:
  238. new_keys = request.app.state.config.OPENAI_API_KEYS[:num_urls]
  239. request.app.state.config.OPENAI_API_KEYS = new_keys
  240. # if there are more urls than keys, add empty keys
  241. else:
  242. request.app.state.config.OPENAI_API_KEYS += [""] * (num_urls - num_keys)
  243. request_tasks = []
  244. for idx, url in enumerate(request.app.state.config.OPENAI_API_BASE_URLS):
  245. if (str(idx) not in request.app.state.config.OPENAI_API_CONFIGS) and (
  246. url not in request.app.state.config.OPENAI_API_CONFIGS # Legacy support
  247. ):
  248. request_tasks.append(
  249. send_get_request(
  250. f"{url}/models",
  251. request.app.state.config.OPENAI_API_KEYS[idx],
  252. user=user,
  253. )
  254. )
  255. else:
  256. api_config = request.app.state.config.OPENAI_API_CONFIGS.get(
  257. str(idx),
  258. request.app.state.config.OPENAI_API_CONFIGS.get(
  259. url, {}
  260. ), # Legacy support
  261. )
  262. enable = api_config.get("enable", True)
  263. model_ids = api_config.get("model_ids", [])
  264. if enable:
  265. if len(model_ids) == 0:
  266. request_tasks.append(
  267. send_get_request(
  268. f"{url}/models",
  269. request.app.state.config.OPENAI_API_KEYS[idx],
  270. user=user,
  271. )
  272. )
  273. else:
  274. model_list = {
  275. "object": "list",
  276. "data": [
  277. {
  278. "id": model_id,
  279. "name": model_id,
  280. "owned_by": "openai",
  281. "openai": {"id": model_id},
  282. "urlIdx": idx,
  283. }
  284. for model_id in model_ids
  285. ],
  286. }
  287. request_tasks.append(
  288. asyncio.ensure_future(asyncio.sleep(0, model_list))
  289. )
  290. else:
  291. request_tasks.append(asyncio.ensure_future(asyncio.sleep(0, None)))
  292. responses = await asyncio.gather(*request_tasks)
  293. for idx, response in enumerate(responses):
  294. if response:
  295. url = request.app.state.config.OPENAI_API_BASE_URLS[idx]
  296. api_config = request.app.state.config.OPENAI_API_CONFIGS.get(
  297. str(idx),
  298. request.app.state.config.OPENAI_API_CONFIGS.get(
  299. url, {}
  300. ), # Legacy support
  301. )
  302. connection_type = api_config.get("connection_type", "external")
  303. prefix_id = api_config.get("prefix_id", None)
  304. tags = api_config.get("tags", [])
  305. for model in (
  306. response if isinstance(response, list) else response.get("data", [])
  307. ):
  308. if prefix_id:
  309. model["id"] = (
  310. f"{prefix_id}.{model.get('id', model.get('name', ''))}"
  311. )
  312. if tags:
  313. model["tags"] = tags
  314. if connection_type:
  315. model["connection_type"] = connection_type
  316. log.debug(f"get_all_models:responses() {responses}")
  317. return responses
  318. async def get_filtered_models(models, user):
  319. # Filter models based on user access control
  320. filtered_models = []
  321. for model in models.get("data", []):
  322. model_info = Models.get_model_by_id(model["id"])
  323. if model_info:
  324. if user.id == model_info.user_id or has_access(
  325. user.id, type="read", access_control=model_info.access_control
  326. ):
  327. filtered_models.append(model)
  328. return filtered_models
  329. @cached(ttl=MODELS_CACHE_TTL)
  330. async def get_all_models(request: Request, user: UserModel) -> dict[str, list]:
  331. log.info("get_all_models()")
  332. if not request.app.state.config.ENABLE_OPENAI_API:
  333. return {"data": []}
  334. responses = await get_all_models_responses(request, user=user)
  335. def extract_data(response):
  336. if response and "data" in response:
  337. return response["data"]
  338. if isinstance(response, list):
  339. return response
  340. return None
  341. def merge_models_lists(model_lists):
  342. log.debug(f"merge_models_lists {model_lists}")
  343. merged_list = []
  344. for idx, models in enumerate(model_lists):
  345. if models is not None and "error" not in models:
  346. merged_list.extend(
  347. [
  348. {
  349. **model,
  350. "name": model.get("name", model["id"]),
  351. "owned_by": "openai",
  352. "openai": model,
  353. "connection_type": model.get("connection_type", "external"),
  354. "urlIdx": idx,
  355. }
  356. for model in models
  357. if (model.get("id") or model.get("name"))
  358. and (
  359. "api.openai.com"
  360. not in request.app.state.config.OPENAI_API_BASE_URLS[idx]
  361. or not any(
  362. name in model["id"]
  363. for name in [
  364. "babbage",
  365. "dall-e",
  366. "davinci",
  367. "embedding",
  368. "tts",
  369. "whisper",
  370. ]
  371. )
  372. )
  373. ]
  374. )
  375. return merged_list
  376. models = {"data": merge_models_lists(map(extract_data, responses))}
  377. log.debug(f"models: {models}")
  378. request.app.state.OPENAI_MODELS = {model["id"]: model for model in models["data"]}
  379. return models
  380. @router.get("/models")
  381. @router.get("/models/{url_idx}")
  382. async def get_models(
  383. request: Request, url_idx: Optional[int] = None, user=Depends(get_verified_user)
  384. ):
  385. models = {
  386. "data": [],
  387. }
  388. if url_idx is None:
  389. models = await get_all_models(request, user=user)
  390. else:
  391. url = request.app.state.config.OPENAI_API_BASE_URLS[url_idx]
  392. key = request.app.state.config.OPENAI_API_KEYS[url_idx]
  393. api_config = request.app.state.config.OPENAI_API_CONFIGS.get(
  394. str(url_idx),
  395. request.app.state.config.OPENAI_API_CONFIGS.get(url, {}), # Legacy support
  396. )
  397. r = None
  398. async with aiohttp.ClientSession(
  399. trust_env=True,
  400. timeout=aiohttp.ClientTimeout(total=AIOHTTP_CLIENT_TIMEOUT_MODEL_LIST),
  401. ) as session:
  402. try:
  403. headers = {
  404. "Content-Type": "application/json",
  405. **(
  406. {
  407. "X-OpenWebUI-User-Name": quote(user.name, safe=" "),
  408. "X-OpenWebUI-User-Id": user.id,
  409. "X-OpenWebUI-User-Email": user.email,
  410. "X-OpenWebUI-User-Role": user.role,
  411. }
  412. if ENABLE_FORWARD_USER_INFO_HEADERS
  413. else {}
  414. ),
  415. }
  416. if api_config.get("azure", False):
  417. models = {
  418. "data": api_config.get("model_ids", []) or [],
  419. "object": "list",
  420. }
  421. else:
  422. headers["Authorization"] = f"Bearer {key}"
  423. async with session.get(
  424. f"{url}/models",
  425. headers=headers,
  426. ssl=AIOHTTP_CLIENT_SESSION_SSL,
  427. ) as r:
  428. if r.status != 200:
  429. # Extract response error details if available
  430. error_detail = f"HTTP Error: {r.status}"
  431. res = await r.json()
  432. if "error" in res:
  433. error_detail = f"External Error: {res['error']}"
  434. raise Exception(error_detail)
  435. response_data = await r.json()
  436. # Check if we're calling OpenAI API based on the URL
  437. if "api.openai.com" in url:
  438. # Filter models according to the specified conditions
  439. response_data["data"] = [
  440. model
  441. for model in response_data.get("data", [])
  442. if not any(
  443. name in model["id"]
  444. for name in [
  445. "babbage",
  446. "dall-e",
  447. "davinci",
  448. "embedding",
  449. "tts",
  450. "whisper",
  451. ]
  452. )
  453. ]
  454. models = response_data
  455. except aiohttp.ClientError as e:
  456. # ClientError covers all aiohttp requests issues
  457. log.exception(f"Client error: {str(e)}")
  458. raise HTTPException(
  459. status_code=500, detail="Open WebUI: Server Connection Error"
  460. )
  461. except Exception as e:
  462. log.exception(f"Unexpected error: {e}")
  463. error_detail = f"Unexpected error: {str(e)}"
  464. raise HTTPException(status_code=500, detail=error_detail)
  465. if user.role == "user" and not BYPASS_MODEL_ACCESS_CONTROL:
  466. models["data"] = await get_filtered_models(models, user)
  467. return models
class ConnectionVerificationForm(BaseModel):
    # Request body accepted by the "/verify" endpoint.

    # Base URL the verification request is sent to.
    url: str
    # Credential; verify_connection sends it as "api-key" for Azure
    # connections and as a Bearer token otherwise.
    key: str
    # Optional connection settings; verify_connection reads "azure" and
    # "api_version" from it.
    config: Optional[dict] = None
  472. @router.post("/verify")
  473. async def verify_connection(
  474. form_data: ConnectionVerificationForm, user=Depends(get_admin_user)
  475. ):
  476. url = form_data.url
  477. key = form_data.key
  478. api_config = form_data.config or {}
  479. async with aiohttp.ClientSession(
  480. trust_env=True,
  481. timeout=aiohttp.ClientTimeout(total=AIOHTTP_CLIENT_TIMEOUT_MODEL_LIST),
  482. ) as session:
  483. try:
  484. headers = {
  485. "Content-Type": "application/json",
  486. **(
  487. {
  488. "X-OpenWebUI-User-Name": quote(user.name, safe=" "),
  489. "X-OpenWebUI-User-Id": user.id,
  490. "X-OpenWebUI-User-Email": user.email,
  491. "X-OpenWebUI-User-Role": user.role,
  492. }
  493. if ENABLE_FORWARD_USER_INFO_HEADERS
  494. else {}
  495. ),
  496. }
  497. if api_config.get("azure", False):
  498. headers["api-key"] = key
  499. api_version = api_config.get("api_version", "") or "2023-03-15-preview"
  500. async with session.get(
  501. url=f"{url}/openai/models?api-version={api_version}",
  502. headers=headers,
  503. ssl=AIOHTTP_CLIENT_SESSION_SSL,
  504. ) as r:
  505. try:
  506. response_data = await r.json()
  507. except Exception:
  508. response_data = await r.text()
  509. if r.status != 200:
  510. if isinstance(response_data, (dict, list)):
  511. return JSONResponse(
  512. status_code=r.status, content=response_data
  513. )
  514. else:
  515. return PlainTextResponse(
  516. status_code=r.status, content=response_data
  517. )
  518. return response_data
  519. else:
  520. headers["Authorization"] = f"Bearer {key}"
  521. async with session.get(
  522. f"{url}/models",
  523. headers=headers,
  524. ssl=AIOHTTP_CLIENT_SESSION_SSL,
  525. ) as r:
  526. try:
  527. response_data = await r.json()
  528. except Exception:
  529. response_data = await r.text()
  530. if r.status != 200:
  531. if isinstance(response_data, (dict, list)):
  532. return JSONResponse(
  533. status_code=r.status, content=response_data
  534. )
  535. else:
  536. return PlainTextResponse(
  537. status_code=r.status, content=response_data
  538. )
  539. return response_data
  540. except aiohttp.ClientError as e:
  541. # ClientError covers all aiohttp requests issues
  542. log.exception(f"Client error: {str(e)}")
  543. raise HTTPException(
  544. status_code=500, detail="Open WebUI: Server Connection Error"
  545. )
  546. except Exception as e:
  547. log.exception(f"Unexpected error: {e}")
  548. raise HTTPException(
  549. status_code=500, detail="Open WebUI: Server Connection Error"
  550. )
  551. def get_azure_allowed_params(api_version: str) -> set[str]:
  552. allowed_params = {
  553. "messages",
  554. "temperature",
  555. "role",
  556. "content",
  557. "contentPart",
  558. "contentPartImage",
  559. "enhancements",
  560. "dataSources",
  561. "n",
  562. "stream",
  563. "stop",
  564. "max_tokens",
  565. "presence_penalty",
  566. "frequency_penalty",
  567. "logit_bias",
  568. "user",
  569. "function_call",
  570. "functions",
  571. "tools",
  572. "tool_choice",
  573. "top_p",
  574. "log_probs",
  575. "top_logprobs",
  576. "response_format",
  577. "seed",
  578. "max_completion_tokens",
  579. }
  580. try:
  581. if api_version >= "2024-09-01-preview":
  582. allowed_params.add("stream_options")
  583. except ValueError:
  584. log.debug(
  585. f"Invalid API version {api_version} for Azure OpenAI. Defaulting to allowed parameters."
  586. )
  587. return allowed_params
  588. def convert_to_azure_payload(url, payload: dict, api_version: str):
  589. model = payload.get("model", "")
  590. # Filter allowed parameters based on Azure OpenAI API
  591. allowed_params = get_azure_allowed_params(api_version)
  592. # Special handling for o-series models
  593. if model.startswith("o") and model.endswith("-mini"):
  594. # Convert max_tokens to max_completion_tokens for o-series models
  595. if "max_tokens" in payload:
  596. payload["max_completion_tokens"] = payload["max_tokens"]
  597. del payload["max_tokens"]
  598. # Remove temperature if not 1 for o-series models
  599. if "temperature" in payload and payload["temperature"] != 1:
  600. log.debug(
  601. f"Removing temperature parameter for o-series model {model} as only default value (1) is supported"
  602. )
  603. del payload["temperature"]
  604. # Filter out unsupported parameters
  605. payload = {k: v for k, v in payload.items() if k in allowed_params}
  606. url = f"{url}/openai/deployments/{model}"
  607. return url, payload
  608. @router.post("/chat/completions")
  609. async def generate_chat_completion(
  610. request: Request,
  611. form_data: dict,
  612. user=Depends(get_verified_user),
  613. bypass_filter: Optional[bool] = False,
  614. ):
  615. if BYPASS_MODEL_ACCESS_CONTROL:
  616. bypass_filter = True
  617. idx = 0
  618. payload = {**form_data}
  619. metadata = payload.pop("metadata", None)
  620. model_id = form_data.get("model")
  621. model_info = Models.get_model_by_id(model_id)
  622. # Check model info and override the payload
  623. if model_info:
  624. if model_info.base_model_id:
  625. payload["model"] = model_info.base_model_id
  626. model_id = model_info.base_model_id
  627. params = model_info.params.model_dump()
  628. if params:
  629. system = params.pop("system", None)
  630. payload = apply_model_params_to_body_openai(params, payload)
  631. payload = apply_model_system_prompt_to_body(system, payload, metadata, user)
  632. # Check if user has access to the model
  633. if not bypass_filter and user.role == "user":
  634. if not (
  635. user.id == model_info.user_id
  636. or has_access(
  637. user.id, type="read", access_control=model_info.access_control
  638. )
  639. ):
  640. raise HTTPException(
  641. status_code=403,
  642. detail="Model not found",
  643. )
  644. elif not bypass_filter:
  645. if user.role != "admin":
  646. raise HTTPException(
  647. status_code=403,
  648. detail="Model not found",
  649. )
  650. await get_all_models(request, user=user)
  651. model = request.app.state.OPENAI_MODELS.get(model_id)
  652. if model:
  653. idx = model["urlIdx"]
  654. else:
  655. raise HTTPException(
  656. status_code=404,
  657. detail="Model not found",
  658. )
  659. # Get the API config for the model
  660. api_config = request.app.state.config.OPENAI_API_CONFIGS.get(
  661. str(idx),
  662. request.app.state.config.OPENAI_API_CONFIGS.get(
  663. request.app.state.config.OPENAI_API_BASE_URLS[idx], {}
  664. ), # Legacy support
  665. )
  666. prefix_id = api_config.get("prefix_id", None)
  667. if prefix_id:
  668. payload["model"] = payload["model"].replace(f"{prefix_id}.", "")
  669. # Add user info to the payload if the model is a pipeline
  670. if "pipeline" in model and model.get("pipeline"):
  671. payload["user"] = {
  672. "name": user.name,
  673. "id": user.id,
  674. "email": user.email,
  675. "role": user.role,
  676. }
  677. url = request.app.state.config.OPENAI_API_BASE_URLS[idx]
  678. key = request.app.state.config.OPENAI_API_KEYS[idx]
  679. # Check if model is from "o" series
  680. is_o_series = payload["model"].lower().startswith(("o1", "o3", "o4"))
  681. if is_o_series:
  682. payload = openai_o_series_handler(payload)
  683. elif "api.openai.com" not in url:
  684. # Remove "max_completion_tokens" from the payload for backward compatibility
  685. if "max_completion_tokens" in payload:
  686. payload["max_tokens"] = payload["max_completion_tokens"]
  687. del payload["max_completion_tokens"]
  688. if "max_tokens" in payload and "max_completion_tokens" in payload:
  689. del payload["max_tokens"]
  690. # Convert the modified body back to JSON
  691. if "logit_bias" in payload:
  692. payload["logit_bias"] = json.loads(
  693. convert_logit_bias_input_to_json(payload["logit_bias"])
  694. )
  695. headers = {
  696. "Content-Type": "application/json",
  697. **(
  698. {
  699. "HTTP-Referer": "https://openwebui.com/",
  700. "X-Title": "Open WebUI",
  701. }
  702. if "openrouter.ai" in url
  703. else {}
  704. ),
  705. **(
  706. {
  707. "X-OpenWebUI-User-Name": quote(user.name, safe=" "),
  708. "X-OpenWebUI-User-Id": user.id,
  709. "X-OpenWebUI-User-Email": user.email,
  710. "X-OpenWebUI-User-Role": user.role,
  711. **(
  712. {"X-OpenWebUI-Chat-Id": metadata.get("chat_id")}
  713. if metadata and metadata.get("chat_id")
  714. else {}
  715. ),
  716. }
  717. if ENABLE_FORWARD_USER_INFO_HEADERS
  718. else {}
  719. ),
  720. }
  721. if api_config.get("azure", False):
  722. api_version = api_config.get("api_version", "2023-03-15-preview")
  723. request_url, payload = convert_to_azure_payload(url, payload, api_version)
  724. headers["api-key"] = key
  725. headers["api-version"] = api_version
  726. request_url = f"{request_url}/chat/completions?api-version={api_version}"
  727. else:
  728. request_url = f"{url}/chat/completions"
  729. headers["Authorization"] = f"Bearer {key}"
  730. payload = json.dumps(payload)
  731. r = None
  732. session = None
  733. streaming = False
  734. response = None
  735. try:
  736. session = aiohttp.ClientSession(
  737. trust_env=True, timeout=aiohttp.ClientTimeout(total=AIOHTTP_CLIENT_TIMEOUT)
  738. )
  739. r = await session.request(
  740. method="POST",
  741. url=request_url,
  742. data=payload,
  743. headers=headers,
  744. ssl=AIOHTTP_CLIENT_SESSION_SSL,
  745. )
  746. # Check if response is SSE
  747. if "text/event-stream" in r.headers.get("Content-Type", ""):
  748. streaming = True
  749. return StreamingResponse(
  750. r.content,
  751. status_code=r.status,
  752. headers=dict(r.headers),
  753. background=BackgroundTask(
  754. cleanup_response, response=r, session=session
  755. ),
  756. )
  757. else:
  758. try:
  759. response = await r.json()
  760. except Exception as e:
  761. log.error(e)
  762. response = await r.text()
  763. if r.status >= 400:
  764. if isinstance(response, (dict, list)):
  765. return JSONResponse(status_code=r.status, content=response)
  766. else:
  767. return PlainTextResponse(status_code=r.status, content=response)
  768. return response
  769. except Exception as e:
  770. log.exception(e)
  771. raise HTTPException(
  772. status_code=r.status if r else 500,
  773. detail="Open WebUI: Server Connection Error",
  774. )
  775. finally:
  776. if not streaming:
  777. await cleanup_response(r, session)
  778. async def embeddings(request: Request, form_data: dict, user):
  779. """
  780. Calls the embeddings endpoint for OpenAI-compatible providers.
  781. Args:
  782. request (Request): The FastAPI request context.
  783. form_data (dict): OpenAI-compatible embeddings payload.
  784. user (UserModel): The authenticated user.
  785. Returns:
  786. dict: OpenAI-compatible embeddings response.
  787. """
  788. idx = 0
  789. # Prepare payload/body
  790. body = json.dumps(form_data)
  791. # Find correct backend url/key based on model
  792. await get_all_models(request, user=user)
  793. model_id = form_data.get("model")
  794. models = request.app.state.OPENAI_MODELS
  795. if model_id in models:
  796. idx = models[model_id]["urlIdx"]
  797. url = request.app.state.config.OPENAI_API_BASE_URLS[idx]
  798. key = request.app.state.config.OPENAI_API_KEYS[idx]
  799. r = None
  800. session = None
  801. streaming = False
  802. try:
  803. session = aiohttp.ClientSession(trust_env=True)
  804. r = await session.request(
  805. method="POST",
  806. url=f"{url}/embeddings",
  807. data=body,
  808. headers={
  809. "Authorization": f"Bearer {key}",
  810. "Content-Type": "application/json",
  811. **(
  812. {
  813. "X-OpenWebUI-User-Name": quote(user.name, safe=" "),
  814. "X-OpenWebUI-User-Id": user.id,
  815. "X-OpenWebUI-User-Email": user.email,
  816. "X-OpenWebUI-User-Role": user.role,
  817. }
  818. if ENABLE_FORWARD_USER_INFO_HEADERS and user
  819. else {}
  820. ),
  821. },
  822. )
  823. if "text/event-stream" in r.headers.get("Content-Type", ""):
  824. streaming = True
  825. return StreamingResponse(
  826. r.content,
  827. status_code=r.status,
  828. headers=dict(r.headers),
  829. background=BackgroundTask(
  830. cleanup_response, response=r, session=session
  831. ),
  832. )
  833. else:
  834. try:
  835. response_data = await r.json()
  836. except Exception:
  837. response_data = await r.text()
  838. if r.status >= 400:
  839. if isinstance(response_data, (dict, list)):
  840. return JSONResponse(status_code=r.status, content=response_data)
  841. else:
  842. return PlainTextResponse(
  843. status_code=r.status, content=response_data
  844. )
  845. return response_data
  846. except Exception as e:
  847. log.exception(e)
  848. raise HTTPException(
  849. status_code=r.status if r else 500,
  850. detail="Open WebUI: Server Connection Error",
  851. )
  852. finally:
  853. if not streaming:
  854. await cleanup_response(r, session)
  855. @router.api_route("/{path:path}", methods=["GET", "POST", "PUT", "DELETE"])
  856. async def proxy(path: str, request: Request, user=Depends(get_verified_user)):
  857. """
  858. Deprecated: proxy all requests to OpenAI API
  859. """
  860. body = await request.body()
  861. idx = 0
  862. url = request.app.state.config.OPENAI_API_BASE_URLS[idx]
  863. key = request.app.state.config.OPENAI_API_KEYS[idx]
  864. api_config = request.app.state.config.OPENAI_API_CONFIGS.get(
  865. str(idx),
  866. request.app.state.config.OPENAI_API_CONFIGS.get(
  867. request.app.state.config.OPENAI_API_BASE_URLS[idx], {}
  868. ), # Legacy support
  869. )
  870. r = None
  871. session = None
  872. streaming = False
  873. try:
  874. headers = {
  875. "Content-Type": "application/json",
  876. **(
  877. {
  878. "X-OpenWebUI-User-Name": quote(user.name, safe=" "),
  879. "X-OpenWebUI-User-Id": user.id,
  880. "X-OpenWebUI-User-Email": user.email,
  881. "X-OpenWebUI-User-Role": user.role,
  882. }
  883. if ENABLE_FORWARD_USER_INFO_HEADERS
  884. else {}
  885. ),
  886. }
  887. if api_config.get("azure", False):
  888. api_version = api_config.get("api_version", "2023-03-15-preview")
  889. headers["api-key"] = key
  890. headers["api-version"] = api_version
  891. payload = json.loads(body)
  892. url, payload = convert_to_azure_payload(url, payload, api_version)
  893. body = json.dumps(payload).encode()
  894. request_url = f"{url}/{path}?api-version={api_version}"
  895. else:
  896. headers["Authorization"] = f"Bearer {key}"
  897. request_url = f"{url}/{path}"
  898. session = aiohttp.ClientSession(trust_env=True)
  899. r = await session.request(
  900. method=request.method,
  901. url=request_url,
  902. data=body,
  903. headers=headers,
  904. ssl=AIOHTTP_CLIENT_SESSION_SSL,
  905. )
  906. # Check if response is SSE
  907. if "text/event-stream" in r.headers.get("Content-Type", ""):
  908. streaming = True
  909. return StreamingResponse(
  910. r.content,
  911. status_code=r.status,
  912. headers=dict(r.headers),
  913. background=BackgroundTask(
  914. cleanup_response, response=r, session=session
  915. ),
  916. )
  917. else:
  918. try:
  919. response_data = await r.json()
  920. except Exception:
  921. response_data = await r.text()
  922. if r.status >= 400:
  923. if isinstance(response_data, (dict, list)):
  924. return JSONResponse(status_code=r.status, content=response_data)
  925. else:
  926. return PlainTextResponse(
  927. status_code=r.status, content=response_data
  928. )
  929. return response_data
  930. except Exception as e:
  931. log.exception(e)
  932. raise HTTPException(
  933. status_code=r.status if r else 500,
  934. detail="Open WebUI: Server Connection Error",
  935. )
  936. finally:
  937. if not streaming:
  938. await cleanup_response(r, session)