knowledge.py 6.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226
  1. import json
  2. import logging
  3. import time
  4. from typing import Optional
  5. import uuid
  6. from open_webui.internal.db import Base, get_db
  7. from open_webui.env import SRC_LOG_LEVELS
  8. from open_webui.models.files import FileMetadataResponse
  9. from open_webui.models.users import Users, UserResponse
  10. from pydantic import BaseModel, ConfigDict
  11. from sqlalchemy import BigInteger, Column, String, Text, JSON
  12. from open_webui.utils.access_control import has_access
# Module-level logger; its level comes from the "MODELS" entry of SRC_LOG_LEVELS.
log = logging.getLogger(__name__)
log.setLevel(SRC_LOG_LEVELS["MODELS"])
  15. ####################
  16. # Knowledge DB Schema
  17. ####################
class Knowledge(Base):
    """ORM mapping for one row of the ``knowledge`` table."""

    __tablename__ = "knowledge"

    # Primary key. Rows created by KnowledgeTable.insert_new_knowledge get a
    # UUID4 string here.
    id = Column(Text, unique=True, primary_key=True)

    # Id of the user the entry was created for; also compared against the
    # caller's id when listing entries per user.
    user_id = Column(Text)

    name = Column(Text)
    description = Column(Text)

    # Free-form JSON payloads; their schema is not defined in this module.
    data = Column(JSON, nullable=True)
    meta = Column(JSON, nullable=True)

    access_control = Column(JSON, nullable=True)  # Controls data access levels.
    # Defines access control rules for this entry.
    # - `None`: Public access, available to all users with the "user" role.
    # - `{}`: Private access, restricted exclusively to the owner.
    # - Custom permissions: Specific access control for reading and writing;
    #   Can specify group or user-level restrictions:
    #   {
    #       "read": {
    #           "group_ids": ["group_id1", "group_id2"],
    #           "user_ids": ["user_id1", "user_id2"]
    #       },
    #       "write": {
    #           "group_ids": ["group_id1", "group_id2"],
    #           "user_ids": ["user_id1", "user_id2"]
    #       }
    #   }

    # Epoch timestamps in whole seconds (written as int(time.time())).
    created_at = Column(BigInteger)
    updated_at = Column(BigInteger)
class KnowledgeModel(BaseModel):
    """Pydantic counterpart of a ``Knowledge`` row.

    ``from_attributes=True`` lets ``model_validate`` read the fields straight
    from an ORM instance, which is how the table helpers in this module build
    their return values.
    """

    model_config = ConfigDict(from_attributes=True)

    id: str
    user_id: str

    name: str
    description: str

    # Optional JSON payloads; structure is not constrained here.
    data: Optional[dict] = None
    meta: Optional[dict] = None

    # None / {} / custom rules -- see the comment on Knowledge.access_control.
    access_control: Optional[dict] = None

    created_at: int  # timestamp in epoch
    updated_at: int  # timestamp in epoch
  55. ####################
  56. # Forms
  57. ####################
class KnowledgeUserModel(KnowledgeModel):
    """``KnowledgeModel`` plus the (optional) user record matching ``user_id``."""

    # Filled in by KnowledgeTable.get_knowledge_bases; None when no matching
    # user was returned by the user lookup.
    user: Optional[UserResponse] = None
class KnowledgeResponse(KnowledgeModel):
    """``KnowledgeModel`` extended with an optional list of attached files."""

    # Each item is either a FileMetadataResponse or a plain dict. Nothing in
    # this module populates the field; callers are expected to supply it.
    files: Optional[list[FileMetadataResponse | dict]] = None
class KnowledgeUserResponse(KnowledgeUserModel):
    """``KnowledgeUserModel`` extended with an optional list of attached files."""

    # Each item is either a FileMetadataResponse or a plain dict. Nothing in
    # this module populates the field; callers are expected to supply it.
    files: Optional[list[FileMetadataResponse | dict]] = None
class KnowledgeForm(BaseModel):
    """Input payload for creating or updating a knowledge entry.

    Every field here is written to the row as-is by
    ``KnowledgeTable.insert_new_knowledge`` and
    ``KnowledgeTable.update_knowledge_by_id`` (via ``model_dump()``), so an
    omitted optional field is stored as ``None``.
    """

    name: str
    description: str
    data: Optional[dict] = None
    access_control: Optional[dict] = None
  69. class KnowledgeTable:
  70. def insert_new_knowledge(
  71. self, user_id: str, form_data: KnowledgeForm
  72. ) -> Optional[KnowledgeModel]:
  73. with get_db() as db:
  74. knowledge = KnowledgeModel(
  75. **{
  76. **form_data.model_dump(),
  77. "id": str(uuid.uuid4()),
  78. "user_id": user_id,
  79. "created_at": int(time.time()),
  80. "updated_at": int(time.time()),
  81. }
  82. )
  83. try:
  84. result = Knowledge(**knowledge.model_dump())
  85. db.add(result)
  86. db.commit()
  87. db.refresh(result)
  88. if result:
  89. return KnowledgeModel.model_validate(result)
  90. else:
  91. return None
  92. except Exception:
  93. return None
  94. def get_knowledge_bases(self) -> list[KnowledgeUserModel]:
  95. with get_db() as db:
  96. all_knowledge = db.query(Knowledge).order_by(Knowledge.updated_at.desc()).all()
  97. user_ids = list(set(knowledge.user_id for knowledge in all_knowledge))
  98. users = Users.get_users_by_user_ids(user_ids) if user_ids else []
  99. users_dict = {user.id: user for user in users}
  100. knowledge_bases = []
  101. for knowledge in all_knowledge:
  102. user = users_dict.get(knowledge.user_id)
  103. knowledge_bases.append(
  104. KnowledgeUserModel.model_validate(
  105. {
  106. **KnowledgeModel.model_validate(knowledge).model_dump(),
  107. "user": user.model_dump() if user else None,
  108. }
  109. )
  110. )
  111. return knowledge_bases
  112. def get_knowledge_bases_by_user_id(
  113. self, user_id: str, permission: str = "write"
  114. ) -> list[KnowledgeUserModel]:
  115. knowledge_bases = self.get_knowledge_bases()
  116. return [
  117. knowledge_base
  118. for knowledge_base in knowledge_bases
  119. if knowledge_base.user_id == user_id
  120. or has_access(user_id, permission, knowledge_base.access_control)
  121. ]
  122. def get_knowledge_by_id(self, id: str) -> Optional[KnowledgeModel]:
  123. try:
  124. with get_db() as db:
  125. knowledge = db.query(Knowledge).filter_by(id=id).first()
  126. return KnowledgeModel.model_validate(knowledge) if knowledge else None
  127. except Exception:
  128. return None
  129. def update_knowledge_by_id(
  130. self, id: str, form_data: KnowledgeForm, overwrite: bool = False
  131. ) -> Optional[KnowledgeModel]:
  132. try:
  133. with get_db() as db:
  134. knowledge = self.get_knowledge_by_id(id=id)
  135. db.query(Knowledge).filter_by(id=id).update(
  136. {
  137. **form_data.model_dump(),
  138. "updated_at": int(time.time()),
  139. }
  140. )
  141. db.commit()
  142. return self.get_knowledge_by_id(id=id)
  143. except Exception as e:
  144. log.exception(e)
  145. return None
  146. def update_knowledge_data_by_id(
  147. self, id: str, data: dict
  148. ) -> Optional[KnowledgeModel]:
  149. try:
  150. with get_db() as db:
  151. knowledge = self.get_knowledge_by_id(id=id)
  152. db.query(Knowledge).filter_by(id=id).update(
  153. {
  154. "data": data,
  155. "updated_at": int(time.time()),
  156. }
  157. )
  158. db.commit()
  159. return self.get_knowledge_by_id(id=id)
  160. except Exception as e:
  161. log.exception(e)
  162. return None
  163. def delete_knowledge_by_id(self, id: str) -> bool:
  164. try:
  165. with get_db() as db:
  166. db.query(Knowledge).filter_by(id=id).delete()
  167. db.commit()
  168. return True
  169. except Exception:
  170. return False
  171. def delete_all_knowledge(self) -> bool:
  172. with get_db() as db:
  173. try:
  174. db.query(Knowledge).delete()
  175. db.commit()
  176. return True
  177. except Exception:
  178. return False
# Module-level KnowledgeTable instance, created once at import time.
Knowledges = KnowledgeTable()