knowledge.py 6.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228
  1. import json
  2. import logging
  3. import time
  4. from typing import Optional
  5. import uuid
  6. from open_webui.internal.db import Base, get_db
  7. from open_webui.env import SRC_LOG_LEVELS
  8. from open_webui.models.files import FileMetadataResponse
  9. from open_webui.models.groups import Groups
  10. from open_webui.models.users import Users, UserResponse
  11. from pydantic import BaseModel, ConfigDict
  12. from sqlalchemy import BigInteger, Column, String, Text, JSON
  13. from open_webui.utils.access_control import has_access
  # Module-level logger; its level comes from the "MODELS" entry of SRC_LOG_LEVELS.
  log = logging.getLogger(__name__)
  log.setLevel(level=SRC_LOG_LEVELS["MODELS"])
  16. ####################
  17. # Knowledge DB Schema
  18. ####################
  class Knowledge(Base):
      """ORM mapping for rows of the ``knowledge`` table."""

      __tablename__ = "knowledge"

      # Primary key and the ID of the owning user.
      id = Column(Text, primary_key=True, unique=True)
      user_id = Column(Text)

      name = Column(Text)
      description = Column(Text)

      # JSON payloads; both columns accept NULL.
      data = Column(JSON, nullable=True)
      meta = Column(JSON, nullable=True)

      # Access control rules for this entry (controls data access levels):
      #   - `None`: public access, available to all users with the "user" role.
      #   - `{}`:   private access, restricted exclusively to the owner.
      #   - Custom permissions: separate rules for reading and writing, each of
      #     which can list groups and/or individual users:
      #       {
      #           "read": {
      #               "group_ids": ["group_id1", "group_id2"],
      #               "user_ids": ["user_id1", "user_id2"]
      #           },
      #           "write": {
      #               "group_ids": ["group_id1", "group_id2"],
      #               "user_ids": ["user_id1", "user_id2"]
      #           }
      #       }
      access_control = Column(JSON, nullable=True)

      # Integer timestamps.
      created_at = Column(BigInteger)
      updated_at = Column(BigInteger)
  class KnowledgeModel(BaseModel):
      # Pydantic counterpart of a `Knowledge` row. `from_attributes=True`
      # allows validation straight from an object's attributes (e.g. an ORM row).
      model_config = ConfigDict(from_attributes=True)

      id: str
      user_id: str
      name: str
      description: str

      # Optional payloads; each defaults to None when absent.
      data: dict | None = None
      meta: dict | None = None
      access_control: dict | None = None

      # Timestamps in epoch.
      created_at: int
      updated_at: int
  56. ####################
  57. # Forms
  58. ####################
  class KnowledgeUserModel(KnowledgeModel):
      # A knowledge entry extended with an optional `user` record
      # (None when no user is attached).
      user: UserResponse | None = None
  class KnowledgeResponse(KnowledgeModel):
      # A knowledge entry plus an optional list of files; each item is either
      # a FileMetadataResponse or a plain dict.
      files: list[FileMetadataResponse | dict] | None = None
  class KnowledgeUserResponse(KnowledgeUserModel):
      # A knowledge entry with its optional `user` record plus an optional list
      # of files; each item is either a FileMetadataResponse or a plain dict.
      files: list[FileMetadataResponse | dict] | None = None
  class KnowledgeForm(BaseModel):
      # Required fields.
      name: str
      description: str

      # Optional fields; each defaults to None when omitted.
      data: dict | None = None
      access_control: dict | None = None
  class KnowledgeTable:
      """Data-access helpers for the ``knowledge`` table.

      Database work is done inside sessions obtained from ``get_db()``.
      Methods that guard their database calls with ``try``/``except`` log the
      exception and signal failure through their return value (``None`` or
      ``False``) instead of raising.
      """

      def insert_new_knowledge(
          self, user_id: str, form_data: KnowledgeForm
      ) -> Optional[KnowledgeModel]:
          """Create a new knowledge entry owned by ``user_id``.

          Args:
              user_id: Stored as the entry's ``user_id``.
              form_data: Supplies name, description, data and access control.

          Returns:
              The stored entry, or ``None`` if writing it to the database failed.
          """
          # Read the clock once so created_at and updated_at are always equal
          # for a freshly inserted entry.
          now = int(time.time())
          with get_db() as db:
              knowledge = KnowledgeModel(
                  **{
                      **form_data.model_dump(),
                      "id": str(uuid.uuid4()),
                      "user_id": user_id,
                      "created_at": now,
                      "updated_at": now,
                  }
              )
              try:
                  result = Knowledge(**knowledge.model_dump())
                  db.add(result)
                  db.commit()
                  db.refresh(result)
                  return KnowledgeModel.model_validate(result)
              except Exception as e:
                  log.exception(e)
                  return None

      def get_knowledge_bases(self) -> list[KnowledgeUserModel]:
          """Return all knowledge entries, most recently updated first.

          Each entry carries a ``user`` built from the user whose id matches the
          entry's ``user_id``; it is ``None`` when that user is not among the
          results of ``Users.get_users_by_user_ids``.
          """
          with get_db() as db:
              all_knowledge = (
                  db.query(Knowledge).order_by(Knowledge.updated_at.desc()).all()
              )

              # Look up all distinct owners with a single call rather than one
              # call per entry.
              user_ids = list({knowledge.user_id for knowledge in all_knowledge})
              users = Users.get_users_by_user_ids(user_ids) if user_ids else []
              users_dict = {user.id: user for user in users}

              knowledge_bases = []
              for knowledge in all_knowledge:
                  user = users_dict.get(knowledge.user_id)
                  knowledge_bases.append(
                      KnowledgeUserModel.model_validate(
                          {
                              **KnowledgeModel.model_validate(knowledge).model_dump(),
                              "user": user.model_dump() if user else None,
                          }
                      )
                  )
              return knowledge_bases

      def get_knowledge_bases_by_user_id(
          self, user_id: str, permission: str = "write"
      ) -> list[KnowledgeUserModel]:
          """Return the knowledge entries that ``user_id`` owns or may access.

          Args:
              user_id: The user whose visible entries are requested.
              permission: Permission name passed to ``has_access``
                  (defaults to ``"write"``).

          Returns:
              Entries whose ``user_id`` equals ``user_id``, plus entries for
              which ``has_access`` grants ``permission`` given the entry's
              ``access_control`` and the user's group ids.
          """
          knowledge_bases = self.get_knowledge_bases()
          user_group_ids = {
              group.id for group in Groups.get_groups_by_member_id(user_id)
          }
          return [
              knowledge_base
              for knowledge_base in knowledge_bases
              if knowledge_base.user_id == user_id
              or has_access(
                  user_id, permission, knowledge_base.access_control, user_group_ids
              )
          ]

      def get_knowledge_by_id(self, id: str) -> Optional[KnowledgeModel]:
          """Return the entry with the given ``id``.

          Returns:
              The entry, or ``None`` when no row matches or the lookup raised.
          """
          try:
              with get_db() as db:
                  knowledge = db.query(Knowledge).filter_by(id=id).first()
                  return KnowledgeModel.model_validate(knowledge) if knowledge else None
          except Exception as e:
              log.exception(e)
              return None

      def update_knowledge_by_id(
          self, id: str, form_data: KnowledgeForm, overwrite: bool = False
      ) -> Optional[KnowledgeModel]:
          """Overwrite an entry's form fields and bump ``updated_at``.

          Every field of ``form_data`` is written, including fields that are
          ``None``.

          Args:
              id: ID of the entry to update.
              form_data: New values for name, description, data and access control.
              overwrite: Currently unused; kept for interface compatibility.

          Returns:
              The entry as re-read after the update (``None`` if no such entry
              exists), or ``None`` if the update raised.
          """
          try:
              with get_db() as db:
                  db.query(Knowledge).filter_by(id=id).update(
                      {
                          **form_data.model_dump(),
                          "updated_at": int(time.time()),
                      }
                  )
                  db.commit()
                  return self.get_knowledge_by_id(id=id)
          except Exception as e:
              log.exception(e)
              return None

      def update_knowledge_data_by_id(
          self, id: str, data: dict
      ) -> Optional[KnowledgeModel]:
          """Replace an entry's ``data`` and bump ``updated_at``.

          Args:
              id: ID of the entry to update.
              data: New value for the ``data`` column.

          Returns:
              The entry as re-read after the update (``None`` if no such entry
              exists), or ``None`` if the update raised.
          """
          try:
              with get_db() as db:
                  db.query(Knowledge).filter_by(id=id).update(
                      {
                          "data": data,
                          "updated_at": int(time.time()),
                      }
                  )
                  db.commit()
                  return self.get_knowledge_by_id(id=id)
          except Exception as e:
              log.exception(e)
              return None

      def delete_knowledge_by_id(self, id: str) -> bool:
          """Delete the entry with the given ``id``.

          Returns:
              ``True`` when the delete and commit completed (even if no row
              matched), ``False`` if they raised.
          """
          try:
              with get_db() as db:
                  db.query(Knowledge).filter_by(id=id).delete()
                  db.commit()
                  return True
          except Exception as e:
              log.exception(e)
              return False

      def delete_all_knowledge(self) -> bool:
          """Delete every row of the ``knowledge`` table.

          Returns:
              ``True`` when the delete and commit completed, ``False`` if they
              raised.
          """
          with get_db() as db:
              try:
                  db.query(Knowledge).delete()
                  db.commit()
                  return True
              except Exception as e:
                  log.exception(e)
                  return False


  # Module-level instance of the table helpers.
  Knowledges = KnowledgeTable()