瀏覽代碼

Merge pull request #17049 from rgaricano/dev-FIX_lex-sem

FIX: Hybrid Search
Tim Jaeryang Baek 1 月之前
父節點
當前提交
719d115d49
共有 2 個文件被更改，包括 4 次插入和 9 次刪除
  1. +2 -7
      backend/open_webui/retrieval/utils.py
  2. +2 -2
      src/lib/components/admin/Settings/Documents.svelte

+ 2 - 7
backend/open_webui/retrieval/utils.py

@@ -128,8 +128,6 @@ def query_doc_with_hybrid_search(
             log.warning(f"query_doc_with_hybrid_search:no_docs {collection_name}")
             return {"documents": [], "metadatas": [], "distances": []}
 
-        # BM_25 required only if weight is greater than 0
-        if hybrid_bm25_weight > 0:
             log.debug(f"query_doc_with_hybrid_search:doc {collection_name}")
             bm25_retriever = BM25Retriever.from_texts(
                 texts=collection_result.documents[0],
@@ -343,8 +341,7 @@ def query_collection_with_hybrid_search(
     # Fetch collection data once per collection sequentially
     # Avoid fetching the same data multiple times later
     collection_results = {}
-    # Only retrieve entire collection if bm_25 calculation is required
-    if hybrid_bm25_weight > 0:
+
         for collection_name in collection_names:
             try:
                 log.debug(
@@ -356,9 +353,7 @@ def query_collection_with_hybrid_search(
             except Exception as e:
                 log.exception(f"Failed to fetch collection {collection_name}: {e}")
                 collection_results[collection_name] = None
-    else:
-        for collection_name in collection_names:
-            collection_results[collection_name] = []
+                
     log.info(
         f"Starting hybrid search for {len(queries)} queries in {len(collection_names)} collections..."
     )

+ 2 - 2
src/lib/components/admin/Settings/Documents.svelte

@@ -1104,10 +1104,10 @@
 												<div class="py-0.5">
 													<div class="flex w-full justify-between">
 														<div class=" text-left text-xs font-small">
-															{$i18n.t('lexical')}
+															{$i18n.t('semantic')}
 														</div>
 														<div class=" text-right text-xs font-small">
-															{$i18n.t('semantic')}
+															{$i18n.t('lexical')}
 														</div>
 													</div>
 												</div>