Explorar o código

fix: Filter to valid RAG web search URLs

Rory hai 3 meses
pai
achega
121a13d4ed
Modificouse 1 ficheiro con 4 adicións e 0 borrados
  1. 4 0
      backend/open_webui/retrieval/web/main.py

+ 4 - 0
backend/open_webui/retrieval/web/main.py

@@ -1,3 +1,5 @@
+import validators
+
 from typing import Optional
 from urllib.parse import urlparse
 
@@ -10,6 +12,8 @@ def get_filtered_results(results, filter_list):
     filtered_results = []
     for result in results:
         url = result.get("url") or result.get("link", "")
+        if not validators.url(url):
+            continue
         domain = urlparse(url).netloc
         if any(domain.endswith(filtered_domain) for filtered_domain in filter_list):
             filtered_results.append(result)