Timothy J. Baek hai 7 meses
pai
achega
9be73ea94a
Modificáronse 2 ficheiros con 13 adicións e 1 borrado
  1. 1 1
      Dockerfile
  2. 12 0
      backend/open_webui/apps/rag/main.py

+ 1 - 1
Dockerfile

@@ -76,7 +76,7 @@ ENV RAG_EMBEDDING_MODEL="$USE_EMBEDDING_MODEL_DOCKER" \
 ENV HF_HOME="/app/backend/data/cache/embedding/models"
 
 ## Torch Extensions ##
-ENV TORCH_EXTENSIONS_DIR="/.cache/torch_extensions"
+# ENV TORCH_EXTENSIONS_DIR="/.cache/torch_extensions"
 
 #### Other models ##########################################################
 

+ 12 - 0
backend/open_webui/apps/rag/main.py

@@ -206,6 +206,18 @@ def update_reranking_model(
                     print("ColBERT: Loading model", name)
                     self.device = "cuda" if torch.cuda.is_available() else "cpu"
 
+                    if DOCKER:
+                        # Workaround for an issue seen in the Docker container, where
+                        # the torch extension is not loaded properly and the following
+                        # error is thrown:
+                        # /root/.cache/torch_extensions/py311_cpu/segmented_maxsim_cpp/segmented_maxsim_cpp.so: cannot open shared object file: No such file or directory
+                        # The cached extension directory is removed below (best effort)
+                        # before the checkpoint is loaded.
+
+                        torch_extensions = "/root/.cache/torch_extensions/py311_cpu"
+                        try:
+                            shutil.rmtree(torch_extensions)
+                        except:
+                            pass
+
                     self.ckpt = Checkpoint(
                         name,
                         colbert_config=ColBERTConfig(model_name=name),