浏览代码

Workaround buggy P2P ROCm copy on windows (#7466)

This enables the workaround code only on Windows, which should help Windows users with multiple AMD GPUs.
Daniel Hiltgen 5 月之前
父节点
当前提交
1618700c5a
共有 1 个文件被更改,包括 6 次插入和 0 次删除
  1. 6 0
      llama/make/Makefile.rocm

+ 6 - 0
llama/make/Makefile.rocm

@@ -92,6 +92,12 @@ GPU_COMPILER_CUFLAGS = \
 	-Wno-unused-result \
 	-I.
 
+# Workaround buggy P2P copy on some windows multi-GPU setups
+# This workaround breaks linux systems with small system RAM, so only enable on windows
+ifeq ($(OS),windows)
+	GPU_COMPILER_CUFLAGS += -DGGML_CUDA_NO_PEER_COPY=1
+endif
+
 include make/gpu.make
 
 # Adjust the rules from gpu.make to handle the ROCm dependencies properly