瀏覽代碼

Only enable numa on CPUs (#6484)

The numa flag may be degrading performance on multi-socket systems running GPU loads.
Daniel Hiltgen 8 月之前
父節點
當前提交
0f92b19bec
共有 1 個文件被更改，包括 1 次插入和 1 次刪除
  1. 1 1
      llm/server.go

+ 1 - 1
llm/server.go

@@ -258,7 +258,7 @@ func NewLlamaServer(gpus gpu.GpuInfoList, model string, ggml *GGML, adapters, pr
 		params = append(params, "--mlock")
 		params = append(params, "--mlock")
 	}
 	}
 
 
-	if gpu.IsNUMA() {
+	if gpu.IsNUMA() && gpus[0].Library == "cpu" {
 		numaMode := "distribute"
 		numaMode := "distribute"
 		if runtime.GOOS == "linux" {
 		if runtime.GOOS == "linux" {
 			if _, err := exec.LookPath("numactl"); err == nil {
 			if _, err := exec.LookPath("numactl"); err == nil {