|
@@ -21,7 +21,8 @@ else ifeq ($(OS),linux)
|
|
|
GPU_LIB_DIR_LINUX := $(HIP_PATH)/lib
|
|
|
GPU_COMPILER_LINUX := $(shell X=$$(which hipcc 2>/dev/null) && echo $$X)
|
|
|
GPU_COMPILER:=$(GPU_COMPILER_LINUX)
|
|
|
- ROCM_TRANSITIVE_LIBS = $(shell ldd $(ROCM_LIBS) | grep "=>" | cut -f2 -d= | cut -f2 -d' ' | grep -e rocm -e amdgpu -e libtinfo -e libnuma -e libelf | sort -u )
|
|
|
+ ROCM_TRANSITIVE_LIBS_INITIAL = $(sort $(shell ldd $(ROCM_LIBS) | grep "=>" | cut -f2 -d= | cut -f2 -d' ' | grep -e rocm -e amdgpu -e libtinfo -e libnuma -e libelf))
|
|
|
+ ROCM_TRANSITIVE_LIBS = $(sort $(shell readlink -f $(ROCM_TRANSITIVE_LIBS_INITIAL)) $(ROCM_TRANSITIVE_LIBS_INITIAL))
|
|
|
endif
|
|
|
|
|
|
# TODO future multi-variant support for ROCm
|
|
@@ -36,14 +37,18 @@ GPU_RUNNER_DRIVER_LIB_LINK := -lamdhip64
|
|
|
GPU_RUNNER_LIBS_SHORT := hipblas rocblas
|
|
|
GPU_PATH_ROOT_WIN=$(dir $(GPU_LIB_DIR_WIN))
|
|
|
GPU_PATH_ROOT_LINUX=$(dir $(GPU_LIB_DIR_LINUX))
|
|
|
-GPU_COMPILER_CFLAGS_WIN = $(CFLAGS)
|
|
|
+GPU_COMPILER_CFLAGS_WIN = $(CFLAGS) -D_WIN32_WINNT=0x602
|
|
|
GPU_COMPILER_CFLAGS_LINUX = $(CFLAGS) -fPIC -D_GNU_SOURCE
|
|
|
-GPU_COMPILER_CXXFLAGS_WIN = $(CXXFLAGS)
|
|
|
+GPU_COMPILER_CXXFLAGS_WIN = $(CXXFLAGS) -D_WIN32_WINNT=0x602
|
|
|
GPU_COMPILER_CXXFLAGS_LINUX = $(CXXFLAGS) -fPIC -D_GNU_SOURCE
|
|
|
|
|
|
ROCM_LIBS = $(wildcard $(addsuffix .$(SHARED_EXT),$(addprefix $(GPU_LIB_DIR)/$(SHARED_PREFIX),$(GPU_RUNNER_LIBS_SHORT))))
|
|
|
-ROCM_DIST_DEPS_DIR = $(abspath $(SRC_DIR)/../dist/$(OS)-$(ARCH)-rocm)/lib/ollama
|
|
|
-ROCM_DIST_DEPS_LIBS = $(addprefix $(ROCM_DIST_DEPS_DIR)/,$(notdir $(ROCM_LIBS)) $(notdir $(ROCM_TRANSITIVE_LIBS)))
|
|
|
+ifeq ($(OS),windows)
|
|
|
+ ROCM_DIST_DEPS_DIR = $(abspath $(SRC_DIR)/../dist/$(OS)-$(ARCH))/lib/ollama
|
|
|
+else ifeq ($(OS),linux)
|
|
|
+ ROCM_DIST_DEPS_DIR = $(abspath $(SRC_DIR)/../dist/$(OS)-$(ARCH)-rocm)/lib/ollama
|
|
|
+endif
|
|
|
+ROCM_DIST_DEPS_LIBS= $(sort $(addprefix $(ROCM_DIST_DEPS_DIR)/,$(notdir $(ROCM_LIBS)) $(notdir $(ROCM_TRANSITIVE_LIBS))))
|
|
|
ROCBLAS_DIST_DEP_MANIFEST = $(ROCM_DIST_DEPS_DIR)/rocblas/library/TensileManifest.txt
|
|
|
|
|
|
ifeq ($(OS),linux)
|
|
@@ -84,8 +89,7 @@ GPU_COMPILER_CUFLAGS = \
|
|
|
-Wno-pass-failed \
|
|
|
-Wno-deprecated-declarations \
|
|
|
-Wno-unused-result \
|
|
|
- -I. \
|
|
|
- $(foreach arch, $(HIP_ARCHS_COMMON), --offload-arch=$(arch))
|
|
|
+ -I.
|
|
|
|
|
|
include make/gpu.make
|
|
|
|
|
@@ -98,4 +102,4 @@ $(ROCBLAS_DIST_DEP_MANIFEST):
|
|
|
@echo "rocblas library copy complete"
|
|
|
$(ROCM_DIST_DEPS_LIBS):
|
|
|
@-mkdir -p $(dir $@)
|
|
|
- $(CP) $(dir $(filter %$(notdir $@),$(ROCM_LIBS) $(ROCM_TRANSITIVE_LIBS)))/$(notdir $@)* $(dir $@)
|
|
|
+ $(CP) $(dir $(filter %$(notdir $@),$(ROCM_LIBS) $(ROCM_TRANSITIVE_LIBS)))/$(notdir $@) $(dir $@)
|