#!/usr/bin/env bash
#
# Builds ggml-hipblas.dll: compiles the ggml CUDA/HIP sources with hipcc into a
# single shared library that carries device code for several AMD GPU targets.
#
# All paths are relative (sources, ggml-cuda/*.cu, and -I.), so run this from
# the directory that contains those files.
#
# NOTE(review): the .dll output name, --dependent-lib=msvcrt and
# /subsystem:console suggest this targets Windows — confirm against the
# environment this script is actually run in.

set -euo pipefail

# The arguments live in an array rather than in one backslash-continued
# command so that individual flags can be commented out in place.
hipcc_args=(
  # Parallelism and optimization level.
  -parallel-jobs=12
  -O3

  # GPU architectures to build for.
  --offload-arch=gfx900
  --offload-arch=gfx940
  --offload-arch=gfx941
  --offload-arch=gfx942
  --offload-arch=gfx1010
  --offload-arch=gfx1012
  --offload-arch=gfx1030
  --offload-arch=gfx1100
  --offload-arch=gfx1101
  --offload-arch=gfx1102
  # Disabled targets, kept for reference (reason for disabling not recorded):
  # --offload-arch='gfx906:xnack-'
  # --offload-arch='gfx908:xnack-'
  # --offload-arch='gfx90a:xnack+'
  # --offload-arch='gfx90a:xnack-'

  # Preprocessor definitions.
  -DGGML_USE_CUDA
  -DGGML_BUILD=1
  -DGGML_SHARED=1
  -DGGML_CUDA_DMMV_X=32
  -DGGML_CUDA_MMV_Y=1
  -DGGML_SCHED_MAX_COPIES=4
  -DGGML_USE_HIPBLAS
  -DGGML_USE_LLAMAFILE
  -DHIP_FAST_MATH
  -DNDEBUG
  -DK_QUANTS_PER_ITERATION=2
  -D_CRT_SECURE_NO_WARNINGS
  # Disabled definitions, kept for reference:
  # -D_DLL
  # -D_MT
  # -D_XOPEN_SOURCE=600

  # C runtime selection and linker subsystem.
  -Xclang --dependent-lib=msvcrt
  -Wl,/subsystem:console

  # Warnings silenced for this build.
  -Wno-expansion-to-defined
  -Wno-invalid-noreturn
  -Wno-ignored-attributes
  -Wno-pass-failed
  -Wno-deprecated-declarations

  # Header search path and libraries to link against.
  -I.
  -lhipblas -lamdhip64 -lrocblas

  # Produce a shared library with this file name.
  -shared
  -o ggml-hipblas.dll
)

# Translation units to compile. The glob is expanded here, when the array is
# assigned; if nothing matches, the literal pattern is passed through and the
# compiler reports the missing file.
sources=(
  ggml-cuda.cu
  ggml-cuda/*.cu
  ggml.c
  ggml-backend.c
  ggml-alloc.c
  ggml-quants.c
  sgemm.cpp
)

hipcc "${hipcc_args[@]}" "${sources[@]}"