123456789101112131415161718192021222324252627282930313233343536373839404142 |
# Common logic across Linux and Darwin
# init_vars: set the global variables consumed by the other helpers.
#
# Reads:
#   CGO_CFLAGS   - if it contains a flag starting with "-g", a
#                  RelWithDebInfo build with verbose makefiles and gprof
#                  is configured; otherwise a Release build is used.
# Sets (globals):
#   LLAMACPP_DIR  - directory passed to cmake as the source tree
#   PATCHES       - space-separated patch file names
#   CMAKE_DEFS    - space-separated -D options for the configure step
#   CMAKE_TARGETS - space-separated "--target <name>" options for the build step
init_vars() {
    LLAMACPP_DIR=gguf
    PATCHES="0001-Expose-callable-API-for-server.patch"
    CMAKE_DEFS="-DLLAMA_ACCELERATE=on"
    # TODO - LLAMA_K_QUANTS is stale and needs to be mapped to newer cmake settings
    CMAKE_TARGETS="--target ggml --target ggml_static --target llama --target build_info --target common --target ext_server --target llava_static"

    # Only treat "-g" as a debug request when it begins a flag (start of the
    # string or preceded by whitespace). A plain substring match would also
    # fire on things like "-fno-gnu-unique" or "-I/opt/my-gcc/include".
    if echo "${CGO_CFLAGS}" | grep -E -- '(^|[[:space:]])-g' >/dev/null; then
        CMAKE_DEFS="-DCMAKE_BUILD_TYPE=RelWithDebInfo -DCMAKE_VERBOSE_MAKEFILE=on -DLLAMA_GPROF=on ${CMAKE_DEFS}"
    else
        # TODO - add additional optimization flags...
        CMAKE_DEFS="-DCMAKE_BUILD_TYPE=Release ${CMAKE_DEFS}"
    fi
}
# git_module_setup: initialise the git submodules and force-update the
# "gguf" submodule.
#
# When OLLAMA_SKIP_PATCHING is set to a non-empty value, nothing is touched:
# a notice is printed and the function returns immediately.
git_module_setup() {
    [ -z "${OLLAMA_SKIP_PATCHING}" ] || {
        echo "Skipping submodule initialization"
        return
    }

    git submodule init
    git submodule update --force gguf
}
# apply_patches: apply every patch named in PATCHES to the gguf submodule.
#
# Reads:
#   OLLAMA_SKIP_PATCHING - when non-empty, print a notice and do nothing
#   PATCHES              - space-separated patch file names; each is passed
#                          to git as ../patches/<name> relative to gguf
# Returns:
#   0 when all patches applied (or patching was skipped); otherwise the exit
#   status of the first failing `git apply`. Later patches are not attempted,
#   so they are never stacked on a partially patched tree.
apply_patches() {
    if [ -n "${OLLAMA_SKIP_PATCHING}" ]; then
        echo "Skipping submodule patching"
        return
    fi

    # Workaround git apply not handling creation well for iteration:
    # remove the file first so re-running this function does not trip over it.
    rm -f gguf/examples/server/server.h

    # PATCHES is intentionally unquoted so it splits into one name per word.
    for patch in ${PATCHES}; do
        git -C gguf apply "../patches/${patch}" || return
    done
}
# build: configure the source tree with CMake, then build the selected targets.
#
# Reads (globals):
#   LLAMACPP_DIR  - source directory handed to `cmake -S`
#   BUILD_DIR     - build directory handed to `cmake -B` / `cmake --build`
#   CMAKE_DEFS    - space-separated configure options
#   CMAKE_TARGETS - space-separated `--target <name>` options
# Returns:
#   The exit status of the configure step if it fails (the build step is then
#   skipped); otherwise the exit status of the build step.
build() {
    # Directory arguments are quoted so paths containing spaces stay intact.
    # CMAKE_DEFS and CMAKE_TARGETS are option lists and are deliberately left
    # unquoted so the shell splits them into individual arguments.
    cmake -S "${LLAMACPP_DIR}" -B "${BUILD_DIR}" ${CMAKE_DEFS} || return
    cmake --build "${BUILD_DIR}" ${CMAKE_TARGETS} -j8
}
|