1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253 |
- # common logic accross linux and darwin
- init_vars() {
- LLAMACPP_DIR=gguf
- PATCHES="0001-Expose-callable-API-for-server.patch"
- CMAKE_DEFS=""
- CMAKE_TARGETS="--target ggml --target ggml_static --target llama --target build_info --target common --target ext_server --target llava_static"
- if echo "${CGO_CFLAGS}" | grep -- '-g' >/dev/null; then
- CMAKE_DEFS="-DCMAKE_BUILD_TYPE=RelWithDebInfo -DCMAKE_VERBOSE_MAKEFILE=on -DLLAMA_GPROF=on -DLLAMA_SERVER_VERBOSE=on"
- else
- # TODO - add additional optimization flags...
- CMAKE_DEFS="-DCMAKE_BUILD_TYPE=Release -DLLAMA_SERVER_VERBOSE=off"
- fi
- }
- git_module_setup() {
- if [ -n "${OLLAMA_SKIP_PATCHING}" ]; then
- echo "Skipping submodule initialization"
- return
- fi
- git submodule init
- git submodule update --force gguf
- }
- apply_patches() {
- # Wire up our CMakefile
- if ! grep ollama gguf/examples/server/CMakeLists.txt; then
- echo 'include (../../../CMakeLists.txt) # ollama' >>gguf/examples/server/CMakeLists.txt
- fi
- # Avoid duplicate main symbols when we link into the cgo binary
- sed -e 's/int main(/int __main(/g' <./gguf/examples/server/server.cpp >./gguf/examples/server/server.cpp.tmp &&
- mv ./gguf/examples/server/server.cpp.tmp ./gguf/examples/server/server.cpp
- }
- build() {
- cmake -S ${LLAMACPP_DIR} -B ${BUILD_DIR} ${CMAKE_DEFS}
- cmake --build ${BUILD_DIR} ${CMAKE_TARGETS} -j8
- }
- install() {
- rm -rf ${BUILD_DIR}/lib
- mkdir -p ${BUILD_DIR}/lib
- cp ${BUILD_DIR}/examples/server/libext_server.a ${BUILD_DIR}/lib
- cp ${BUILD_DIR}/common/libcommon.a ${BUILD_DIR}/lib
- cp ${BUILD_DIR}/libllama.a ${BUILD_DIR}/lib
- cp ${BUILD_DIR}/libggml_static.a ${BUILD_DIR}/lib
- }
- # Keep the local tree clean after we're done with the build
- cleanup() {
- (cd gguf/examples/server/ && git checkout CMakeLists.txt server.cpp)
- }
|