123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100 |
# Common logic across linux and darwin
#######################################
# Initialise the build variables used by the other helpers in this file.
# Globals read:
#   GOARCH      - optional; "amd64"/"arm64" select ARCH directly, anything
#                 else falls back to `uname -m`
#   CGO_CFLAGS  - optional; a flag starting with "-g" selects a debug build
# Globals written:
#   ARCH, LLAMACPP_DIR, CMAKE_DEFS, CMAKE_TARGETS, and (on Darwin/Linux only)
#   LIB_EXT, WHOLE_ARCHIVE, NO_WHOLE_ARCHIVE, GCC_ARCH
# On any other OS the platform-specific variables are left untouched.
#######################################
init_vars() {
    case "${GOARCH:-}" in
    "amd64")
        ARCH="x86_64"
        ;;
    "arm64")
        ARCH="arm64"
        ;;
    *)
        # Normalise the Linux spelling "aarch64" to "arm64"
        ARCH=$(uname -m | sed -e "s/aarch64/arm64/g")
        ;;
    esac
    LLAMACPP_DIR=../llama.cpp
    CMAKE_DEFS=""
    CMAKE_TARGETS="--target ext_server"
    # Only treat "-g" as a debug request when it begins a flag (-g, -g3, -ggdb);
    # a bare substring match would also fire on paths such as -I/opt/my-gcc/include.
    if printf '%s\n' "${CGO_CFLAGS:-}" | grep -Eq -- '(^|[[:space:]])-g'; then
        CMAKE_DEFS="-DCMAKE_BUILD_TYPE=RelWithDebInfo -DCMAKE_VERBOSE_MAKEFILE=on -DLLAMA_GPROF=on -DLLAMA_SERVER_VERBOSE=on ${CMAKE_DEFS}"
    else
        # TODO - add additional optimization flags...
        CMAKE_DEFS="-DCMAKE_BUILD_TYPE=Release -DLLAMA_SERVER_VERBOSE=off ${CMAKE_DEFS}"
    fi
    case "$(uname -s)" in
    "Darwin")
        LIB_EXT="dylib"
        WHOLE_ARCHIVE="-Wl,-force_load"
        NO_WHOLE_ARCHIVE=""
        GCC_ARCH="-arch ${ARCH}"
        ;;
    "Linux")
        LIB_EXT="so"
        WHOLE_ARCHIVE="-Wl,--whole-archive"
        NO_WHOLE_ARCHIVE="-Wl,--no-whole-archive"
        # Cross compiling not supported on linux - Use docker
        GCC_ARCH=""
        ;;
    *)
        ;;
    esac
}
#######################################
# Initialise and force-update the llama.cpp git submodule.
# Globals read:
#   OLLAMA_SKIP_PATCHING - when non-empty, nothing is done
#   LLAMACPP_DIR         - path of the submodule checkout
# Outputs: progress messages on stdout
# Returns: status of the final `git submodule update`
#######################################
git_module_setup() {
    if [ -n "${OLLAMA_SKIP_PATCHING:-}" ]; then
        echo "Skipping submodule initialization"
        return
    fi
    # Make sure the tree is clean after the directory moves
    if [ -d "${LLAMACPP_DIR}/gguf" ]; then
        echo "Cleaning up old submodule"
        # Quoted so a path with spaces is removed as one path; ":?" aborts
        # rather than expanding to an empty argument.
        rm -rf -- "${LLAMACPP_DIR:?}"
    fi
    git submodule init
    git submodule update --force -- "${LLAMACPP_DIR}"
}
#######################################
# Patch the llama.cpp server example in place so it can be built and linked
# into this project.
# Globals read: LLAMACPP_DIR - path of the llama.cpp checkout
# Side effects:
#   - appends an include line (tagged "# ollama") to
#     examples/server/CMakeLists.txt unless "ollama" already appears there
#   - rewrites every "int main(" in examples/server/server.cpp to "int __main("
# Returns: status of the sed/mv rewrite of server.cpp
#######################################
apply_patches() {
    local server_dir="${LLAMACPP_DIR}/examples/server"

    # Wire up our CMakefile (the "# ollama" tag keeps this idempotent)
    if ! grep -q ollama "${server_dir}/CMakeLists.txt"; then
        echo 'include (../../../ext_server/CMakeLists.txt) # ollama' >>"${server_dir}/CMakeLists.txt"
    fi

    # Avoid duplicate main symbols when we link into the cgo binary.
    # Written via a temp file because `sed -i` differs between GNU and BSD sed.
    sed -e 's/int main(/int __main(/g' <"${server_dir}/server.cpp" >"${server_dir}/server.cpp.tmp" &&
        mv -- "${server_dir}/server.cpp.tmp" "${server_dir}/server.cpp"
}
#######################################
# Configure and build llama.cpp with cmake, then link the static archives
# into a shared libext_server library under ${BUILD_DIR}/lib/.
# Globals read:
#   LLAMACPP_DIR, BUILD_DIR              - source and build directories
#   CMAKE_DEFS, CMAKE_TARGETS            - extra cmake arguments (word lists)
#   LIB_EXT                              - shared-library file extension
#   GCC_ARCH, WHOLE_ARCHIVE,
#   NO_WHOLE_ARCHIVE, EXTRA_LIBS         - extra g++ arguments (word lists)
# Returns: non-zero as soon as a cmake/mkdir step fails, otherwise the
#          status of the final g++ link.
#######################################
build() {
    # The flag variables below intentionally stay unquoted: each one holds a
    # whitespace-separated list of arguments (possibly empty) that must be
    # split into separate words. Directory paths are quoted.
    # shellcheck disable=SC2086
    cmake -S "${LLAMACPP_DIR}" -B "${BUILD_DIR}" ${CMAKE_DEFS} || return
    # shellcheck disable=SC2086
    cmake --build "${BUILD_DIR}" ${CMAKE_TARGETS} -j8 || return
    mkdir -p "${BUILD_DIR}/lib/" || return
    # '$ORIGIN' is passed literally to the linker as the rpath entry.
    # shellcheck disable=SC2086
    g++ -fPIC -g -shared -o "${BUILD_DIR}/lib/libext_server.${LIB_EXT}" \
        ${GCC_ARCH} \
        ${WHOLE_ARCHIVE} "${BUILD_DIR}/examples/server/libext_server.a" ${NO_WHOLE_ARCHIVE} \
        "${BUILD_DIR}/common/libcommon.a" \
        "${BUILD_DIR}/libllama.a" \
        '-Wl,-rpath,$ORIGIN' \
        -lpthread -ldl -lm \
        ${EXTRA_LIBS:-}
}
#######################################
# gzip every built library in ${BUILD_DIR}/lib/ in parallel.
# Globals read:
#   BUILD_DIR - build directory containing lib/
#   LIB_EXT   - library extension; files matching *.${LIB_EXT}* are compressed
# Outputs: progress messages on stdout
# Returns: 0 when every gzip succeeded (or there was nothing to do),
#          otherwise the status of the last gzip job that failed.
#######################################
compress_libs() {
    local lib pid
    local pids=""
    local rc=0

    echo "Compressing payloads to reduce overall binary size..."
    for lib in "${BUILD_DIR}"/lib/*."${LIB_EXT}"*; do
        # An unmatched glob is left as the literal pattern; skip it.
        [ -f "${lib}" ] || continue
        # Output of a previous run also matches the glob; leave it alone.
        case "${lib}" in
        *.gz) continue ;;
        esac
        gzip --best -- "${lib}" &
        pids="${pids} $!"
    done
    echo
    # PIDs are plain integers, so word-splitting the list is safe here.
    for pid in ${pids}; do
        wait "${pid}" || rc=$?
    done
    if [ "${rc}" -ne 0 ]; then
        return "${rc}"
    fi
    echo "Finished compression"
}
#######################################
# Keep the local tree clean after we're done with the build: restore
# CMakeLists.txt and server.cpp in the llama.cpp server example via
# `git checkout`.
# Globals read: LLAMACPP_DIR - path of the llama.cpp checkout
# Returns: non-zero if the directory cannot be entered or git fails.
#######################################
cleanup() {
    # Subshell so the caller's working directory is not changed; "--" makes
    # git treat the names as paths rather than possible branch names.
    (cd "${LLAMACPP_DIR}/examples/server/" && git checkout -- CMakeLists.txt server.cpp)
}
|