gen_darwin.sh 3.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384
  1. #!/bin/bash
  2. # This script is intended to run inside the go generate
  3. # working directory must be ./llm/generate/
  4. # TODO - add hardening to detect missing tools (cmake, etc.)
  5. set -ex
  6. set -o pipefail
  7. echo "Starting darwin generate script"
  8. source $(dirname $0)/gen_common.sh
  9. init_vars
  10. git_module_setup
  11. apply_patches
  12. sign() {
  13. if [ -n "$APPLE_IDENTITY" ]; then
  14. codesign -f --timestamp --deep --options=runtime --sign "$APPLE_IDENTITY" --identifier ai.ollama.ollama $1
  15. fi
  16. }
  17. COMMON_DARWIN_DEFS="-DCMAKE_OSX_DEPLOYMENT_TARGET=11.0 -DCMAKE_SYSTEM_NAME=Darwin"
  18. case "${GOARCH}" in
  19. "amd64")
  20. COMMON_CPU_DEFS="${COMMON_DARWIN_DEFS} -DCMAKE_SYSTEM_PROCESSOR=${ARCH} -DCMAKE_OSX_ARCHITECTURES=${ARCH} -DLLAMA_METAL=off -DLLAMA_NATIVE=off"
  21. #
  22. # CPU first for the default library, set up as lowest common denominator for maximum compatibility (including Rosetta)
  23. #
  24. CMAKE_DEFS="${COMMON_CPU_DEFS} -DLLAMA_ACCELERATE=off -DLLAMA_AVX=off -DLLAMA_AVX2=off -DLLAMA_AVX512=off -DLLAMA_FMA=off -DLLAMA_F16C=off ${CMAKE_DEFS}"
  25. BUILD_DIR="${LLAMACPP_DIR}/build/darwin/${ARCH}/cpu"
  26. echo "Building LCD CPU"
  27. build
  28. sign ${LLAMACPP_DIR}/build/darwin/${ARCH}/cpu/lib/libext_server.dylib
  29. compress_libs
  30. #
  31. # ~2011 CPU Dynamic library with more capabilities turned on to optimize performance
  32. # Approximately 400% faster than LCD on same CPU
  33. #
  34. init_vars
  35. CMAKE_DEFS="${COMMON_CPU_DEFS} -DLLAMA_ACCELERATE=off -DLLAMA_AVX=on -DLLAMA_AVX2=off -DLLAMA_AVX512=off -DLLAMA_FMA=off -DLLAMA_F16C=off ${CMAKE_DEFS}"
  36. BUILD_DIR="${LLAMACPP_DIR}/build/darwin/${ARCH}/cpu_avx"
  37. echo "Building AVX CPU"
  38. build
  39. sign ${LLAMACPP_DIR}/build/darwin/${ARCH}/cpu_avx/lib/libext_server.dylib
  40. compress_libs
  41. #
  42. # ~2013 CPU Dynamic library
  43. # Approximately 10% faster than AVX on same CPU
  44. #
  45. init_vars
  46. CMAKE_DEFS="${COMMON_CPU_DEFS} -DLLAMA_ACCELERATE=on -DLLAMA_AVX=on -DLLAMA_AVX2=on -DLLAMA_AVX512=off -DLLAMA_FMA=on -DLLAMA_F16C=on ${CMAKE_DEFS}"
  47. BUILD_DIR="${LLAMACPP_DIR}/build/darwin/${ARCH}/cpu_avx2"
  48. echo "Building AVX2 CPU"
  49. EXTRA_LIBS="${EXTRA_LIBS} -framework Accelerate -framework Foundation"
  50. build
  51. sign ${LLAMACPP_DIR}/build/darwin/${ARCH}/cpu_avx2/lib/libext_server.dylib
  52. compress_libs
  53. ;;
  54. "arm64")
  55. # bundle ggml-common.h and ggml-metal.metal into a single file
  56. grep -v '#include "ggml-common.h"' "${LLAMACPP_DIR}/ggml-metal.metal" | grep -v '#pragma once' > "${LLAMACPP_DIR}/ggml-metal.metal.temp"
  57. echo '#define GGML_COMMON_IMPL_METAL' > "${LLAMACPP_DIR}/ggml-metal.metal"
  58. cat "${LLAMACPP_DIR}/ggml-common.h" | grep -v '#pragma once' >> "${LLAMACPP_DIR}/ggml-metal.metal"
  59. cat "${LLAMACPP_DIR}/ggml-metal.metal.temp" >> "${LLAMACPP_DIR}/ggml-metal.metal"
  60. rm "${LLAMACPP_DIR}/ggml-metal.metal.temp"
  61. CMAKE_DEFS="${COMMON_DARWIN_DEFS} -DLLAMA_METAL_EMBED_LIBRARY=on -DLLAMA_ACCELERATE=on -DCMAKE_SYSTEM_PROCESSOR=${ARCH} -DCMAKE_OSX_ARCHITECTURES=${ARCH} -DLLAMA_METAL=on ${CMAKE_DEFS}"
  62. BUILD_DIR="${LLAMACPP_DIR}/build/darwin/${ARCH}/metal"
  63. EXTRA_LIBS="${EXTRA_LIBS} -framework Accelerate -framework Foundation -framework Metal -framework MetalKit -framework MetalPerformanceShaders"
  64. build
  65. sign ${LLAMACPP_DIR}/build/darwin/${ARCH}/metal/lib/libext_server.dylib
  66. compress_libs
  67. (cd ${LLAMACPP_DIR} && git checkout ggml-metal.metal)
  68. ;;
  69. *)
  70. echo "GOARCH must be set"
  71. echo "this script is meant to be run from within go generate"
  72. exit 1
  73. ;;
  74. esac
  75. cleanup