123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326 |
- name: test
- env:
- ROCM_WINDOWS_URL: https://download.amd.com/developer/eula/rocm-hub/AMD-Software-PRO-Edition-24.Q3-WinSvr2022-For-HIP.exe
- MSYS2_URL: https://github.com/msys2/msys2-installer/releases/download/2024-07-27/msys2-x86_64-20240727.exe
- CUDA_12_WINDOWS_URL: https://developer.download.nvidia.com/compute/cuda/12.4.0/local_installers/cuda_12.4.0_551.61_windows.exe
- CUDA_12_WINDOWS_VER: 12.4
- concurrency:
- # For PRs, later CI runs preempt previous ones. e.g. a force push on a PR
- # cancels running CI jobs and starts all new ones.
- #
- # For non-PR pushes, concurrency.group needs to be unique for every distinct
- # CI run we want to have happen. Use run_id, which in practice means all
- # non-PR CI runs will be allowed to run without preempting each other.
- group: ${{ github.workflow }}-$${{ github.pull_request.number || github.run_id }}
- cancel-in-progress: true
- on:
- pull_request:
- paths:
- - '**/*'
- - '!docs/**'
- - '!README.md'
- jobs:
- changes:
- runs-on: ubuntu-latest
- outputs:
- RUNNERS: ${{ steps.changes.outputs.RUNNERS }}
- steps:
- - uses: actions/checkout@v4
- with:
- fetch-depth: 0
- - id: changes
- run: |
- changed() {
- git diff-tree -r --no-commit-id --name-only \
- $(git merge-base ${{ github.event.pull_request.base.sha }} ${{ github.event.pull_request.head.sha }}) \
- ${{ github.event.pull_request.head.sha }} \
- | xargs python3 -c "import sys; from pathlib import Path; print(any(Path(x).match(glob) for x in sys.argv[1:] for glob in '$*'.split(' ')))"
- }
- {
- echo RUNNERS=$(changed 'llama/**')
- } >>$GITHUB_OUTPUT
- runners-linux-cuda:
- needs: [changes]
- if: ${{ needs.changes.outputs.RUNNERS == 'True' }}
- strategy:
- matrix:
- cuda-version:
- - '11.8.0'
- runs-on: linux
- container: nvidia/cuda:${{ matrix.cuda-version }}-devel-ubuntu20.04
- steps:
- - run: |
- apt-get update && apt-get install -y git build-essential curl
- env:
- DEBIAN_FRONTEND: noninteractive
- - uses: actions/checkout@v4
- - uses: actions/setup-go@v4
- with:
- go-version-file: go.mod
- cache: true
- - run: go get ./...
- - run: |
- git config --global --add safe.directory /__w/ollama/ollama
- cores=$(grep '^core id' /proc/cpuinfo |sort -u|wc -l)
- make -j $cores cuda_v11
- runners-linux-rocm:
- needs: [changes]
- if: ${{ needs.changes.outputs.RUNNERS == 'True' }}
- strategy:
- matrix:
- rocm-version:
- - '6.1.2'
- runs-on: linux
- container: rocm/dev-ubuntu-20.04:${{ matrix.rocm-version }}
- steps:
- - run: |
- apt-get update && apt-get install -y git build-essential curl rocm-libs
- env:
- DEBIAN_FRONTEND: noninteractive
- - uses: actions/checkout@v4
- - uses: actions/setup-go@v4
- with:
- go-version-file: go.mod
- cache: true
- - run: go get ./...
- - run: |
- git config --global --add safe.directory /__w/ollama/ollama
- cores=$(grep '^core id' /proc/cpuinfo |sort -u|wc -l)
- make -j $cores rocm
- # ROCm generation step
- runners-windows-rocm:
- needs: [changes]
- if: ${{ needs.changes.outputs.RUNNERS == 'True' }}
- runs-on: windows
- steps:
- - uses: actions/checkout@v4
- - uses: actions/setup-go@v5
- with:
- go-version-file: go.mod
- cache: true
- - name: Set make jobs default
- run: |
- echo "MAKEFLAGS=--jobs=$((Get-ComputerInfo -Property CsProcessors).CsProcessors.NumberOfCores)" | Out-File -FilePath $env:GITHUB_ENV -Encoding utf8 -Append
- # ROCM installation steps
- - name: 'Cache ROCm installer'
- id: cache-rocm
- uses: actions/cache@v4
- with:
- path: rocm-install.exe
- key: ${{ env.ROCM_WINDOWS_URL }}
- - name: 'Conditionally Download ROCm'
- if: steps.cache-rocm.outputs.cache-hit != 'true'
- run: |
- $ErrorActionPreference = "Stop"
- Invoke-WebRequest -Uri "${env:ROCM_WINDOWS_URL}" -OutFile "rocm-install.exe"
- - name: 'Install ROCm'
- run: |
- Start-Process "rocm-install.exe" -ArgumentList '-install' -NoNewWindow -Wait
- - name: 'Verify ROCm'
- run: |
- & 'C:\Program Files\AMD\ROCm\*\bin\clang.exe' --version
- echo "HIP_PATH=$(Resolve-Path 'C:\Program Files\AMD\ROCm\*\bin\clang.exe' | split-path | split-path | select -first 1)" | Out-File -FilePath $env:GITHUB_ENV -Encoding utf8 -Append
- - name: Add msys paths
- run: |
- echo "c:\msys64\usr\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append
- echo "C:\msys64\clang64\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append
- - name: Install msys2 tools
- run: |
- Start-Process "c:\msys64\usr\bin\pacman.exe" -ArgumentList @("-S", "--noconfirm", "mingw-w64-clang-x86_64-gcc-compat", "mingw-w64-clang-x86_64-clang") -NoNewWindow -Wait
- - name: make rocm runner
- run: |
- import-module 'C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise\Common7\Tools\Microsoft.VisualStudio.DevShell.dll'
- Enter-VsDevShell -vsinstallpath 'C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise' -skipautomaticlocation -DevCmdArguments '-arch=x64 -no_logo'
- if (!(gcc --version | select-string -quiet clang)) { throw "wrong gcc compiler detected - must be clang" }
- make -C llama print-HIP_PATH print-HIP_LIB_DIR
- make rocm
- # CUDA generation step
- runners-windows-cuda:
- needs: [changes]
- if: ${{ needs.changes.outputs.RUNNERS == 'True' }}
- runs-on: windows
- steps:
- - uses: actions/checkout@v4
- - uses: actions/setup-go@v5
- with:
- go-version-file: go.mod
- cache: true
- - name: Set make jobs default
- run: |
- echo "MAKEFLAGS=--jobs=$((Get-ComputerInfo -Property CsProcessors).CsProcessors.NumberOfCores)" | Out-File -FilePath $env:GITHUB_ENV -Encoding utf8 -Append
- # CUDA installation steps
- - name: 'Cache CUDA installer'
- id: cache-cuda
- uses: actions/cache@v4
- with:
- path: cuda-install.exe
- key: ${{ env.CUDA_12_WINDOWS_URL }}
- - name: 'Conditionally Download CUDA'
- if: steps.cache-cuda.outputs.cache-hit != 'true'
- run: |
- $ErrorActionPreference = "Stop"
- Invoke-WebRequest -Uri "${env:CUDA_12_WINDOWS_URL}" -OutFile "cuda-install.exe"
- - name: 'Install CUDA'
- run: |
- $subpackages = @("cudart", "nvcc", "cublas", "cublas_dev") | foreach-object {"${_}_${{ env.CUDA_12_WINDOWS_VER }}"}
- Start-Process "cuda-install.exe" -ArgumentList (@("-s") + $subpackages) -NoNewWindow -Wait
- - name: 'Verify CUDA'
- run: |
- & (resolve-path "c:\Program Files\NVIDIA*\CUDA\v*\bin\nvcc.exe")[0] --version
- $cudaPath=((resolve-path "c:\Program Files\NVIDIA*\CUDA\v*\bin\nvcc.exe")[0].path | split-path | split-path)
- $cudaVer=($cudaPath | split-path -leaf ) -replace 'v(\d+).(\d+)', '$1_$2'
- echo "$cudaPath\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append
- echo "CUDA_PATH=$cudaPath" | Out-File -FilePath $env:GITHUB_ENV -Encoding utf8 -Append
- echo "CUDA_PATH_V${cudaVer}=$cudaPath" | Out-File -FilePath $env:GITHUB_ENV -Encoding utf8 -Append
- echo "CUDA_PATH_VX_Y=CUDA_PATH_V${cudaVer}" | Out-File -FilePath $env:GITHUB_ENV -Encoding utf8 -Append
- - name: Add msys paths
- run: |
- echo "c:\msys64\usr\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append
- echo "C:\msys64\clang64\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append
- - name: Install msys2 tools
- run: |
- Start-Process "c:\msys64\usr\bin\pacman.exe" -ArgumentList @("-S", "--noconfirm", "mingw-w64-clang-x86_64-gcc-compat", "mingw-w64-clang-x86_64-clang") -NoNewWindow -Wait
- - name: make cuda runner
- run: |
- import-module 'C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise\Common7\Tools\Microsoft.VisualStudio.DevShell.dll'
- Enter-VsDevShell -vsinstallpath 'C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise' -skipautomaticlocation -DevCmdArguments '-arch=x64 -no_logo'
- if (!(gcc --version | select-string -quiet clang)) { throw "wrong gcc compiler detected - must be clang" }
- make cuda_v$(($env:CUDA_PATH | split-path -leaf) -replace 'v(\d+).*', '$1')
- runners-cpu:
- needs: [changes]
- if: ${{ needs.changes.outputs.RUNNERS == 'True' }}
- strategy:
- matrix:
- os: [ubuntu-latest, macos-latest, windows-2019]
- arch: [amd64, arm64]
- exclude:
- - os: ubuntu-latest
- arch: arm64
- - os: windows-2019
- arch: arm64
- runs-on: ${{ matrix.os }}
- env:
- GOARCH: ${{ matrix.arch }}
- ARCH: ${{ matrix.arch }}
- CGO_ENABLED: '1'
- steps:
- - uses: actions/checkout@v4
- - uses: actions/setup-go@v5
- with:
- go-version-file: go.mod
- cache: true
- - name: Add msys paths
- if: ${{ startsWith(matrix.os, 'windows-') }}
- run: |
- echo "c:\msys64\usr\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append
- echo "C:\msys64\clang64\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append
- - name: Install msys2 tools
- if: ${{ startsWith(matrix.os, 'windows-') }}
- run: |
- Start-Process "c:\msys64\usr\bin\pacman.exe" -ArgumentList @("-S", "--noconfirm", "mingw-w64-clang-x86_64-gcc-compat", "mingw-w64-clang-x86_64-clang") -NoNewWindow -Wait
- - name: 'Build Windows Go Runners'
- if: ${{ startsWith(matrix.os, 'windows-') }}
- run: |
- $gopath=(get-command go).source | split-path -parent
- $gccpath=(get-command gcc).source | split-path -parent
- import-module 'C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise\Common7\Tools\Microsoft.VisualStudio.DevShell.dll'
- Enter-VsDevShell -vsinstallpath 'C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise' -skipautomaticlocation -DevCmdArguments '-arch=x64 -no_logo'
- $env:CMAKE_SYSTEM_VERSION="10.0.22621.0"
- $env:PATH="$gopath;$gccpath;$env:PATH"
- echo $env:PATH
- if (!(gcc --version | select-string -quiet clang)) { throw "wrong gcc compiler detected - must be clang" }
- make -j 4
- - name: 'Build Unix Go Runners'
- if: ${{ ! startsWith(matrix.os, 'windows-') }}
- run: make -j 4
- - run: go build .
- lint:
- strategy:
- matrix:
- os: [ubuntu-latest, macos-latest, windows-2019]
- arch: [amd64, arm64]
- exclude:
- - os: ubuntu-latest
- arch: arm64
- - os: windows-2019
- arch: arm64
- - os: macos-latest
- arch: amd64
- runs-on: ${{ matrix.os }}
- env:
- GOARCH: ${{ matrix.arch }}
- CGO_ENABLED: '1'
- steps:
- - uses: actions/checkout@v4
- with:
- submodules: recursive
- - uses: actions/setup-go@v5
- with:
- go-version-file: go.mod
- cache: false
- - run: |
- case ${{ matrix.arch }} in
- amd64) echo ARCH=x86_64 ;;
- arm64) echo ARCH=arm64 ;;
- esac >>$GITHUB_ENV
- shell: bash
- - uses: golangci/golangci-lint-action@v6
- with:
- args: --timeout 10m0s -v
- test:
- strategy:
- matrix:
- os: [ubuntu-latest, macos-latest, windows-2019]
- arch: [amd64]
- exclude:
- - os: ubuntu-latest
- arch: arm64
- - os: windows-2019
- arch: arm64
- runs-on: ${{ matrix.os }}
- env:
- GOARCH: ${{ matrix.arch }}
- CGO_ENABLED: '1'
- steps:
- - uses: actions/checkout@v4
- with:
- submodules: recursive
- - uses: actions/setup-go@v5
- with:
- go-version-file: go.mod
- cache: true
- - run: |
- case ${{ matrix.arch }} in
- amd64) echo ARCH=amd64 ;;
- arm64) echo ARCH=arm64 ;;
- esac >>$GITHUB_ENV
- shell: bash
- - run: go build
- - run: go test -v ./...
- patches:
- needs: [changes]
- if: ${{ needs.changes.outputs.RUNNERS == 'True' }}
- runs-on: ubuntu-latest
- steps:
- - uses: actions/checkout@v4
- with:
- submodules: recursive
- - name: Verify patches carry all the changes
- run: |
- make apply-patches sync && git diff --compact-summary --exit-code llama
|