b754f5a6a3
* Remove llama.cpp submodule and shift new build to top * CI: install msys and clang gcc on win Needed for deepseek to work properly on windows
340 lines
No EOL
13 KiB
YAML
340 lines
No EOL
13 KiB
YAML
name: test
|
|
|
|
concurrency:
|
|
# For PRs, later CI runs preempt previous ones. e.g. a force push on a PR
|
|
# cancels running CI jobs and starts all new ones.
|
|
#
|
|
# For non-PR pushes, concurrency.group needs to be unique for every distinct
|
|
# CI run we want to have happen. Use run_id, which in practice means all
|
|
# non-PR CI runs will be allowed to run without preempting each other.
|
|
group: ${{ github.workflow }}-$${{ github.pull_request.number || github.run_id }}
|
|
cancel-in-progress: true
|
|
|
|
on:
|
|
pull_request:
|
|
paths:
|
|
- '**/*'
|
|
- '!docs/**'
|
|
- '!README.md'
|
|
|
|
jobs:
|
|
changes:
|
|
runs-on: ubuntu-latest
|
|
outputs:
|
|
RUNNERS: ${{ steps.changes.outputs.RUNNERS }}
|
|
steps:
|
|
- uses: actions/checkout@v4
|
|
with:
|
|
fetch-depth: 0
|
|
- id: changes
|
|
run: |
|
|
changed() {
|
|
git diff-tree -r --no-commit-id --name-only \
|
|
$(git merge-base ${{ github.event.pull_request.base.sha }} ${{ github.event.pull_request.head.sha }}) \
|
|
${{ github.event.pull_request.head.sha }} \
|
|
| xargs python3 -c "import sys; from pathlib import Path; print(any(Path(x).match(glob) for x in sys.argv[1:] for glob in '$*'.split(' ')))"
|
|
}
|
|
|
|
{
|
|
echo RUNNERS=$(changed 'llama/**')
|
|
} >>$GITHUB_OUTPUT
|
|
|
|
runners-linux-cuda:
|
|
needs: [changes]
|
|
if: ${{ needs.changes.outputs.RUNNERS == 'True' }}
|
|
strategy:
|
|
matrix:
|
|
cuda-version:
|
|
- '11.8.0'
|
|
runs-on: linux
|
|
container: nvidia/cuda:${{ matrix.cuda-version }}-devel-ubuntu20.04
|
|
steps:
|
|
- run: |
|
|
apt-get update && apt-get install -y git build-essential curl
|
|
env:
|
|
DEBIAN_FRONTEND: noninteractive
|
|
- uses: actions/checkout@v4
|
|
- uses: actions/setup-go@v4
|
|
with:
|
|
go-version-file: go.mod
|
|
cache: true
|
|
- run: go get ./...
|
|
- run: |
|
|
git config --global --add safe.directory /__w/ollama/ollama
|
|
cores=$(grep '^core id' /proc/cpuinfo |sort -u|wc -l)
|
|
make -j $cores cuda_v11
|
|
runners-linux-rocm:
|
|
needs: [changes]
|
|
if: ${{ needs.changes.outputs.RUNNERS == 'True' }}
|
|
strategy:
|
|
matrix:
|
|
rocm-version:
|
|
- '6.1.2'
|
|
runs-on: linux
|
|
container: rocm/dev-ubuntu-20.04:${{ matrix.rocm-version }}
|
|
steps:
|
|
- run: |
|
|
apt-get update && apt-get install -y git build-essential curl rocm-libs
|
|
env:
|
|
DEBIAN_FRONTEND: noninteractive
|
|
- uses: actions/checkout@v4
|
|
- uses: actions/setup-go@v4
|
|
with:
|
|
go-version-file: go.mod
|
|
cache: true
|
|
- run: go get ./...
|
|
- run: |
|
|
git config --global --add safe.directory /__w/ollama/ollama
|
|
cores=$(grep '^core id' /proc/cpuinfo |sort -u|wc -l)
|
|
make -j $cores rocm
|
|
|
|
# ROCm generation step
|
|
runners-windows-rocm:
|
|
needs: [changes]
|
|
if: ${{ needs.changes.outputs.RUNNERS == 'True' }}
|
|
runs-on: windows
|
|
steps:
|
|
- uses: actions/checkout@v4
|
|
- uses: actions/setup-go@v5
|
|
with:
|
|
go-version-file: go.mod
|
|
cache: true
|
|
- name: 'Install ROCm'
|
|
run: |
|
|
$ErrorActionPreference = "Stop"
|
|
write-host "downloading AMD HIP Installer"
|
|
Invoke-WebRequest -Uri "https://download.amd.com/developer/eula/rocm-hub/AMD-Software-PRO-Edition-24.Q3-WinSvr2022-For-HIP.exe" -OutFile "${env:RUNNER_TEMP}\rocm-install.exe"
|
|
write-host "Installing AMD HIP"
|
|
Start-Process "${env:RUNNER_TEMP}\rocm-install.exe" -ArgumentList '-install' -NoNewWindow -Wait
|
|
write-host "Completed AMD HIP"
|
|
- name: 'Verify ROCm'
|
|
run: |
|
|
& 'C:\Program Files\AMD\ROCm\*\bin\clang.exe' --version
|
|
- name: Install msys2
|
|
run: |
|
|
$msys2_url="https://github.com/msys2/msys2-installer/releases/download/2024-07-27/msys2-x86_64-20240727.exe"
|
|
write-host "Downloading msys2"
|
|
Invoke-WebRequest -Uri "${msys2_url}" -OutFile "${env:RUNNER_TEMP}\msys2.exe"
|
|
write-host "Installing msys2"
|
|
Start-Process "${env:RUNNER_TEMP}\msys2.exe" -ArgumentList @("in", "--confirm-command", "--accept-messages", "--root", "C:/msys64") -NoNewWindow -Wait
|
|
echo "c:\msys64\usr\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append
|
|
- name: Install msys2 tools
|
|
run: |
|
|
Start-Process "c:\msys64\usr\bin\pacman.exe" -ArgumentList @("-S", "--noconfirm", "mingw-w64-clang-x86_64-gcc-compat", "mingw-w64-clang-x86_64-clang", "make") -NoNewWindow -Wait
|
|
echo "C:\msys64\clang64\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append
|
|
- name: verify tools
|
|
run: |
|
|
get-command gcc
|
|
gcc --version
|
|
get-command make
|
|
make --version
|
|
- run: go get ./...
|
|
- run: |
|
|
$gopath=(get-command go).source | split-path -parent
|
|
import-module 'C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise\Common7\Tools\Microsoft.VisualStudio.DevShell.dll'
|
|
Enter-VsDevShell -vsinstallpath 'C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise' -skipautomaticlocation -DevCmdArguments '-arch=x64 -no_logo'
|
|
$env:PATH="$gopath;$env:PATH"
|
|
$env:OLLAMA_SKIP_CPU_GENERATE="1"
|
|
$env:HIP_PATH=$(Resolve-Path 'C:\Program Files\AMD\ROCm\*\bin\clang.exe' | split-path | split-path)
|
|
$cores = (Get-ComputerInfo -Property CsProcessors).CsProcessors.NumberOfCores
|
|
write-host $env:HIP_PATH
|
|
make -C llama print-HIP_PATH print-HIP_LIB_DIR
|
|
make -j $cores rocm
|
|
name: make
|
|
|
|
# CUDA generation step
|
|
runners-windows-cuda:
|
|
needs: [changes]
|
|
if: ${{ needs.changes.outputs.RUNNERS == 'True' }}
|
|
runs-on: windows
|
|
steps:
|
|
- uses: actions/checkout@v4
|
|
- uses: actions/setup-go@v5
|
|
with:
|
|
go-version-file: go.mod
|
|
cache: true
|
|
- name: 'Install CUDA'
|
|
run: |
|
|
$ErrorActionPreference = "Stop"
|
|
write-host "downloading CUDA Installer"
|
|
Invoke-WebRequest -Uri "https://developer.download.nvidia.com/compute/cuda/11.3.1/local_installers/cuda_11.3.1_465.89_win10.exe" -OutFile "${env:RUNNER_TEMP}\cuda-install.exe"
|
|
write-host "Installing CUDA"
|
|
Start-Process "${env:RUNNER_TEMP}\cuda-install.exe" -ArgumentList '-s' -NoNewWindow -Wait
|
|
write-host "Completed CUDA"
|
|
$cudaPath=((resolve-path "c:\Program Files\NVIDIA*\CUDA\v*\bin\nvcc.exe")[0].path | split-path | split-path)
|
|
$cudaVer=($cudaPath | split-path -leaf ) -replace 'v(\d+).(\d+)', '$1_$2'
|
|
echo "$cudaPath\bin" >> $env:GITHUB_PATH
|
|
echo "CUDA_PATH=$cudaPath" >> $env:GITHUB_ENV
|
|
echo "CUDA_PATH_V${cudaVer}=$cudaPath" >> $env:GITHUB_ENV
|
|
echo "CUDA_PATH_VX_Y=CUDA_PATH_V${cudaVer}" >> $env:GITHUB_ENV
|
|
- name: 'Verify CUDA'
|
|
run: nvcc -V
|
|
- name: Install msys2
|
|
run: |
|
|
$msys2_url="https://github.com/msys2/msys2-installer/releases/download/2024-07-27/msys2-x86_64-20240727.exe"
|
|
write-host "Downloading msys2"
|
|
Invoke-WebRequest -Uri "${msys2_url}" -OutFile "${env:RUNNER_TEMP}\msys2.exe"
|
|
write-host "Installing msys2"
|
|
Start-Process "${env:RUNNER_TEMP}\msys2.exe" -ArgumentList @("in", "--confirm-command", "--accept-messages", "--root", "C:/msys64") -NoNewWindow -Wait
|
|
echo "c:\msys64\usr\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append
|
|
- name: Install msys2 tools
|
|
run: |
|
|
Start-Process "c:\msys64\usr\bin\pacman.exe" -ArgumentList @("-S", "--noconfirm", "mingw-w64-clang-x86_64-gcc-compat", "mingw-w64-clang-x86_64-clang", "make") -NoNewWindow -Wait
|
|
echo "C:\msys64\clang64\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append
|
|
- name: verify tools
|
|
run: |
|
|
get-command gcc
|
|
gcc --version
|
|
get-command make
|
|
make --version
|
|
- run: go get ./...
|
|
- name: make
|
|
run: |
|
|
$gopath=(get-command go).source | split-path -parent
|
|
$cudabin=(get-command nvcc).source | split-path
|
|
import-module 'C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise\Common7\Tools\Microsoft.VisualStudio.DevShell.dll'
|
|
Enter-VsDevShell -vsinstallpath 'C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise' -skipautomaticlocation -DevCmdArguments '-arch=x64 -no_logo'
|
|
$env:CMAKE_SYSTEM_VERSION="10.0.22621.0"
|
|
$env:PATH="$gopath;$cudabin;$env:PATH"
|
|
$env:OLLAMA_SKIP_CPU_GENERATE="1"
|
|
$cores = (Get-ComputerInfo -Property CsProcessors).CsProcessors.NumberOfCores
|
|
make -j $cores cuda_v11
|
|
env:
|
|
OLLAMA_SKIP_CPU_GENERATE: '1'
|
|
|
|
runners-cpu:
|
|
needs: [changes]
|
|
if: ${{ needs.changes.outputs.RUNNERS == 'True' }}
|
|
strategy:
|
|
matrix:
|
|
os: [ubuntu-latest, macos-latest, windows-2019]
|
|
arch: [amd64, arm64]
|
|
exclude:
|
|
- os: ubuntu-latest
|
|
arch: arm64
|
|
- os: windows-2019
|
|
arch: arm64
|
|
runs-on: ${{ matrix.os }}
|
|
env:
|
|
GOARCH: ${{ matrix.arch }}
|
|
ARCH: ${{ matrix.arch }}
|
|
CGO_ENABLED: '1'
|
|
steps:
|
|
- uses: actions/checkout@v4
|
|
- uses: actions/setup-go@v5
|
|
with:
|
|
go-version-file: go.mod
|
|
cache: true
|
|
- run: go get ./...
|
|
- name: Install msys2
|
|
if: ${{ startsWith(matrix.os, 'windows-') }}
|
|
run: |
|
|
$msys2_url="https://github.com/msys2/msys2-installer/releases/download/2024-07-27/msys2-x86_64-20240727.exe"
|
|
write-host "Downloading msys2"
|
|
Invoke-WebRequest -Uri "${msys2_url}" -OutFile "${env:RUNNER_TEMP}\msys2.exe"
|
|
write-host "Installing msys2"
|
|
Start-Process "${env:RUNNER_TEMP}\msys2.exe" -ArgumentList @("in", "--confirm-command", "--accept-messages", "--root", "C:/msys64") -NoNewWindow -Wait
|
|
echo "c:\msys64\usr\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append
|
|
- name: Install msys2 tools
|
|
if: ${{ startsWith(matrix.os, 'windows-') }}
|
|
run: |
|
|
Start-Process "c:\msys64\usr\bin\pacman.exe" -ArgumentList @("-S", "--noconfirm", "mingw-w64-clang-x86_64-gcc-compat", "mingw-w64-clang-x86_64-clang", "make") -NoNewWindow -Wait
|
|
echo "C:\msys64\clang64\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append
|
|
- name: verify tools
|
|
if: ${{ startsWith(matrix.os, 'windows-') }}
|
|
run: |
|
|
get-command gcc
|
|
gcc --version
|
|
get-command make
|
|
make --version
|
|
- name: 'Build Windows Go Runners'
|
|
if: ${{ startsWith(matrix.os, 'windows-') }}
|
|
run: |
|
|
$gopath=(get-command go).source | split-path -parent
|
|
$gccpath=(get-command gcc).source | split-path -parent
|
|
import-module 'C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise\Common7\Tools\Microsoft.VisualStudio.DevShell.dll'
|
|
Enter-VsDevShell -vsinstallpath 'C:\Program Files (x86)\Microsoft Visual Studio\2019\Enterprise' -skipautomaticlocation -DevCmdArguments '-arch=x64 -no_logo'
|
|
$env:CMAKE_SYSTEM_VERSION="10.0.22621.0"
|
|
$env:PATH="$gopath;$gccpath;$env:PATH"
|
|
echo $env:PATH
|
|
make -j 4
|
|
- name: 'Build Unix Go Runners'
|
|
if: ${{ ! startsWith(matrix.os, 'windows-') }}
|
|
run: make -j 4
|
|
- run: go build .
|
|
|
|
lint:
|
|
strategy:
|
|
matrix:
|
|
os: [ubuntu-latest, macos-latest, windows-2019]
|
|
arch: [amd64, arm64]
|
|
exclude:
|
|
- os: ubuntu-latest
|
|
arch: arm64
|
|
- os: windows-2019
|
|
arch: arm64
|
|
- os: macos-latest
|
|
arch: amd64
|
|
runs-on: ${{ matrix.os }}
|
|
env:
|
|
GOARCH: ${{ matrix.arch }}
|
|
CGO_ENABLED: '1'
|
|
steps:
|
|
- uses: actions/checkout@v4
|
|
with:
|
|
submodules: recursive
|
|
- uses: actions/setup-go@v5
|
|
with:
|
|
go-version-file: go.mod
|
|
cache: false
|
|
- run: |
|
|
case ${{ matrix.arch }} in
|
|
amd64) echo ARCH=x86_64 ;;
|
|
arm64) echo ARCH=arm64 ;;
|
|
esac >>$GITHUB_ENV
|
|
shell: bash
|
|
- uses: golangci/golangci-lint-action@v6
|
|
with:
|
|
args: --timeout 8m0s -v
|
|
test:
|
|
strategy:
|
|
matrix:
|
|
os: [ubuntu-latest, macos-latest, windows-2019]
|
|
arch: [amd64]
|
|
exclude:
|
|
- os: ubuntu-latest
|
|
arch: arm64
|
|
- os: windows-2019
|
|
arch: arm64
|
|
runs-on: ${{ matrix.os }}
|
|
env:
|
|
GOARCH: ${{ matrix.arch }}
|
|
CGO_ENABLED: '1'
|
|
steps:
|
|
- uses: actions/checkout@v4
|
|
with:
|
|
submodules: recursive
|
|
- uses: actions/setup-go@v5
|
|
with:
|
|
go-version-file: go.mod
|
|
cache: true
|
|
- run: |
|
|
case ${{ matrix.arch }} in
|
|
amd64) echo ARCH=amd64 ;;
|
|
arm64) echo ARCH=arm64 ;;
|
|
esac >>$GITHUB_ENV
|
|
shell: bash
|
|
- run: go build
|
|
- run: go test -v ./...
|
|
|
|
patches:
|
|
needs: [changes]
|
|
if: ${{ needs.changes.outputs.RUNNERS == 'True' }}
|
|
runs-on: ubuntu-latest
|
|
steps:
|
|
- uses: actions/checkout@v4
|
|
with:
|
|
submodules: recursive
|
|
- name: Verify patches carry all the changes
|
|
run: |
|
|
make apply-patches sync && git diff --compact-summary --exit-code llama |