# ollama/llm/llama.cpp/gen_windows.ps1

#!powershell

$ErrorActionPreference = "Stop"

# Resets the script-scoped build settings to their baseline values.
#
# Writes:
#   $script:patches   - patch file names consumed by apply_patches
#   $script:cmakeDefs - arguments handed to the cmake configure step in build
#   $script:config    - configuration name passed to cmake --build / --install
#
# When CGO_CFLAGS carries the -g flag, a verbose RelWithDebInfo build is
# selected; otherwise a quiet Release build is selected.
function init_vars {
    $script:patches = @("0001-Expose-callable-API-for-server.patch")
    $script:cmakeDefs = @("-DBUILD_SHARED_LIBS=on", "-DLLAMA_NATIVE=off", "-DLLAMA_F16C=off", "-DLLAMA_FMA=off", "-DLLAMA_AVX512=off", "-DLLAMA_AVX2=off", "-DLLAMA_AVX=on", "-DLLAMA_K_QUANTS=on", "-DLLAMA_ACCELERATE=on", "-A","x64")

    # -contains tests collection membership. Applied to the raw string it only
    # matched when CGO_CFLAGS was exactly "-g", so split the value into its
    # individual flags first; "-O2 -g" is then recognized as well. An unset
    # variable becomes a single empty token, which never matches.
    $cgoFlags = @("$env:CGO_CFLAGS" -split '\s+')

    if ($cgoFlags -contains "-g") {
        $script:cmakeDefs += @("-DCMAKE_VERBOSE_MAKEFILE=on", "-DLLAMA_SERVER_VERBOSE=on")
        $script:config = "RelWithDebInfo"
    } else {
        $script:cmakeDefs += @("-DLLAMA_SERVER_VERBOSE=off")
        $script:config = "Release"
    }
}

# Initializes the git submodules and force-updates the gguf submodule.
# Exits the script with git's exit code as soon as one of the steps fails.
function git_module_setup {
    # TODO add flags to skip the init/patch logic to make it easier to mod llama.cpp code in-repo
    $gitSteps = @(
        @("submodule", "init"),
        @("submodule", "update", "--force", "gguf")
    )

    foreach ($stepArgs in $gitSteps) {
        # Splat the argument list so each element reaches git as its own argument.
        & git @stepArgs
        if ($LASTEXITCODE -ne 0) {
            exit $LASTEXITCODE
        }
    }
}

# Applies every patch listed in $script:patches to the gguf checkout.
# Exits the script with git's exit code if a patch does not apply.
function apply_patches {
    # Remove server.h before patching; a missing file is not an error.
    Remove-Item -Path "gguf/examples/server/server.h" -ErrorAction Ignore

    foreach ($patch in $script:patches) {
        Write-Host "Applying patch $patch"

        # git runs with -C gguf, so the patch location is given relative to that directory.
        $patchPath = "../patches/$patch"
        & git -C gguf apply $patchPath
        if ($LASTEXITCODE -ne 0) {
            exit $LASTEXITCODE
        }
    }
}

# Configures and compiles the gguf tree with cmake.
#
# Reads:
#   $script:buildDir  - cmake build directory (-B / --build)
#   $script:cmakeDefs - extra arguments for the configure step
#   $script:config    - configuration passed to --config
#
# Exits the script with cmake's exit code if configuring or building fails.
function build {
    $buildTree = $script:buildDir
    $configureDefs = $script:cmakeDefs
    $flavor = $script:config

    # Configure step; the cmake version is printed first for the build log.
    Write-Host "generating config with: cmake -S gguf -B $script:buildDir $script:cmakeDefs"
    & cmake --version
    & cmake -S gguf -B $buildTree $configureDefs
    if ($LASTEXITCODE -ne 0) {
        exit $LASTEXITCODE
    }

    # Compile step.
    Write-Host "building with: cmake --build $script:buildDir --config $script:config"
    & cmake --build $buildTree --config $flavor
    if ($LASTEXITCODE -ne 0) {
        exit $LASTEXITCODE
    }
}

# Installs the tree built in $script:buildDir into $script:installDir using
# the configuration named by $script:config.
# Exits the script with cmake's exit code if the install step fails.
function install {
    $prefix = $script:installDir

    # Clear out whatever is already at the prefix; a missing directory is not an error.
    Remove-Item -Path $prefix -Recurse -Force -ErrorAction Ignore

    & cmake --install $script:buildDir --prefix $prefix --config $script:config
    if ($LASTEXITCODE -ne 0) {
        exit $LASTEXITCODE
    }
}

# Prepare the build settings and the patched gguf submodule.
init_vars
git_module_setup
apply_patches

# first build CPU based
$script:buildDir="gguf/build/wincpu"
$script:installDir="gguf/build/wincpu/dist"

build
# install (not run for the CPU build; the DLL is moved into place below)

# -ea 0 (SilentlyContinue) keeps md quiet when the directories already exist.
md gguf/build/lib -ea 0
md gguf/build/wincpu/dist/lib -ea 0
# -Force replaces a cpu_server.dll left behind by an earlier run. Without it the
# move fails because the destination exists, and $ErrorActionPreference = "Stop"
# turns that failure into a script abort.
mv -Force gguf/build/wincpu/bin/$script:config/ext_server_shared.dll gguf/build/wincpu/dist/lib/cpu_server.dll


# Nope, this barfs on lots of symbol problems
#mv gguf/build/wincpu/examples/server/$script:config/ext_server_shared.dll gguf/build/wincpu/dist/lib/cpu_server.lib
# Nope: this needs lots of include paths to pull in things like msvcprt.lib and other deps
# & cl.exe `
#     gguf/build/wincpu/examples/server/$script:config/ext_server.lib `
#     gguf/build/wincpu/common/$script:config/common.lib `
#     gguf/build/wincpu/$script:config/llama.lib `
#     gguf/build/wincpu/$script:config/ggml_static.lib `
#     /link /DLL /DEF:cpu_server.def /NOENTRY /MACHINE:X64  /OUT:gguf/build/wincpu/dist/lib/cpu_server.dll
# if ($LASTEXITCODE -ne 0) { exit($LASTEXITCODE)}

# CUDA variant, built as a dynamically loaded library.
# Start again from the baseline settings, then layer the CUDA options on top.
init_vars
$script:cmakeDefs = $script:cmakeDefs + @("-DLLAMA_CUBLAS=ON", "-DBUILD_SHARED_LIBS=on")
$script:installDir = "gguf/build/wincuda/dist"
$script:buildDir = "gguf/build/wincuda"

build
install

# Publish the installed server DLL under its CUDA-specific name.
Copy-Item -Path gguf/build/wincuda/dist/bin/ext_server_shared.dll -Destination gguf/build/lib/cuda_server.dll

# TODO - more to do here to create a usable dll


# TODO - implement ROCm support on windows
# For now this section only creates the winrocm lib directory and a .generated
# file inside it; nothing is built.
# -ea 0 (SilentlyContinue) keeps md quiet when the directory already exists.
md gguf/build/winrocm/lib -ea 0
# Appending $null with >> creates the file when it is missing and leaves any
# existing content in place.
echo $null >> gguf/build/winrocm/lib/.generated
# Change history recovered from the blame view of this script (oldest first):
#
# 2023-11-14 01:20:34 +00:00  Add cgo implementation for llama.cpp
#     Run the server.cpp directly inside the Go runtime via cgo while
#     retaining the LLM Go abstractions.
#
# 2023-11-29 19:00:37 +00:00  Adapted rocm support to cgo based llama.cpp
#
# 2023-12-20 22:46:15 +00:00  Revive windows build
#     The windows native setup still needs some more work, but this gets it
#     building again and if you set the PATH properly, you can run the
#     resulting exe on a cuda system.
#
# 2023-12-22 16:47:18 +00:00  Quiet down llama.cpp logging by default
#     By default builds will now produce non-debug and non-verbose binaries.
#     To enable verbose logs in llama.cpp and debug symbols in the native
#     code, set `CGO_CFLAGS=-g`