137 lines
3.9 KiB
Bash
137 lines
3.9 KiB
Bash
# common logic across linux and darwin
|
|
|
|
init_vars() {
|
|
case "${GOARCH}" in
|
|
"amd64")
|
|
ARCH="x86_64"
|
|
;;
|
|
"arm64")
|
|
ARCH="arm64"
|
|
;;
|
|
*)
|
|
echo "GOARCH must be set"
|
|
echo "this script is meant to be run from within go generate"
|
|
exit 1
|
|
;;
|
|
esac
|
|
|
|
LLAMACPP_DIR=../llama.cpp
|
|
CMAKE_DEFS="-DCMAKE_SKIP_RPATH=on"
|
|
CMAKE_TARGETS="--target ollama_llama_server"
|
|
if echo "${CGO_CFLAGS}" | grep -- '-g' >/dev/null; then
|
|
CMAKE_DEFS="-DCMAKE_BUILD_TYPE=RelWithDebInfo -DCMAKE_VERBOSE_MAKEFILE=on -DLLAMA_GPROF=on -DLLAMA_SERVER_VERBOSE=on ${CMAKE_DEFS}"
|
|
else
|
|
# TODO - add additional optimization flags...
|
|
CMAKE_DEFS="-DCMAKE_BUILD_TYPE=Release -DLLAMA_SERVER_VERBOSE=off ${CMAKE_DEFS}"
|
|
fi
|
|
case $(uname -s) in
|
|
"Darwin")
|
|
LIB_EXT="dylib"
|
|
WHOLE_ARCHIVE="-Wl,-force_load"
|
|
NO_WHOLE_ARCHIVE=""
|
|
GCC_ARCH="-arch ${ARCH}"
|
|
DIST_BASE=../../dist/darwin-${GOARCH}/
|
|
;;
|
|
"Linux")
|
|
LIB_EXT="so"
|
|
WHOLE_ARCHIVE="-Wl,--whole-archive"
|
|
NO_WHOLE_ARCHIVE="-Wl,--no-whole-archive"
|
|
|
|
# Cross compiling not supported on linux - Use docker
|
|
GCC_ARCH=""
|
|
DIST_BASE=../../dist/linux-${GOARCH}/
|
|
;;
|
|
*)
|
|
;;
|
|
esac
|
|
if [ -z "${CMAKE_CUDA_ARCHITECTURES}" ] ; then
|
|
CMAKE_CUDA_ARCHITECTURES="50;52;61;70;75;80"
|
|
fi
|
|
GZIP=$(which pigz 2>/dev/null || echo "gzip")
|
|
}
|
|
|
|
git_module_setup() {
|
|
if [ -n "${OLLAMA_SKIP_PATCHING}" ]; then
|
|
echo "Skipping submodule initialization"
|
|
return
|
|
fi
|
|
# Make sure the tree is clean after the directory moves
|
|
if [ -d "${LLAMACPP_DIR}/gguf" ]; then
|
|
echo "Cleaning up old submodule"
|
|
rm -rf ${LLAMACPP_DIR}
|
|
fi
|
|
git submodule init
|
|
git submodule update --force ${LLAMACPP_DIR}
|
|
|
|
}
|
|
|
|
apply_patches() {
|
|
# Wire up our CMakefile
|
|
if ! grep ollama ${LLAMACPP_DIR}/CMakeLists.txt; then
|
|
echo 'add_subdirectory(../ext_server ext_server) # ollama' >>${LLAMACPP_DIR}/CMakeLists.txt
|
|
fi
|
|
|
|
if [ -n "$(ls -A ../patches/*.diff)" ]; then
|
|
# apply temporary patches until fix is upstream
|
|
for patch in ../patches/*.diff; do
|
|
for file in $(grep "^+++ " ${patch} | cut -f2 -d' ' | cut -f2- -d/); do
|
|
(cd ${LLAMACPP_DIR}; git checkout ${file})
|
|
done
|
|
done
|
|
for patch in ../patches/*.diff; do
|
|
(cd ${LLAMACPP_DIR} && git apply ${patch})
|
|
done
|
|
fi
|
|
}
|
|
|
|
build() {
|
|
cmake -S ${LLAMACPP_DIR} -B ${BUILD_DIR} ${CMAKE_DEFS}
|
|
cmake --build ${BUILD_DIR} ${CMAKE_TARGETS} -j8
|
|
# remove unnecessary build artifacts
|
|
rm -f ${BUILD_DIR}/bin/ggml-common.h ${BUILD_DIR}/bin/ggml-metal.metal
|
|
}
|
|
|
|
compress() {
|
|
echo "Compressing payloads to reduce overall binary size..."
|
|
rm -rf ${BUILD_DIR}/bin/*.gz
|
|
for f in ${BUILD_DIR}/bin/* ; do
|
|
${GZIP} -n --best -f ${f} &
|
|
compress_pids+=" $!"
|
|
done
|
|
# check for lib directory
|
|
if [ -d ${BUILD_DIR}/lib ]; then
|
|
for f in ${BUILD_DIR}/lib/* ; do
|
|
${GZIP} -n --best -f ${f} &
|
|
compress_pids+=" $!"
|
|
done
|
|
fi
|
|
echo
|
|
}
|
|
|
|
wait_for_compress() {
|
|
for pid in ${compress_pids}; do
|
|
wait $pid
|
|
done
|
|
echo "Finished compression"
|
|
}
|
|
|
|
install() {
|
|
echo "Installing libraries to bin dir ${BUILD_DIR}/bin/"
|
|
for lib in $(find ${BUILD_DIR} -name \*.${LIB_EXT}); do
|
|
rm -f "${BUILD_DIR}/bin/$(basename ${lib})"
|
|
cp -af "${lib}" "${BUILD_DIR}/bin/"
|
|
done
|
|
}
|
|
|
|
# Keep the local tree clean after we're done with the build
|
|
cleanup() {
|
|
(cd ${LLAMACPP_DIR}/ && git checkout CMakeLists.txt)
|
|
|
|
if [ -n "$(ls -A ../patches/*.diff)" ]; then
|
|
for patch in ../patches/*.diff; do
|
|
for file in $(grep "^+++ " ${patch} | cut -f2 -d' ' | cut -f2- -d/); do
|
|
(cd ${LLAMACPP_DIR}; git checkout ${file})
|
|
done
|
|
done
|
|
fi
|
|
}
|