# common logic across linux and darwin
#
# This file only defines functions; it is meant to be sourced by the
# platform-specific generate scripts, which are expected to set BUILD_DIR
# (and optionally EXTRA_LIBS) before calling build / compress_libs.

#######################################
# Initialise the variables shared by the other helpers.
# Globals read:
#   GOARCH      - target Go architecture (optional; falls back to uname -m)
#   CGO_CFLAGS  - when it contains a flag starting with -g, a debug-friendly
#                 build configuration is selected
# Globals written:
#   ARCH, LLAMACPP_DIR, CMAKE_DEFS, CMAKE_TARGETS,
#   LIB_EXT, WHOLE_ARCHIVE, NO_WHOLE_ARCHIVE, GCC_ARCH
#   (the last four are only set on Darwin and Linux)
#######################################
init_vars() {
    case "${GOARCH:-}" in
    "amd64")
        ARCH="x86_64"
        ;;
    "arm64")
        ARCH="arm64"
        ;;
    *)
        # Unknown/unset GOARCH: use the host architecture, normalised to
        # the "arm64" spelling.
        ARCH=$(uname -m | sed -e "s/aarch64/arm64/g")
        ;;
    esac

    LLAMACPP_DIR=../llama.cpp
    CMAKE_DEFS=""
    CMAKE_TARGETS="--target ext_server"

    # Only treat -g as a debug request when it starts a flag token
    # (-g, -g3, -ggdb, ...). A bare substring match would also fire on
    # things like -I/opt/my-gcc/include.
    if printf '%s\n' "${CGO_CFLAGS:-}" | grep -Eq -- '(^|[[:space:]])-g'; then
        CMAKE_DEFS="-DCMAKE_BUILD_TYPE=RelWithDebInfo -DCMAKE_VERBOSE_MAKEFILE=on -DLLAMA_GPROF=on -DLLAMA_SERVER_VERBOSE=on ${CMAKE_DEFS}"
    else
        # TODO - add additional optimization flags...
        CMAKE_DEFS="-DCMAKE_BUILD_TYPE=Release -DLLAMA_SERVER_VERBOSE=off ${CMAKE_DEFS}"
    fi

    case "$(uname -s)" in
    "Darwin")
        LIB_EXT="dylib"
        WHOLE_ARCHIVE="-Wl,-force_load"
        NO_WHOLE_ARCHIVE=""
        GCC_ARCH="-arch ${ARCH}"
        ;;
    "Linux")
        LIB_EXT="so"
        WHOLE_ARCHIVE="-Wl,--whole-archive"
        NO_WHOLE_ARCHIVE="-Wl,--no-whole-archive"

        # Cross compiling not supported on linux - Use docker
        GCC_ARCH=""
        ;;
    *)
        # Other platforms: the linker-related variables are left untouched.
        ;;
    esac
}

#######################################
# Initialise and update the llama.cpp git submodule.
# Globals read:
#   OLLAMA_SKIP_PATCHING - when non-empty, do nothing except print a notice
#   LLAMACPP_DIR         - path of the submodule checkout
#######################################
git_module_setup() {
    if [ -n "${OLLAMA_SKIP_PATCHING:-}" ]; then
        echo "Skipping submodule initialization"
        return
    fi

    # Make sure the tree is clean after the directory moves
    if [ -d "${LLAMACPP_DIR}/gguf" ]; then
        echo "Cleaning up old submodule"
        # :? aborts instead of expanding to an empty path.
        rm -rf -- "${LLAMACPP_DIR:?}"
    fi

    git submodule init
    git submodule update --force "${LLAMACPP_DIR}"
}

#######################################
# Patch the llama.cpp server example so it can be linked into the cgo binary.
# Safe to call repeatedly: the include line is appended only once and the
# main() rename does not match its own output.
# Globals read:
#   LLAMACPP_DIR
#######################################
apply_patches() {
    # Wire up our CMakefile
    if ! grep -q ollama "${LLAMACPP_DIR}/examples/server/CMakeLists.txt"; then
        echo 'include (../../../ext_server/CMakeLists.txt) # ollama' >>"${LLAMACPP_DIR}/examples/server/CMakeLists.txt"
    fi

    # Avoid duplicate main symbols when we link into the cgo binary
    sed -e 's/int main(/int __main(/g' <"${LLAMACPP_DIR}/examples/server/server.cpp" >"${LLAMACPP_DIR}/examples/server/server.cpp.tmp" &&
        mv "${LLAMACPP_DIR}/examples/server/server.cpp.tmp" "${LLAMACPP_DIR}/examples/server/server.cpp"
}

#######################################
# Configure and build the CMake targets, then link the static archives into
# ${BUILD_DIR}/lib/libext_server.${LIB_EXT}.
# Globals read:
#   LLAMACPP_DIR, BUILD_DIR, CMAKE_DEFS, CMAKE_TARGETS, LIB_EXT,
#   GCC_ARCH, WHOLE_ARCHIVE, NO_WHOLE_ARCHIVE, EXTRA_LIBS (optional)
# Returns:
#   non-zero as soon as any step fails
#######################################
# The flag variables below hold several (or zero) arguments each, so they
# are deliberately left unquoted to be word-split.
# shellcheck disable=SC2086
build() {
    cmake -S "${LLAMACPP_DIR}" -B "${BUILD_DIR}" ${CMAKE_DEFS} || return
    cmake --build "${BUILD_DIR}" ${CMAKE_TARGETS} -j8 || return
    mkdir -p "${BUILD_DIR}/lib/" || return
    g++ -fPIC -g -shared -o "${BUILD_DIR}/lib/libext_server.${LIB_EXT}" \
        ${GCC_ARCH} \
        ${WHOLE_ARCHIVE} "${BUILD_DIR}/examples/server/libext_server.a" ${NO_WHOLE_ARCHIVE} \
        "${BUILD_DIR}/common/libcommon.a" \
        "${BUILD_DIR}/libllama.a" \
        -Wl,-rpath,\$ORIGIN \
        -lpthread -ldl -lm \
        ${EXTRA_LIBS:-}
}

#######################################
# gzip every library in ${BUILD_DIR}/lib in parallel, replacing any
# previously compressed payloads.
# Globals read:
#   BUILD_DIR, LIB_EXT
# Returns:
#   0 on success (including when there is nothing to compress), otherwise
#   the exit status of a failed gzip job
#######################################
compress_libs() {
    local lib pid pids="" status=0

    echo "Compressing payloads to reduce overall binary size..."
    rm -rf -- "${BUILD_DIR}"/lib/*."${LIB_EXT}"*.gz
    for lib in "${BUILD_DIR}"/lib/*."${LIB_EXT}"*; do
        # An unmatched glob stays literal; skip it rather than hand a
        # non-existent path to gzip.
        [ -e "${lib}" ] || continue
        gzip --best -f -- "${lib}" &
        pids="${pids} $!"
    done
    echo
    # PIDs never contain whitespace, so splitting the list is safe here.
    for pid in ${pids}; do
        wait "${pid}" || status=$?
    done
    if [ "${status}" -ne 0 ]; then
        echo "Compression failed" >&2
        return "${status}"
    fi
    echo "Finished compression"
}

# Keep the local tree clean after we're done with the build
cleanup() {
    # Subshell so the caller's working directory is not changed.
    (cd "${LLAMACPP_DIR}/examples/server/" && git checkout -- CMakeLists.txt server.cpp)
}