f221637053
* linux gpu support * handle multiple gpus * add cuda docker image (#488) --------- Co-authored-by: Michael Yang <mxyng@pm.me>
22 lines
719 B
Text
22 lines
719 B
Text
# Build stage: compiles the ollama binary on top of the CUDA development image.
# The stage is named so it can be targeted directly (`--target build`); it is
# still stage index 0, so references by index keep working.
FROM nvidia/cuda:12.2.0-devel-ubuntu22.04 AS build

# Go toolchain release to download. Override at build time with
# `--build-arg GOLANG_VERSION=<version>`.
ARG GOLANG_VERSION=1.21.1

WORKDIR /go/src/github.com/jmorganca/ollama

# Toolchain needed by the generate/build step below. Recommended packages are
# skipped and the apt lists are removed in the same layer so they are not
# persisted. ca-certificates is listed explicitly so HTTPS fetches performed by
# git or the Go tool do not depend on what the base image happens to ship.
RUN apt-get update \
    && apt-get install -y --no-install-recommends \
        build-essential \
        ca-certificates \
        cmake \
        git \
    && rm -rf /var/lib/apt/lists/*

# Fetch the Go toolchain tarball and unpack it to /usr/local/go.
# NOTE(review): the download is not integrity-checked; consider
# `ADD --checksum=sha256:<digest>` once the digest for this release is confirmed.
ADD https://dl.google.com/go/go${GOLANG_VERSION}.linux-amd64.tar.gz /tmp/go.tar.gz
RUN tar -xzf /tmp/go.tar.gz -C /usr/local

# Copy the build context into WORKDIR.
COPY . .

# Run code generation, then build the package in WORKDIR using the external
# linker with static linking requested. Go is invoked by absolute path because
# /usr/local/go/bin is not added to PATH in this stage.
RUN /usr/local/go/bin/go generate ./... \
    && /usr/local/go/bin/go build -ldflags '-linkmode external -extldflags "-static"' .
|
|
|
|
# Runtime stage: CUDA runtime image carrying only the compiled binary, run as
# an unprivileged user.
FROM nvidia/cuda:12.2.0-runtime-ubuntu22.04

# Persisted into the container environment (key=value form; the legacy
# space-separated ENV syntax is deprecated).
ENV OLLAMA_HOST=0.0.0.0

# Name of the unprivileged account and its group; both can be overridden with
# --build-arg.
ARG USER=ollama
ARG GROUP=ollama

# Create the group and a user with a home directory (-m) whose primary group
# is that group. Values are quoted so an overridden name cannot word-split.
RUN groupadd "$GROUP" && useradd -m -g "$GROUP" "$USER"

# Pull the binary produced by the first stage (index 0) of this Dockerfile.
COPY --from=0 /go/src/github.com/jmorganca/ollama/ollama /bin/ollama

# Drop root before the process starts.
USER ${USER}:${GROUP}

# The binary is the entrypoint; "serve" is the default argument and can be
# replaced on the `docker run` command line.
ENTRYPOINT ["/bin/ollama"]
CMD ["serve"]
|