2023-05-22 08:10:14 +00:00
|
|
|
# Tag of the nvidia/cuda base image used by the FROM instruction.
# Override at build time with: --build-arg CUDA_IMAGE=<tag>
ARG CUDA_IMAGE=12.1.1-devel-ubuntu22.04
|
2023-05-31 15:16:32 +00:00
|
|
|
# Base image: nvidia/cuda at the tag selected by the CUDA_IMAGE build argument.
FROM nvidia/cuda:$CUDA_IMAGE
|
2023-05-03 14:29:05 +00:00
|
|
|
|
|
|
|
# We need to set the host to 0.0.0.0 to allow access from outside the container.
# key=value form is used; the space-separated "ENV key value" form is legacy.
ENV HOST=0.0.0.0
|
|
|
|
|
|
|
|
# Copy the build context into a dedicated directory instead of the image's
# filesystem root, so context files cannot overwrite system paths.
# WORKDIR creates /app if missing and makes it the working directory for the
# following instructions and for the container at runtime.
WORKDIR /app
COPY . .
|
|
|
|
|
|
|
|
# Install Python 3 and pip from the distribution packages.
# apt-get is used instead of apt, whose command-line interface is not intended
# for scripts. The package index is deleted in the same layer so it does not
# add to the image size.
# NOTE(review): --no-install-recommends is deliberately not added; the
# packages recommended by python3-pip may be needed by the source build of
# llama-cpp-python later in this file. Confirm before trimming.
RUN apt-get update \
    && apt-get install -y python3 python3-pip \
    && rm -rf /var/lib/apt/lists/*
|
|
|
|
# Upgrade pip and install the Python packages listed below.
# --no-cache-dir keeps pip's download/wheel cache out of the image layer.
RUN python3 -m pip install --no-cache-dir --upgrade \
        pip \
        pytest \
        cmake \
        scikit-build \
        setuptools \
        fastapi \
        uvicorn \
        sse-starlette
|
|
|
|
|
2023-05-31 15:16:32 +00:00
|
|
|
# Install llama-cpp-python with LLAMA_CUBLAS=1 set for this command only.
# NOTE(review): presumably this variable enables the cuBLAS (CUDA) build of
# the bundled llama.cpp. Confirm against the llama-cpp-python install docs
# for the version being installed.
# "python3 -m pip" matches the invocation used for the other Python packages;
# --no-cache-dir keeps pip's cache out of the image layer.
RUN LLAMA_CUBLAS=1 python3 -m pip install --no-cache-dir llama-cpp-python
|
2023-05-03 14:29:05 +00:00
|
|
|
|
|
|
|
# Run the server.
# Exec (JSON array) form starts python3 directly rather than through
# "/bin/sh -c", so the Python process receives the container's stop signals.
CMD ["python3", "-m", "llama_cpp.server"]
|