# Commit 0409c1fa59
#   * docker: set PATH, LD_LIBRARY_PATH, and capabilities
#   * example: update k8s gpu manifest
# Original file as rendered by the viewer: 58 lines, 1.1 KiB, YAML
---
# Dedicated namespace named "ollama"; the name matches the `namespace`
# field used by the other ollama resources in this manifest.
apiVersion: v1
kind: Namespace
metadata:
  name: ollama
---
# Deployment running the ollama container with one NVIDIA GPU attached.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: ollama
  namespace: ollama
spec:
  # Recreate instead of the default rolling update.
  # NOTE(review): presumably so the old pod releases the GPU before the
  # replacement is scheduled -- confirm.
  strategy:
    type: Recreate
  # The selector must match the pod template labels below.
  selector:
    matchLabels:
      name: ollama
  template:
    metadata:
      labels:
        name: ollama
    spec:
      containers:
        - name: ollama
          image: ollama/ollama:latest
          env:
            # NVIDIA and CUDA binary directories come first on PATH.
            - name: PATH
              value: /usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin
            # Library search path pointing at the NVIDIA lib directories.
            - name: LD_LIBRARY_PATH
              value: /usr/local/nvidia/lib:/usr/local/nvidia/lib64
            # Driver capabilities requested from the NVIDIA container runtime.
            - name: NVIDIA_DRIVER_CAPABILITIES
              value: compute,utility
          ports:
            # Named port; a Service can reference it by name via `targetPort`.
            - name: http
              containerPort: 11434
              protocol: TCP
          resources:
            limits:
              # One GPU through the nvidia.com/gpu extended resource.
              nvidia.com/gpu: 1
      # Pod-level (sibling of `containers`): tolerate nodes tainted with
      # the nvidia.com/gpu key and the NoSchedule effect.
      tolerations:
        - key: nvidia.com/gpu
          operator: Exists
          effect: NoSchedule
---
# ClusterIP Service for pods labelled `name: ollama`.
apiVersion: v1
kind: Service
metadata:
  name: ollama
  namespace: ollama
spec:
  type: ClusterIP
  # Selects pods carrying the label `name: ollama`.
  selector:
    name: ollama
  ports:
    # Service port 80 forwards to the container port named "http".
    - port: 80
      name: http
      targetPort: http
      protocol: TCP