# Ollama on Kubernetes with an NVIDIA GPU: Namespace, Deployment, and Service.
---
# Namespace that scopes the Ollama workload; the Deployment and Service in
# this file both set `namespace: ollama`.
apiVersion: v1
kind: Namespace
metadata:
  name: ollama
---
# Deployment that runs the Ollama server container and requests one NVIDIA GPU.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: ollama
  namespace: ollama
spec:
  # Recreate terminates the existing pod before creating its replacement.
  # NOTE(review): presumably chosen so the new pod can claim the GPU held by
  # the old one — confirm.
  strategy:
    type: Recreate
  # The selector must match the pod template labels below.
  selector:
    matchLabels:
      name: ollama
  template:
    metadata:
      labels:
        name: ollama
    spec:
      containers:
        - name: ollama
          # NOTE(review): `latest` is a floating tag; consider pinning a
          # specific version for reproducible rollouts.
          image: ollama/ollama:latest
          env:
            # Put the NVIDIA directories first on the executable and library
            # search paths.
            # NOTE(review): assumes the driver files are mounted under
            # /usr/local/nvidia on the node — confirm.
            - name: PATH
              value: /usr/local/nvidia/bin:/usr/local/nvidia/lib64:/usr/bin:/usr/sbin:/bin:/sbin
            - name: LD_LIBRARY_PATH
              value: /usr/local/nvidia/lib64
          ports:
            # Named port; the Service in this file targets it by name (`http`).
            - name: http
              containerPort: 11434
              protocol: TCP
          resources:
            limits:
              # Extended resource: one whole GPU for this container.
              nvidia.com/gpu: 1
      # Allow scheduling onto nodes tainted with key `nvidia.com/gpu` and
      # effect NoSchedule, whatever the taint value (operator: Exists).
      tolerations:
        - key: nvidia.com/gpu
          operator: Exists
          effect: NoSchedule
---
# ClusterIP Service that exposes the pods labelled `name: ollama` on port 80.
apiVersion: v1
kind: Service
metadata:
  name: ollama
  namespace: ollama
spec:
  type: ClusterIP
  # Routes to pods carrying this label (set in the Deployment's pod template).
  selector:
    name: ollama
  ports:
    # Service port 80 forwards to the container port named `http`, so the
    # numeric container port can change without editing this Service.
    - port: 80
      name: http
      targetPort: http
      protocol: TCP