Gluttony-Cluster/ollama/ollama-deployment.yaml

39 lines
802 B
YAML
Raw Normal View History

2024-05-26 16:14:21 +00:00
---
# Deployment that runs a single Ollama pod in the "ollama-ns" namespace.
# The container gets three NVIDIA GPUs and stores its models on the
# "ollama-pvc" PersistentVolumeClaim mounted at /models.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: ollama
  namespace: ollama-ns
spec:
  replicas: 1
  selector:
    matchLabels:
      app: ollama
  template:
    metadata:
      labels:
        # Must stay identical to spec.selector.matchLabels above, otherwise
        # the Deployment will not select its own pods.
        app: ollama
    spec:
      # Refers to a RuntimeClass object named "nvidia"; it is not defined in
      # this manifest and has to exist in the cluster already.
      runtimeClassName: nvidia
      containers:
        - name: ollama
          # NOTE(review): no tag is given, so the registry default tag is
          # pulled — consider pinning a specific version.
          image: ollama/ollama
          env:
            # Env values must be strings, hence the quoting throughout.
            # Presumably makes the server listen on all interfaces so that
            # it is reachable from outside the pod — confirm in Ollama docs.
            - name: OLLAMA_HOST
              value: "0.0.0.0"
            # Same path as the volumeMounts entry below, so the models
            # directory lives on the persistent volume.
            - name: OLLAMA_MODELS
              value: "/models"
            # NOTE(review): a negative keep-alive appears to mean "never
            # unload a loaded model" — confirm against the Ollama FAQ.
            - name: OLLAMA_KEEP_ALIVE
              value: "-1"
          ports:
            - containerPort: 11434
          resources:
            limits:
              # Extended resource: the pod is only scheduled onto a node
              # that can hand out three NVIDIA GPUs.
              nvidia.com/gpu: 3
          volumeMounts:
            - name: ollama-volume
              mountPath: "/models"
      volumes:
        # Backs the /models mount; the claim "ollama-pvc" is expected to
        # exist in the same namespace (not defined in this manifest).
        - name: ollama-volume
          persistentVolumeClaim:
            claimName: ollama-pvc