---
# Deployment that runs a single Ollama server pod with NVIDIA GPU access and
# a PersistentVolumeClaim-backed model directory mounted at /models.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: ollama
  namespace: ollama-ns
spec:
  replicas: 1
  selector:
    matchLabels:
      app: ollama
  template:
    metadata:
      labels:
        # Must match spec.selector.matchLabels above; a Deployment whose
        # template labels do not match its selector is rejected.
        app: ollama
    spec:
      # Runs the pod under the RuntimeClass named "nvidia".
      # NOTE(review): assumes that RuntimeClass exists in the cluster.
      runtimeClassName: nvidia
      containers:
        - name: ollama
          # NOTE(review): no tag is given, so this resolves to ":latest";
          # consider pinning a specific version for reproducible rollouts.
          image: ollama/ollama
          env:
            # Address the Ollama server listens on (quoted so it is always
            # read as a string).
            - name: OLLAMA_HOST
              value: "0.0.0.0"
            # Model directory; same path as the volume mount below.
            - name: OLLAMA_MODELS
              value: "/models"
            # - name: OLLAMA_KEEP_ALIVE
            #   value: "-1"
          ports:
            - containerPort: 11434
          resources:
            limits:
              # Extended resource: the pod is only scheduled onto a node
              # that can provide three nvidia.com/gpu devices.
              nvidia.com/gpu: 3
          volumeMounts:
            # Refers to the entry of the same name under spec.volumes.
            - name: ollama-volume
              mountPath: "/models"
      volumes:
        # The name must match the volumeMounts entry above.
        # NOTE(review): assumes PVC "ollama-pvc" exists in namespace
        # "ollama-ns" - confirm.
        - name: ollama-volume
          persistentVolumeClaim:
            claimName: ollama-pvc