---
# Deployment that runs a single Ollama pod in the `ollama-ns` namespace.
# The pod uses the `nvidia` RuntimeClass, requests three `nvidia.com/gpu`
# devices, and stores models on the `ollama-pvc` PersistentVolumeClaim.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: ollama
  namespace: ollama-ns
spec:
  replicas: 1
  selector:
    matchLabels:
      app: ollama
  template:
    metadata:
      labels:
        # Must match spec.selector.matchLabels above.
        app: ollama
    spec:
      # Refers to a RuntimeClass object named `nvidia`.
      runtimeClassName: nvidia
      containers:
        - name: ollama
          # NOTE(review): no tag is given, so this resolves to `:latest`;
          # consider pinning a specific version for reproducible rollouts.
          image: ollama/ollama
          env:
            # Quoted so the address is always read as a string.
            - name: OLLAMA_HOST
              value: "0.0.0.0"
            # Same path as the `ollama-volume` mountPath below.
            - name: OLLAMA_MODELS
              value: "/models"
            # Disabled; uncomment both lines together to enable.
            # - name: OLLAMA_KEEP_ALIVE
            #   value: "-1"
          ports:
            - containerPort: 11434
          resources:
            limits:
              nvidia.com/gpu: 3
          volumeMounts:
            - name: ollama-volume
              mountPath: "/models"
      volumes:
        - name: ollama-volume
          persistentVolumeClaim:
            claimName: ollama-pvc