diff --git a/openllm/openllm-deployment.yaml b/openllm/openllm-deployment.yaml
index 11b73a7..628dd9b 100644
--- a/openllm/openllm-deployment.yaml
+++ b/openllm/openllm-deployment.yaml
@@ -30,6 +30,6 @@ spec:
             - containerPort: 3000
           resources:
             limits:
-              nvidia.com/gpu: 2
+              nvidia.com/gpu: 1
       nodeSelector:
         kubernetes.io/os: linux