From 964a0277c179e512c0995bd11e0d373f0fb871c1 Mon Sep 17 00:00:00 2001
From: Tyler Perkins
Date: Sat, 30 Mar 2024 16:32:29 -0400
Subject: [PATCH] Update to request only one gpu

---
NOTE(review): this patch was recovered from a copy whose line breaks and
leading whitespace had been collapsed. The YAML indentation of the hunk
lines below is reconstructed, not original -- confirm it against
openllm/openllm-deployment.yaml at blob 11b73a7 before applying.

 openllm/openllm-deployment.yaml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/openllm/openllm-deployment.yaml b/openllm/openllm-deployment.yaml
index 11b73a7..628dd9b 100644
--- a/openllm/openllm-deployment.yaml
+++ b/openllm/openllm-deployment.yaml
@@ -30,6 +30,6 @@ spec:
         - containerPort: 3000
         resources:
           limits:
-            nvidia.com/gpu: 2
+            nvidia.com/gpu: 1
       nodeSelector:
         kubernetes.io/os: linux