Add openllm
All checks were successful
continuous-integration/drone/push Build is passing

This commit is contained in:
Tyler Perkins 2024-03-30 16:29:24 -04:00
parent f9bdf58f7f
commit 754584d291
Signed by: tyler
GPG Key ID: 03B27509E17EFDC8
2 changed files with 47 additions and 0 deletions

View File

@@ -0,0 +1,35 @@
# Deployment that runs a single OpenLLM server pod serving the model named
# by MODEL_NAME with the vLLM backend, listening on container port 3000.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: openllm-deployment
  namespace: openllm-ns
spec:
  replicas: 1
  selector:
    matchLabels:
      app: openllm
  template:
    metadata:
      labels:
        app: openllm
    spec:
      containers:
        - name: openllm-container
          # NOTE(review): the image is untagged, so it resolves to `latest`;
          # pin a tag or digest once a known-good version is chosen.
          image: ghcr.io/bentoml/openllm
          # `start` is a subcommand, not an executable, so it is passed via
          # `args`; setting it as `command` would replace the image
          # ENTRYPOINT with a binary called "start".
          # NOTE(review): assumes the image ENTRYPOINT is the `openllm` CLI
          # (as in `docker run ghcr.io/bentoml/openllm start ...`) - confirm.
          # Kubernetes expands only the $(VAR) form in command/args; the
          # shell-style ${VAR} form is passed through as a literal string.
          args: ["start", "$(MODEL_NAME)", "--backend", "vllm"]
          env:
            # Set this to desired deployment model
            - name: MODEL_NAME
              value: "meta-llama/Llama-2-13b-hf"
            # Was misspelled TRUST_REMOVE_CODE, which nothing reads.
            - name: TRUST_REMOTE_CODE
              value: "True"
            - name: OPENLLM_DO_NOT_TRACK
              value: "True"
          ports:
            - containerPort: 3000
          resources:
            limits:
              # Extended resources such as GPUs are requested via limits.
              nvidia.com/gpu: 2
      nodeSelector:
        kubernetes.io/os: linux

View File

@@ -0,0 +1,12 @@
# Service exposing the pods labelled `app: openllm` on port 3000 through a
# LoadBalancer.
apiVersion: v1
kind: Service
metadata:
  name: openllm-service
  namespace: openllm-ns
spec:
  type: LoadBalancer
  # Selects the pods labelled `app: openllm`.
  selector:
    app: openllm
  ports:
    # Service port 3000 forwards to port 3000 on the selected pods.
    - protocol: TCP  # the Kubernetes default, spelled out
      port: 3000
      targetPort: 3000