Update dtype param
All checks were successful
continuous-integration/drone/push Build is passing

This commit is contained in:
Tyler Perkins 2024-03-30 22:45:48 -04:00
parent 765124c106
commit ffeadbebff
Signed by: tyler
GPG Key ID: 03B27509E17EFDC8

View File

@@ -21,7 +21,7 @@ spec:
resources:
limits:
-nvidia.com/gpu: 1
+nvidia.com/gpu: 2
env:
- name: HUGGING_FACE_HUB_TOKEN
value: ""
@@ -38,6 +38,7 @@ spec:
"--disable-log-requests",
"--trust-remote-code",
"--port=8000",
+"--dtype=half",
"--tensor-parallel-size=1"]
ports:
- containerPort: 8000