This commit is contained in:
parent
765124c106
commit
ffeadbebff
@ -21,7 +21,7 @@ spec:
|
|||||||
|
|
||||||
resources:
|
resources:
|
||||||
limits:
|
limits:
|
||||||
nvidia.com/gpu: 1
|
nvidia.com/gpu: 2
|
||||||
env:
|
env:
|
||||||
- name: HUGGING_FACE_HUB_TOKEN
|
- name: HUGGING_FACE_HUB_TOKEN
|
||||||
value: ""
|
value: ""
|
||||||
@ -38,6 +38,7 @@ spec:
|
|||||||
"--disable-log-requests",
|
"--disable-log-requests",
|
||||||
"--trust-remote-code",
|
"--trust-remote-code",
|
||||||
"--port=8000",
|
"--port=8000",
|
||||||
|
"--dtype=half",
|
||||||
"--tensor-parallel-size=1"]
|
"--tensor-parallel-size=1"]
|
||||||
ports:
|
ports:
|
||||||
- containerPort: 8000
|
- containerPort: 8000
|
||||||
|
Loading…
Reference in New Issue
Block a user