Update node to watch forever
All checks were successful
continuous-integration/drone/push Build is passing
All checks were successful
continuous-integration/drone/push Build is passing
This commit is contained in:
parent
e78ac932d0
commit
17e076e0c8
@@ -28,13 +28,14 @@ spec:
 value: /.cache
 - name: shm-size
 value: 1g
-command: ["python3", "-m", "vllm.entrypoints.openai.api_server"]
-args: ["--model=meta-llama/Llama-2-7b-hf",
-"--gpu-memory-utilization=0.95",
-"--disable-log-requests",
-"--trust-remote-code",
-"--port=8000",
-"--tensor-parallel-size=1"]
+command: ["watch", "ls"]
+#command: ["python3", "-m", "vllm.entrypoints.openai.api_server"]
+#args: ["--model=meta-llama/Llama-2-7b-hf",
+# "--gpu-memory-utilization=0.95",
+# "--disable-log-requests",
+# "--trust-remote-code",
+# "--port=8000",
+# "--tensor-parallel-size=1"]
 ports:
 - containerPort: 8000
 name: http
Loading…
Reference in New Issue
Block a user