Upgrade version and use gpt2
All checks were successful
continuous-integration/drone/push Build is passing
All checks were successful
continuous-integration/drone/push Build is passing
This commit is contained in:
parent
5ca94dda0b
commit
a263684284
@ -16,7 +16,7 @@ spec:
|
|||||||
runtimeClassName: nvidia
|
runtimeClassName: nvidia
|
||||||
containers:
|
containers:
|
||||||
- name: vllm-inference-server
|
- name: vllm-inference-server
|
||||||
image: vllm/vllm-openai:v0.3.3
|
image: vllm/vllm-openai:latest
|
||||||
imagePullPolicy: IfNotPresent
|
imagePullPolicy: IfNotPresent
|
||||||
|
|
||||||
resources:
|
resources:
|
||||||
@ -33,7 +33,7 @@ spec:
|
|||||||
#args:
|
#args:
|
||||||
#- while true; do sleep 2600; done
|
#- while true; do sleep 2600; done
|
||||||
command: ["python3", "-m", "vllm.entrypoints.openai.api_server"]
|
command: ["python3", "-m", "vllm.entrypoints.openai.api_server"]
|
||||||
args: ["--model=mistralai/Mistral-7B-v0.1",
|
args: ["--model=openai-community/gpt2",
|
||||||
"--gpu-memory-utilization=0.95",
|
"--gpu-memory-utilization=0.95",
|
||||||
"--disable-log-requests",
|
"--disable-log-requests",
|
||||||
"--trust-remote-code",
|
"--trust-remote-code",
|
||||||
|
Loading…
Reference in New Issue
Block a user