Upgrade version and use gpt2
All checks were successful
continuous-integration/drone/push Build is passing
All checks were successful
continuous-integration/drone/push Build is passing
This commit is contained in:
parent
5ca94dda0b
commit
a263684284
@@ -16,7 +16,7 @@ spec:
|
||||
runtimeClassName: nvidia
|
||||
containers:
|
||||
- name: vllm-inference-server
|
||||
-image: vllm/vllm-openai:v0.3.3
|
||||
+image: vllm/vllm-openai:latest
|
||||
imagePullPolicy: IfNotPresent
|
||||
|
||||
resources:
|
||||
@@ -33,7 +33,7 @@ spec:
|
||||
#args:
|
||||
#- while true; do sleep 2600; done
|
||||
command: ["python3", "-m", "vllm.entrypoints.openai.api_server"]
|
||||
-args: ["--model=mistralai/Mistral-7B-v0.1",
|
||||
+args: ["--model=openai-community/gpt2",
|
||||
"--gpu-memory-utilization=0.95",
|
||||
"--disable-log-requests",
|
||||
"--trust-remote-code",
|
||||
|
Loading…
Reference in New Issue
Block a user