RTX4090笔电操作记录
This commit is contained in:
parent
fbc162cbec
commit
8afcf49879
@@ -53,6 +53,7 @@ vllm serve \
|
||||
--host 0.0.0.0 \
|
||||
--port 18778 \
|
||||
--model /home/ss/vllm-py12/qwen3-06b \
|
||||
--served-model-name qwen3-06b \
|
||||
--tensor-parallel-size 1 \
|
||||
--dtype auto \
|
||||
--gpu-memory-utilization 0.9 \
|
||||
|
||||
Loading…
Reference in New Issue
Block a user