1
0

RTX4090笔电操作记录

This commit is contained in:
liushuang 2025-10-15 10:24:57 +08:00
parent fbc162cbec
commit 8afcf49879

View File

@@ -53,6 +53,7 @@ vllm serve \
--host 0.0.0.0 \
--port 18778 \
--model /home/ss/vllm-py12/qwen3-06b \
--served-model-name qwen3-06b \
--tensor-parallel-size 1 \
--dtype auto \
--gpu-memory-utilization 0.9 \