diff --git a/20251014.md b/20251014.md index bce3ea3..18534db 100644 --- a/20251014.md +++ b/20251014.md @@ -53,6 +53,7 @@ vllm serve \ --host 0.0.0.0 \ --port 18778 \ --model /home/ss/vllm-py12/qwen3-06b \ + --served-model-name qwen3-06b \ --tensor-parallel-size 1 \ --dtype auto \ --gpu-memory-utilization 0.9 \