From fcbe2da11ecbc836ef435a21a519e73c3e057b40 Mon Sep 17 00:00:00 2001 From: liushuang Date: Wed, 15 Oct 2025 10:30:12 +0800 Subject: [PATCH] add --- 20251014.md | 7 +++---- 1 file changed, 3 insertions(+), 4 deletions(-) diff --git a/20251014.md b/20251014.md index 4898a08..81b55c6 100644 --- a/20251014.md +++ b/20251014.md @@ -51,11 +51,10 @@ vllm serve \ modelscope download --model Qwen/Qwen3-0.6B --local_dir /home/ss/vllm-py12/qwen3-06b # 运行 Qwen3-8b -vllm serve \ +vllm serve /home/ss/vllm-py12/qwen3-06b \ --host 0.0.0.0 \ - --port 18778 \ - --model /home/ss/vllm-py12/qwen3-06b \ - --served-model-name qwen3-06b \ + --port 8000 \ + --served-model-name Qwen3-0.6B \ --tensor-parallel-size 1 \ --dtype auto \ --gpu-memory-utilization 0.9 \