diff --git a/20251014.md b/20251014.md index 4898a08..81b55c6 100644 --- a/20251014.md +++ b/20251014.md @@ -51,11 +51,10 @@ vllm serve \ modelscope download --model Qwen/Qwen3-0.6B --local_dir /home/ss/vllm-py12/qwen3-06b # 运行 Qwen3-8b -vllm serve \ +vllm serve /home/ss/vllm-py12/qwen3-06b \ --host 0.0.0.0 \ - --port 18778 \ - --model /home/ss/vllm-py12/qwen3-06b \ - --served-model-name qwen3-06b \ + --port 8000 \ + --served-model-name Qwen3-0.6B \ --tensor-parallel-size 1 \ --dtype auto \ --gpu-memory-utilization 0.9 \