refactor: 转移vlm到远程服务器上

2026-03-04 14:41:56 +08:00
parent cb94029ec5
commit a78e984695
2 changed files with 147 additions and 4 deletions
--- a/start_vllm.sh
+++ b/start_vllm.sh
@@ -5,6 +5,7 @@
 python -m vllm.entrypoints.openai.api_server \
    --model Qwen/Qwen3-VL-8B-Instruct \
    --trust-remote-code \
+    --host 0.0.0.0 \
    --port 8000 \
    --gpu-memory-utilization 0.85 \
    --max-model-len 32000 \