refactor: 转移vlm到远程服务器上

This commit is contained in:
JiajunLI
2026-03-04 14:41:56 +08:00
parent cb94029ec5
commit a78e984695
2 changed files with 147 additions and 4 deletions

View File

@@ -5,6 +5,7 @@
python -m vllm.entrypoints.openai.api_server \
--model Qwen/Qwen3-VL-8B-Instruct \
--trust-remote-code \
--host 0.0.0.0 \
--port 8000 \
--gpu-memory-utilization 0.85 \
--max-model-len 32000 \