File size: 329 Bytes
1f1e024 71a2ed3 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 |
# OpenAI-compatible vLLM server for Qwen/Qwen3-0.6B, listening on port 7860.

# Pin the base image instead of tracking :latest so rebuilds are reproducible
# and the CLI flags below keep matching the vLLM release they were written for.
# Override with: docker build --build-arg VLLM_VERSION=<tag> .
# NOTE(review): v0.8.5 is assumed to be a published tag with Qwen3 support --
# confirm against the registry before deploying.
ARG VLLM_VERSION=v0.8.5
FROM vllm/vllm-openai:${VLLM_VERSION}

WORKDIR /app

# Documentation only; the port must still be published at `docker run` time.
EXPOSE 7860

# The base image declares its own exec-form ENTRYPOINT, so a shell-form CMD
# would be appended to it as `/bin/sh -c "..."` arguments instead of being
# executed. Set the entrypoint explicitly and use exec form throughout so the
# server runs as PID 1 and receives SIGTERM from `docker stop`.
ENTRYPOINT ["vllm", "serve"]

# Default arguments; replace them wholesale with `docker run <image> <args...>`.
# - The model is passed positionally, which is the form `vllm serve` expects.
# - `--engine-use-ray` was dropped: it is not accepted by vLLM releases recent
#   enough to load Qwen3, so passing it aborts argument parsing at startup.
# - `--enable-reasoning` is required alongside `--reasoning-parser` on the
#   pinned release line; re-check both flags when bumping VLLM_VERSION.
# - NOTE(review): `--trust-remote-code` lets code from the model repository run
#   inside the container; keep it only if the model actually needs it.
CMD ["Qwen/Qwen3-0.6B", \
     "--host", "0.0.0.0", \
     "--port", "7860", \
     "--max-model-len", "8192", \
     "--dtype", "float32", \
     "--enable-reasoning", \
     "--reasoning-parser", "deepseek_r1", \
     "--trust-remote-code", \
     "--disable-log-requests"]
|