File size: 329 Bytes
1f1e024
 
 
 
 
 
71a2ed3
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
# Serves Qwen/Qwen3-0.6B through vLLM's OpenAI-compatible HTTP server,
# listening on 0.0.0.0:7860.

# Pinned to a release tag instead of :latest so rebuilds are reproducible and
# the CLI flags below keep matching the installed vLLM.
# NOTE(review): v0.8.5 was picked because it supports Qwen3 and still accepts
# the --enable-reasoning / --reasoning-parser pair; re-validate every flag in
# CMD when bumping this tag.
FROM vllm/vllm-openai:v0.8.5

WORKDIR /app

# Documentation only; must stay in sync with --port in CMD.
EXPOSE 7860

# The base image declares its own exec-form ENTRYPOINT. A shell-form CMD would
# be appended to that entrypoint as literal arguments ("/bin/sh -c ...") rather
# than executed, so the entrypoint is set explicitly here and CMD carries only
# the default arguments. Exec form also makes vllm PID 1, so it receives
# SIGTERM from `docker stop` directly.
ENTRYPOINT ["vllm", "serve"]

# `vllm serve` takes the model as a positional argument (not --model).
# --engine-use-ray was dropped: the option no longer exists in vLLM's engine
# arguments and makes argument parsing fail at startup.
CMD ["Qwen/Qwen3-0.6B", \
     "--host", "0.0.0.0", \
     "--port", "7860", \
     "--max-model-len", "8192", \
     "--dtype", "float32", \
     "--enable-reasoning", \
     "--reasoning-parser", "deepseek_r1", \
     "--trust-remote-code", \
     "--disable-log-requests"]