# Image that serves the model stored under /models/Qwen3-Embedding-4B through
# vLLM's OpenAI-compatible API server.

# Base image is pinned to a specific dated tag (vLLM 0.8.2, per the tag name)
# so rebuilds do not silently pick up a different runtime.
FROM egs-registry.cn-hangzhou.cr.aliyuncs.com/egs/vllm:0.8.2-pytorch2.6-cu124-20250328

# Bake the model directory into the image. The path is relative to the build
# context, so models/Qwen3-Embedding-4B must exist there at build time.
COPY models/Qwen3-Embedding-4B /models/Qwen3-Embedding-4B

# Documentation only (does not publish the port): must match --port in CMD.
EXPOSE 8000

# Probe the API server's /health endpoint using python3, which the CMD below
# already requires, so no extra tool has to be installed. The long start
# period keeps probe failures during model loading from counting as unhealthy.
HEALTHCHECK --interval=30s --timeout=5s --start-period=600s --retries=3 \
    CMD ["python3", "-c", "import urllib.request; urllib.request.urlopen('http://127.0.0.1:8000/health', timeout=3)"]

# NOTE(review): no USER is set in this file, so the container runs as the base
# image's default user — confirm whether that is root and consider a non-root user.

# Exec (JSON-array) form: the server runs without a wrapping shell and receives
# signals directly. Binding to 0.0.0.0 makes it reachable from outside the
# container on port 8000.
CMD ["python3", "-m", "vllm.entrypoints.openai.api_server", \
     "--model", "/models/Qwen3-Embedding-4B", \
     "--dtype", "float16", \
     "--port", "8000", \
     "--host", "0.0.0.0"]