# Dockerfile
#
# Builds an image that serves the model stored under /models/Qwen3-Embedding-4B
# through vLLM's OpenAI-compatible API server on port 8000.

# Base image: per its tag, vLLM 0.8.2 on PyTorch 2.6 / CUDA 12.4.
# NOTE(review): verify that this vLLM version (or whatever version
# requirements.txt ends up installing) can load Qwen3-Embedding - TODO confirm.
FROM egs-registry.cn-hangzhou.cr.aliyuncs.com/egs/vllm:0.8.2-pytorch2.6-cu124-20250328

# Copy the model directory from the build context into the image; the server
# below is pointed at this local path via --model.
# Kept ahead of the dependency install so that editing requirements.txt does
# not invalidate this layer (presumably the largest one - confirm).
COPY models/Qwen3-Embedding-4B /models/Qwen3-Embedding-4B

# Extra Python dependencies on top of what the base image already ships.
# The destination is relative, so it resolves against the base image's WORKDIR.
COPY requirements.txt requirements.txt

# --no-cache-dir keeps pip's download cache out of the image layer.
RUN pip install --no-cache-dir -r requirements.txt

# Documents the port passed to --port below; EXPOSE does not publish it.
EXPOSE 8000

# NOTE(review): no USER is set in this file, so the container runs as whatever
# user the base image defines - confirm that this is intended.

# Exec (JSON-array) form: the server is started directly, without a shell.
# --host 0.0.0.0 binds all interfaces so the port is reachable from outside
# the container.
CMD ["python3", "-m", "vllm.entrypoints.openai.api_server", \
     "--model", "/models/Qwen3-Embedding-4B", \
     "--dtype", "float16", \
     "--port", "8000", \
     "--host", "0.0.0.0"]