# Image that serves the model stored at /app/model/Qwen3-Embedding-4B through
# the vLLM OpenAI API server module, listening on port 8000.

# Base image supplies vLLM (0.8.2 / PyTorch 2.6 / CUDA 12.4 according to its tag).
FROM egs-registry.cn-hangzhou.cr.aliyuncs.com/egs/vllm:0.8.2-pytorch2.6-cu124-20250328

WORKDIR /app

# Python/pip runtime behaviour:
#   PYTHONDONTWRITEBYTECODE       - do not write .pyc files
#   PYTHONUNBUFFERED              - unbuffered stdout/stderr so logs appear immediately
#   PIP_DISABLE_PIP_VERSION_CHECK - silence pip's "new version available" check
# TZ selects the container's local time zone and is reused by the RUN step below.
ENV PYTHONDONTWRITEBYTECODE=1 \
    PYTHONUNBUFFERED=1 \
    PIP_DISABLE_PIP_VERSION_CHECK=on \
    TZ=Asia/Shanghai

# Point /etc/localtime and /etc/timezone at the zone named by TZ.
# (No trailing backslash here: a continuation would swallow the next
# instruction into this shell command.)
RUN ln -snf "/usr/share/zoneinfo/${TZ}" /etc/localtime \
    && echo "${TZ}" > /etc/timezone

# NOTE(review): requirements.txt is copied but no step in this file installs
# it - confirm whether a `pip install -r requirements.txt` step is missing.
COPY requirements.txt .

# NOTE(review): pillow is upgraded to whatever version is newest at build
# time; pin a version if reproducible builds are required.
RUN pip install --no-cache-dir --upgrade pillow

# Copy the whole build context into /app; the model directory is expected to
# arrive with it at ./model/Qwen3-Embedding-4B.
COPY . .

EXPOSE 8000

# Fail the build early if the model directory did not make it into the image.
RUN ls /app/model/Qwen3-Embedding-4B

# Exec-form CMD: the JSON array must be one logical line, so every physical
# line break is escaped with a backslash.
CMD ["python3", "-m", "vllm.entrypoints.openai.api_server", \
     "--model", "/app/model/Qwen3-Embedding-4B", \
     "--dtype", "float16", \
     "--host", "0.0.0.0", \
     "--port", "8000", \
     "--trust-remote-code"]