# docker-compose.yml
#
# Defines two services: a GPU-backed vLLM container and the backend
# application built from this directory.
---
services:
  # vLLM service
  vllm-qwen:
    # NOTE(review): no registry or tag is given, so this presumably refers to
    # a locally built image resolved as `vllm-qwen:latest` - confirm.
    image: vllm-qwen
    container_name: vllm-qwen
    ports:
      # HOST:CONTAINER - quoted so the mapping is always read as a string.
      - "8000:8000"
    deploy:
      resources:
        reservations:
          devices:
            # Reserve every NVIDIA GPU on the host for this container.
            - driver: nvidia
              count: all
              capabilities: [gpu]
    restart: always

  # Backend service
  vector-app:
    # Build the image using this directory as the build context.
    build: .
    container_name: vector-app
    ports:
      - "8001:8001"
    restart: always