docker-compose.yml 2.1 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576
  1. #services:
  2. # # vLLM - Qwen3 0.6B
  3. # vllm-0.6b:
  4. # image: swr.cn-north-4.myhuaweicloud.com/ddn-k8s/docker.io/vllm/vllm-openai:v0.9.1
  5. # container_name: vllm-qwen3-0.6b
  6. # ports:
  7. # - "8100:8000"
  8. # command: >
  9. # --model Qwen/Qwen3-Embedding-0.6B
  10. # --dtype float16
  11. # --port 8000
  12. # volumes:
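  13. # # Mount the pre-downloaded model directory (only used if --model points at this container path instead of the hub ID)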
  14. # - ./models/Qwen3-Embedding-0.6B:/app/models/Qwen3-Embedding-0.6B
  15. # # 可选:挂载缓存目录
  16. # - ./cache:/root/.cache/huggingface
  17. # environment:
  18. # # 设置 Hugging Face 国内镜像
  19. # - HF_ENDPOINT=https://hf-mirror.com
  20. # # 可选:设置 Python 包索引镜像
  21. # - PIP_INDEX_URL=https://pypi.tuna.tsinghua.edu.cn/simple
  22. # deploy:
  23. # resources:
  24. # reservations:
  25. # devices:
  26. # - driver: nvidia
  27. # count: all
  28. # capabilities: [ gpu ]
  29. # # 添加健康检查
  30. # healthcheck:
  31. # test: [ "CMD", "curl", "-f", "http://localhost:8000/health" ]
  32. # interval: 30s
  33. # timeout: 10s
  34. # retries: 3
  35. # start_period: 40s
  36. ## # vLLM - Qwen3 4B
  37. ## vllm-4b:
  38. ## image: vllm/vllm-openai:latest
  39. ## container_name: vllm-qwen3-4b
  40. ## ports:
  41. ## - "8200:8000"
  42. ## command: >
  43. ## --model Qwen/Qwen3-Embedding-4B
  44. ## --dtype float16
  45. ## --port 8000
  46. ## volumes:
  47. ## - ./models:/root/.cache/huggingface
  48. ##
  49. ## # vLLM - Qwen3 8B
  50. ## vllm-8b:
  51. ## image: vllm/vllm-openai:latest
  52. ## container_name: vllm-qwen3-8b
  53. ## ports:
  54. ## - "8300:8000"
  55. ## command: >
  56. ## --model Qwen/Qwen3-Embedding-8B
  57. ## --dtype float16
  58. ## --port 8000
  59. ## volumes:
  60. ## - ./models:/root/.cache/huggingface
  61. #
  62. # # Milvus 向量数据库
  63. ## milvus:
  64. ## image: swr.cn-north-4.myhuaweicloud.com/ddn-k8s/docker.io/milvusdb/milvus:v2.4.5
  65. ### image: milvusdb/milvus:v2.4.4-standalone
  66. ## container_name: milvus
  67. ## ports:
  68. ## - "19530:19530"
  69. ## - "9091:9091"
  70. ## environment:
  71. ## - ETCD_USE_EMBED=true
  72. ## - MINIO_USE_EMBED=true
  73. ## - PULSAR_USE_EMBED=true
  74. ## volumes:
  75. ## - ./milvus_data:/var/lib/milvus
  76. ## command: ["milvus", "run", "standalone"]