# vector_app.py (704 B)

  1. from quart import Quart
  2. from quart_cors import cors
  3. # from pymilvus import connections
  4. from vllm import LLM, SamplingParams
  5. from applications.config import LOCAL_MODEL_CONFIG, DEFAULT_MODEL
  6. from routes import server_routes
  7. app = Quart(__name__)
  8. MODEL_PATH = LOCAL_MODEL_CONFIG[DEFAULT_MODEL]
  9. llm = LLM(
  10. model=MODEL_PATH,
  11. dtype="float16", # 节省显存
  12. trust_remote_code=True
  13. )
  14. print(f"{MODEL_PATH} 模型加载完成!")
  15. # 连接向量数据库
  16. # connections.connect("default", host="milvus", port="19530")
  17. # connections.connect("default", host="milvus", port="19530")
  18. connections = None
  19. # 注册路由
  20. app_route = server_routes(llm, connections)
  21. app.register_blueprint(app_route)