ai_search.py 3.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140
  1. #!/usr/bin/env python3
  2. """
  3. AI搜索工具
  4. 调用AI搜索回答用户问题,返回多模态参考源、总结答案和追问问题
  5. """
  6. import requests
  7. import json
  8. import os
  9. import argparse
  10. from datetime import datetime
  11. from typing import Dict, Any
  12. import sys
  13. from pathlib import Path
  14. # 添加项目根目录到路径并导入配置
  15. sys.path.insert(0, str(Path(__file__).parent.parent.parent))
  16. from lib.config import get_data_dir
  17. class AISearch:
  18. """AI搜索API封装类"""
  19. BASE_URL = "http://47.84.182.56:8001"
  20. TOOL_NAME = "ai_search"
  21. def __init__(self, results_dir: str = None):
  22. """
  23. 初始化API客户端
  24. Args:
  25. results_dir: 结果输出目录,默认为项目根目录下的 data/search 文件夹
  26. """
  27. self.api_url = f"{self.BASE_URL}/tools/call/{self.TOOL_NAME}"
  28. # 设置结果输出目录
  29. if results_dir:
  30. self.results_base_dir = results_dir
  31. else:
  32. # 默认从配置读取
  33. self.results_base_dir = get_data_dir("search")
  34. def search(self, query: str, timeout: int = 60) -> Dict[str, Any]:
  35. """
  36. 执行AI搜索
  37. Args:
  38. query: 搜索查询内容
  39. timeout: 请求超时时间(秒),默认60秒(AI搜索可能需要更长时间)
  40. Returns:
  41. API响应的JSON数据
  42. 返回数据中:
  43. - type=source: 参考源(网页、图片等)
  44. - type=answer: 总结答案
  45. - type=follow_up: 追问问题
  46. Raises:
  47. requests.exceptions.RequestException: 请求失败时抛出异常
  48. """
  49. payload = {
  50. "query": query
  51. }
  52. try:
  53. response = requests.post(
  54. self.api_url,
  55. json=payload,
  56. timeout=timeout,
  57. headers={"Content-Type": "application/json"}
  58. )
  59. response.raise_for_status()
  60. return response.json()
  61. except requests.exceptions.RequestException as e:
  62. print(f"请求失败: {e}")
  63. raise
  64. def save_result(self, query: str, result: Dict[str, Any]) -> str:
  65. """
  66. 保存结果到文件
  67. 目录结构: results/ai_search/query关键词/时间戳.json
  68. Args:
  69. query: 搜索查询内容
  70. result: API返回的结果
  71. Returns:
  72. 保存的文件路径
  73. """
  74. # 从query中提取简短的关键词作为文件夹名(取前20个字符)
  75. query_short = query[:20].replace('/', '_').replace('\\', '_')
  76. # 创建目录结构: results/ai_search/query/
  77. result_dir = os.path.join(self.results_base_dir, "ai_search", query_short)
  78. os.makedirs(result_dir, exist_ok=True)
  79. # 文件名使用时间戳
  80. timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
  81. filename = f"{timestamp}.json"
  82. filepath = os.path.join(result_dir, filename)
  83. # 保存结果
  84. with open(filepath, 'w', encoding='utf-8') as f:
  85. json.dump(result, f, ensure_ascii=False, indent=2)
  86. return filepath
  87. def main():
  88. """示例使用"""
  89. # 解析命令行参数
  90. parser = argparse.ArgumentParser(description='AI搜索工具')
  91. parser.add_argument(
  92. '--results-dir',
  93. type=str,
  94. default=None,
  95. help='结果输出目录 (默认: 从配置读取,通常为 data/search)'
  96. )
  97. parser.add_argument(
  98. '--query',
  99. type=str,
  100. required=True,
  101. help='搜索查询内容 (必填)'
  102. )
  103. args = parser.parse_args()
  104. # 创建API客户端实例
  105. client = AISearch(results_dir=args.results_dir)
  106. # 执行搜索并保存
  107. try:
  108. result = client.search(args.query)
  109. filepath = client.save_result(args.query, result)
  110. print(f"Output: {filepath}")
  111. except Exception as e:
  112. print(f"Error: {e}", file=__import__('sys').stderr)
  113. if __name__ == "__main__":
  114. main()