"""
ToolHub tool-test workflow — mini_restore.

A trimmed-down run script that only exercises ToolHub search and invocation.
Browser automation, knowledge management and other heavier features are not enabled.

Features:
1. Uses the InteractiveController provided by the framework.
2. Supports command-line interaction ('p' to pause, 'q' to quit).
3. Supports resuming an existing Trace with --trace <ID> to continue execution.
"""
import argparse
import os
import sys
import asyncio
from pathlib import Path

# Clash Verge TUN-mode compatibility: stop httpx/urllib from auto-detecting
# the system HTTP proxy. setdefault() leaves an already-exported value alone.
os.environ.setdefault("no_proxy", "*")
# Point ToolHub at the local service (tool_agent) unless the caller overrides it.
os.environ.setdefault("TOOLHUB_BASE_URL", "http://localhost:8001")
# Add the project root (three directories above this file) to the Python path.
# NOTE(review): presumably this and the two environment defaults above must run
# before the `agent` / `config` imports below — keep the order, confirm why.
sys.path.insert(0, str(Path(__file__).parent.parent.parent))

from dotenv import load_dotenv
load_dotenv()

from agent.llm.prompts import SimplePrompt
from agent.core.runner import AgentRunner, RunConfig
from agent.trace import (
    FileSystemTraceStore,
    Trace,
    Message,
)
from agent.llm import create_qwen_llm_call
from agent.cli import InteractiveController
from agent.utils import setup_logging
# Import the ToolHub tools (the import itself triggers @tool registration).
from agent.tools.builtin.toolhub import toolhub_health, toolhub_search, toolhub_call # noqa: F401
# Import the project configuration.
from config import RUN_CONFIG, SKILLS_DIR, TRACE_STORE_PATH, DEBUG, LOG_LEVEL, LOG_FILE, INPUT_DIR, OUTPUT_DIR
  37. async def main():
  38. # 解析命令行参数
  39. parser = argparse.ArgumentParser(description="ToolHub 工具测试 (mini_restore)")
  40. parser.add_argument(
  41. "--trace", type=str, default=None,
  42. help="已有的 Trace ID,用于恢复继续执行(不指定则新建)",
  43. )
  44. parser.add_argument(
  45. "--task", type=str, default=None,
  46. help="自定义任务描述(覆盖 prompt 中的默认任务)",
  47. )
  48. args = parser.parse_args()
  49. # 路径配置
  50. base_dir = Path(__file__).parent
  51. project_root = base_dir.parent.parent
  52. prompt_path = base_dir / "toolhub_test.prompt"
  53. output_dir = project_root / OUTPUT_DIR
  54. output_dir.mkdir(parents=True, exist_ok=True)
  55. # 1. 配置日志
  56. setup_logging(level=LOG_LEVEL, file=LOG_FILE)
  57. # 2. 加载项目级 presets
  58. print("2. 加载 presets...")
  59. presets_path = base_dir / "presets.json"
  60. if presets_path.exists():
  61. from agent.core.presets import load_presets_from_json
  62. load_presets_from_json(str(presets_path))
  63. print(f" - 已加载项目 presets")
  64. else:
  65. print(f" - 未找到 presets.json,跳过")
  66. # 3. 加载 prompt
  67. print("3. 加载 prompt...")
  68. prompt = SimplePrompt(prompt_path)
  69. # 4. 构建任务消息
  70. print("4. 构建任务消息...")
  71. print(f" - 输入目录: {INPUT_DIR}")
  72. print(f" - 输出目录: {OUTPUT_DIR}")
  73. if args.task:
  74. # 使用命令行自定义任务
  75. messages = prompt.build_messages(input_dir=INPUT_DIR, output_dir=OUTPUT_DIR)
  76. # 替换最后一条 user 消息为自定义任务
  77. for i in range(len(messages) - 1, -1, -1):
  78. if messages[i].get("role") == "user":
  79. messages[i]["content"] = args.task
  80. break
  81. print(f" - 自定义任务: {args.task[:80]}...")
  82. else:
  83. messages = prompt.build_messages(input_dir=INPUT_DIR, output_dir=OUTPUT_DIR)
  84. # 5. 创建 Agent Runner(无浏览器)
  85. print("5. 创建 Agent Runner...")
  86. print(f" - Skills 目录: {SKILLS_DIR}")
  87. # 从 prompt 的 frontmatter 中提取模型配置(优先于 config.py)
  88. prompt_model = prompt.config.get("model", None)
  89. if prompt_model:
  90. model_for_llm = prompt_model
  91. print(f" - 模型 (from prompt): {model_for_llm}")
  92. else:
  93. model_for_llm = RUN_CONFIG.model
  94. print(f" - 模型 (from config): {model_for_llm}")
  95. store = FileSystemTraceStore(base_path=TRACE_STORE_PATH)
  96. runner = AgentRunner(
  97. trace_store=store,
  98. llm_call=create_qwen_llm_call(model=model_for_llm),
  99. skills_dir=SKILLS_DIR,
  100. debug=DEBUG
  101. )
  102. # 6. 创建交互控制器
  103. interactive = InteractiveController(
  104. runner=runner,
  105. store=store,
  106. enable_stdin_check=True
  107. )
  108. runner.stdin_check = interactive.check_stdin
  109. # 7. 任务信息
  110. task_name = RUN_CONFIG.name or base_dir.name
  111. print("=" * 60)
  112. print(f"{task_name}")
  113. print("=" * 60)
  114. print("💡 交互提示:")
  115. print(" - 执行过程中输入 'p' 或 'pause' 暂停并进入交互模式")
  116. print(" - 执行过程中输入 'q' 或 'quit' 停止执行")
  117. print("=" * 60)
  118. print()
  119. # 8. 判断是新建还是恢复
  120. resume_trace_id = args.trace
  121. if resume_trace_id:
  122. existing_trace = await store.get_trace(resume_trace_id)
  123. if not existing_trace:
  124. print(f"\n错误: Trace 不存在: {resume_trace_id}")
  125. sys.exit(1)
  126. print(f"恢复已有 Trace: {resume_trace_id[:8]}...")
  127. print(f" - 状态: {existing_trace.status}")
  128. print(f" - 消息数: {existing_trace.total_messages}")
  129. else:
  130. print(f"启动新 Agent...")
  131. print()
  132. final_response = ""
  133. current_trace_id = resume_trace_id
  134. current_sequence = 0
  135. should_exit = False
  136. try:
  137. # 配置
  138. run_config = RUN_CONFIG
  139. if resume_trace_id:
  140. initial_messages = None
  141. run_config.trace_id = resume_trace_id
  142. else:
  143. initial_messages = messages
  144. run_config.name = f"{task_name}:测试任务"
  145. while not should_exit:
  146. if current_trace_id:
  147. run_config.trace_id = current_trace_id
  148. final_response = ""
  149. # 如果是恢复 trace,进入交互菜单
  150. if current_trace_id and initial_messages is None:
  151. check_trace = await store.get_trace(current_trace_id)
  152. if check_trace:
  153. if check_trace.status == "completed":
  154. print(f"\n[Trace] ✅ 已完成")
  155. print(f" - Total messages: {check_trace.total_messages}")
  156. print(f" - Total cost: ${check_trace.total_cost:.4f}")
  157. elif check_trace.status == "failed":
  158. print(f"\n[Trace] ❌ 已失败: {check_trace.error_message}")
  159. elif check_trace.status == "stopped":
  160. print(f"\n[Trace] ⏸️ 已停止")
  161. print(f" - Total messages: {check_trace.total_messages}")
  162. else:
  163. print(f"\n[Trace] 📊 状态: {check_trace.status}")
  164. print(f" - Total messages: {check_trace.total_messages}")
  165. current_sequence = check_trace.head_sequence
  166. menu_result = await interactive.show_menu(current_trace_id, current_sequence)
  167. if menu_result["action"] == "stop":
  168. break
  169. elif menu_result["action"] == "continue":
  170. new_messages = menu_result.get("messages", [])
  171. if new_messages:
  172. initial_messages = new_messages
  173. run_config.after_sequence = menu_result.get("after_sequence")
  174. else:
  175. initial_messages = []
  176. run_config.after_sequence = None
  177. continue
  178. break
  179. if initial_messages is None:
  180. initial_messages = []
  181. print(f"{'▶️ 开始执行...' if not current_trace_id else '▶️ 继续执行...'}")
  182. # 执行 Agent
  183. paused = False
  184. try:
  185. async for item in runner.run(messages=initial_messages, config=run_config):
  186. # 检查用户中断
  187. cmd = interactive.check_stdin()
  188. if cmd == 'pause':
  189. print("\n⏸️ 正在暂停执行...")
  190. if current_trace_id:
  191. await runner.stop(current_trace_id)
  192. await asyncio.sleep(0.5)
  193. menu_result = await interactive.show_menu(current_trace_id, current_sequence)
  194. if menu_result["action"] == "stop":
  195. should_exit = True
  196. paused = True
  197. break
  198. elif menu_result["action"] == "continue":
  199. new_messages = menu_result.get("messages", [])
  200. if new_messages:
  201. initial_messages = new_messages
  202. after_seq = menu_result.get("after_sequence")
  203. if after_seq is not None:
  204. run_config.after_sequence = after_seq
  205. paused = True
  206. break
  207. else:
  208. initial_messages = []
  209. run_config.after_sequence = None
  210. paused = True
  211. break
  212. elif cmd == 'quit':
  213. print("\n🛑 用户请求停止...")
  214. if current_trace_id:
  215. await runner.stop(current_trace_id)
  216. should_exit = True
  217. break
  218. # 处理 Trace 对象
  219. if isinstance(item, Trace):
  220. current_trace_id = item.trace_id
  221. if item.status == "running":
  222. print(f"[Trace] 开始: {item.trace_id[:8]}...")
  223. elif item.status == "completed":
  224. print(f"\n[Trace] ✅ 完成")
  225. print(f" - Total messages: {item.total_messages}")
  226. print(f" - Total cost: ${item.total_cost:.4f}")
  227. elif item.status == "failed":
  228. print(f"\n[Trace] ❌ 失败: {item.error_message}")
  229. elif item.status == "stopped":
  230. print(f"\n[Trace] ⏸️ 已停止")
  231. # 处理 Message 对象
  232. elif isinstance(item, Message):
  233. current_sequence = item.sequence
  234. if item.role == "assistant":
  235. content = item.content
  236. if isinstance(content, dict):
  237. text = content.get("text", "")
  238. tool_calls = content.get("tool_calls")
  239. if text and not tool_calls:
  240. final_response = text
  241. print(f"\n[Response] Agent 回复:")
  242. print(text)
  243. elif text:
  244. preview = text[:150] + "..." if len(text) > 150 else text
  245. print(f"[Assistant] {preview}")
  246. elif item.role == "tool":
  247. content = item.content
  248. tool_name = "unknown"
  249. if isinstance(content, dict):
  250. tool_name = content.get("tool_name", "unknown")
  251. if item.description and item.description != tool_name:
  252. desc = item.description[:80] if len(item.description) > 80 else item.description
  253. print(f"[Tool Result] ✅ {tool_name}: {desc}...")
  254. else:
  255. print(f"[Tool Result] ✅ {tool_name}")
  256. except Exception as e:
  257. print(f"\n执行出错: {e}")
  258. import traceback
  259. traceback.print_exc()
  260. if paused:
  261. if should_exit:
  262. break
  263. continue
  264. if should_exit:
  265. break
  266. # Runner 退出后显示交互菜单
  267. if current_trace_id:
  268. menu_result = await interactive.show_menu(current_trace_id, current_sequence)
  269. if menu_result["action"] == "stop":
  270. break
  271. elif menu_result["action"] == "continue":
  272. new_messages = menu_result.get("messages", [])
  273. if new_messages:
  274. initial_messages = new_messages
  275. run_config.after_sequence = menu_result.get("after_sequence")
  276. else:
  277. initial_messages = []
  278. run_config.after_sequence = None
  279. continue
  280. break
  281. except KeyboardInterrupt:
  282. print("\n\n用户中断 (Ctrl+C)")
  283. if current_trace_id:
  284. await runner.stop(current_trace_id)
  285. # 输出结果
  286. if final_response:
  287. print()
  288. print("=" * 60)
  289. print("Agent 响应:")
  290. print("=" * 60)
  291. print(final_response)
  292. print("=" * 60)
  293. print()
  294. output_file = output_dir / "result.txt"
  295. with open(output_file, 'w', encoding='utf-8') as f:
  296. f.write(final_response)
  297. print(f"✓ 结果已保存到: {output_file}")
  298. print()
  299. # 可视化提示
  300. if current_trace_id:
  301. print("=" * 60)
  302. print("可视化 Step Tree:")
  303. print("=" * 60)
  304. print("1. 启动 API Server:")
  305. print(" python3 api_server.py")
  306. print()
  307. print("2. 浏览器访问:")
  308. print(" http://localhost:8000/api/traces")
  309. print()
  310. print(f"3. Trace ID: {current_trace_id}")
  311. print("=" * 60)
  312. if __name__ == "__main__":
  313. asyncio.run(main())