run.py 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369
"""
Example (simplified version - uses the framework's interactive features).

Uses Agent mode + Skills + the framework's interactive controller.

New features:
1. Uses the InteractiveController provided by the framework
2. Uses a config file to manage run parameters
3. Can be interrupted from the command line at any time
   (type 'p' to pause, 'q' to quit)
4. Intervention messages can be inserted after pausing
5. Supports triggering an experience summary
6. View the current GoalTree
7. Supports resuming an existing Trace via --trace <ID>
"""
import argparse
import os
import sys
import asyncio
from pathlib import Path
# Clash Verge TUN mode compatibility: stop httpx/urllib from auto-detecting
# the system HTTP proxy. setdefault keeps any value the user already exported.
os.environ.setdefault("no_proxy", "*")
# Add the project root (three levels above this file) to the Python path.
# This must run before the `agent` / `config` imports below.
sys.path.insert(0, str(Path(__file__).parent.parent.parent))
from dotenv import load_dotenv
# Load variables from a .env file before the project modules are imported.
load_dotenv()
from agent.llm.prompts import SimplePrompt
from agent.core.runner import AgentRunner, RunConfig
from agent.core.presets import AgentPreset, register_preset
from agent.trace import (
    FileSystemTraceStore,
    Trace,
    Message,
)
from agent.llm import create_openrouter_llm_call
from agent.cli import InteractiveController
from agent.utils import setup_logging
from agent.tools.builtin.browser.baseClass import init_browser_session, kill_browser_session
# Import the project configuration.
from config import RUN_CONFIG, SKILLS_DIR, TRACE_STORE_PATH, DEBUG, LOG_LEVEL, LOG_FILE, BROWSER_TYPE, HEADLESS
  38. async def main():
  39. # 解析命令行参数
  40. parser = argparse.ArgumentParser(description="任务 (Agent 模式 + 交互增强)")
  41. parser.add_argument(
  42. "--trace", type=str, default=None,
  43. help="已有的 Trace ID,用于恢复继续执行(不指定则新建)",
  44. )
  45. args = parser.parse_args()
  46. # 路径配置
  47. base_dir = Path(__file__).parent
  48. project_root = base_dir.parent.parent
  49. prompt_path = base_dir / "research.prompt"
  50. output_dir = base_dir / "output_1"
  51. output_dir.mkdir(exist_ok=True)
  52. # 1. 配置日志
  53. setup_logging(level=LOG_LEVEL, file=LOG_FILE)
  54. # 2. 加载项目级 presets
  55. print("2. 加载 presets...")
  56. presets_path = base_dir / "presets.json"
  57. if presets_path.exists():
  58. import json
  59. with open(presets_path, "r", encoding="utf-8") as f:
  60. project_presets = json.load(f)
  61. for name, cfg in project_presets.items():
  62. register_preset(name, AgentPreset(**cfg))
  63. print(f" - 已加载项目 presets: {list(project_presets.keys())}")
  64. # 3. 加载 prompt
  65. print("3. 加载 prompt...")
  66. prompt = SimplePrompt(prompt_path)
  67. # 4. 构建任务消息
  68. print("4. 构建任务消息...")
  69. messages = prompt.build_messages()
  70. # 5. 初始化浏览器
  71. import platform
  72. actual_browser_type = BROWSER_TYPE
  73. if platform.system() == "Windows" and BROWSER_TYPE == "local":
  74. actual_browser_type = "cloud"
  75. print("⚠️ Windows 平台检测到本地浏览器配置,自动切换为云浏览器模式")
  76. browser_mode_name = "云浏览器" if actual_browser_type == "cloud" else "本地浏览器"
  77. print(f"5. 正在初始化{browser_mode_name}...")
  78. await init_browser_session(
  79. browser_type=actual_browser_type,
  80. headless=HEADLESS,
  81. url="about:blank"
  82. )
  83. print(f" ✅ {browser_mode_name}初始化完成\n")
  84. # 6. 创建 Agent Runner
  85. print("6. 创建 Agent Runner...")
  86. print(f" - Skills 目录: {SKILLS_DIR}")
  87. print(f" - 模型: {RUN_CONFIG.model}")
  88. store = FileSystemTraceStore(base_path=TRACE_STORE_PATH)
  89. runner = AgentRunner(
  90. trace_store=store,
  91. llm_call=create_openrouter_llm_call(model=f"anthropic/{RUN_CONFIG.model}"),
  92. skills_dir=SKILLS_DIR,
  93. debug=DEBUG
  94. )
  95. # 7. 创建交互控制器
  96. interactive = InteractiveController(
  97. runner=runner,
  98. store=store,
  99. enable_stdin_check=True
  100. )
  101. # 8. 任务信息
  102. task_name = RUN_CONFIG.name or base_dir.name
  103. print("=" * 60)
  104. print(f"{task_name}")
  105. print("=" * 60)
  106. print("💡 交互提示:")
  107. print(" - 执行过程中输入 'p' 或 'pause' 暂停并进入交互模式")
  108. print(" - 执行过程中输入 'q' 或 'quit' 停止执行")
  109. print("=" * 60)
  110. print()
  111. # 9. 判断是新建还是恢复
  112. resume_trace_id = args.trace
  113. if resume_trace_id:
  114. existing_trace = await store.get_trace(resume_trace_id)
  115. if not existing_trace:
  116. print(f"\n错误: Trace 不存在: {resume_trace_id}")
  117. sys.exit(1)
  118. print(f"恢复已有 Trace: {resume_trace_id[:8]}...")
  119. print(f" - 状态: {existing_trace.status}")
  120. print(f" - 消息数: {existing_trace.total_messages}")
  121. print(f"\n💡 提示:恢复 Trace 时会先进入交互菜单,您可以选择从指定消息续跑")
  122. else:
  123. print(f"启动新 Agent...")
  124. print()
  125. final_response = ""
  126. current_trace_id = resume_trace_id
  127. current_sequence = 0
  128. should_exit = False
  129. try:
  130. # 配置
  131. run_config = RUN_CONFIG
  132. if resume_trace_id:
  133. initial_messages = None
  134. run_config.trace_id = resume_trace_id
  135. else:
  136. initial_messages = messages
  137. run_config.name = f"{task_name}:调研任务"
  138. while not should_exit:
  139. if current_trace_id:
  140. run_config.trace_id = current_trace_id
  141. final_response = ""
  142. # 如果是恢复 trace 或 trace 已完成/失败且没有新消息,进入交互菜单
  143. if current_trace_id and initial_messages is None:
  144. check_trace = await store.get_trace(current_trace_id)
  145. if check_trace:
  146. # 显示 trace 状态
  147. if check_trace.status == "completed":
  148. print(f"\n[Trace] ✅ 已完成")
  149. print(f" - Total messages: {check_trace.total_messages}")
  150. print(f" - Total cost: ${check_trace.total_cost:.4f}")
  151. elif check_trace.status == "failed":
  152. print(f"\n[Trace] ❌ 已失败: {check_trace.error_message}")
  153. elif check_trace.status == "stopped":
  154. print(f"\n[Trace] ⏸️ 已停止")
  155. print(f" - Total messages: {check_trace.total_messages}")
  156. else:
  157. print(f"\n[Trace] 📊 状态: {check_trace.status}")
  158. print(f" - Total messages: {check_trace.total_messages}")
  159. current_sequence = check_trace.head_sequence
  160. menu_result = await interactive.show_menu(current_trace_id, current_sequence)
  161. if menu_result["action"] == "stop":
  162. break
  163. elif menu_result["action"] == "continue":
  164. new_messages = menu_result.get("messages", [])
  165. if new_messages:
  166. initial_messages = new_messages
  167. run_config.after_sequence = menu_result.get("after_sequence")
  168. else:
  169. initial_messages = []
  170. run_config.after_sequence = None
  171. continue
  172. break
  173. # 如果没有进入菜单(新建 trace),设置初始消息
  174. if initial_messages is None:
  175. initial_messages = []
  176. print(f"{'▶️ 开始执行...' if not current_trace_id else '▶️ 继续执行...'}")
  177. # 执行 Agent
  178. paused = False
  179. try:
  180. async for item in runner.run(messages=initial_messages, config=run_config):
  181. # 检查用户中断
  182. cmd = interactive.check_stdin()
  183. if cmd == 'pause':
  184. print("\n⏸️ 正在暂停执行...")
  185. if current_trace_id:
  186. await runner.stop(current_trace_id)
  187. await asyncio.sleep(0.5)
  188. menu_result = await interactive.show_menu(current_trace_id, current_sequence)
  189. if menu_result["action"] == "stop":
  190. should_exit = True
  191. paused = True
  192. break
  193. elif menu_result["action"] == "continue":
  194. new_messages = menu_result.get("messages", [])
  195. if new_messages:
  196. initial_messages = new_messages
  197. after_seq = menu_result.get("after_sequence")
  198. if after_seq is not None:
  199. run_config.after_sequence = after_seq
  200. paused = True
  201. break
  202. else:
  203. initial_messages = []
  204. run_config.after_sequence = None
  205. paused = True
  206. break
  207. elif cmd == 'quit':
  208. print("\n🛑 用户请求停止...")
  209. if current_trace_id:
  210. await runner.stop(current_trace_id)
  211. should_exit = True
  212. break
  213. # 处理 Trace 对象
  214. if isinstance(item, Trace):
  215. current_trace_id = item.trace_id
  216. if item.status == "running":
  217. print(f"[Trace] 开始: {item.trace_id[:8]}...")
  218. elif item.status == "completed":
  219. print(f"\n[Trace] ✅ 完成")
  220. print(f" - Total messages: {item.total_messages}")
  221. print(f" - Total cost: ${item.total_cost:.4f}")
  222. elif item.status == "failed":
  223. print(f"\n[Trace] ❌ 失败: {item.error_message}")
  224. elif item.status == "stopped":
  225. print(f"\n[Trace] ⏸️ 已停止")
  226. # 处理 Message 对象
  227. elif isinstance(item, Message):
  228. current_sequence = item.sequence
  229. if item.role == "assistant":
  230. content = item.content
  231. if isinstance(content, dict):
  232. text = content.get("text", "")
  233. tool_calls = content.get("tool_calls")
  234. if text and not tool_calls:
  235. final_response = text
  236. print(f"\n[Response] Agent 回复:")
  237. print(text)
  238. elif text:
  239. preview = text[:150] + "..." if len(text) > 150 else text
  240. print(f"[Assistant] {preview}")
  241. elif item.role == "tool":
  242. content = item.content
  243. tool_name = "unknown"
  244. if isinstance(content, dict):
  245. tool_name = content.get("tool_name", "unknown")
  246. if item.description and item.description != tool_name:
  247. desc = item.description[:80] if len(item.description) > 80 else item.description
  248. print(f"[Tool Result] ✅ {tool_name}: {desc}...")
  249. else:
  250. print(f"[Tool Result] ✅ {tool_name}")
  251. except Exception as e:
  252. print(f"\n执行出错: {e}")
  253. import traceback
  254. traceback.print_exc()
  255. if paused:
  256. if should_exit:
  257. break
  258. continue
  259. if should_exit:
  260. break
  261. # Runner 退出后显示交互菜单
  262. if current_trace_id:
  263. menu_result = await interactive.show_menu(current_trace_id, current_sequence)
  264. if menu_result["action"] == "stop":
  265. break
  266. elif menu_result["action"] == "continue":
  267. new_messages = menu_result.get("messages", [])
  268. if new_messages:
  269. initial_messages = new_messages
  270. run_config.after_sequence = menu_result.get("after_sequence")
  271. else:
  272. initial_messages = []
  273. run_config.after_sequence = None
  274. continue
  275. break
  276. except KeyboardInterrupt:
  277. print("\n\n用户中断 (Ctrl+C)")
  278. if current_trace_id:
  279. await runner.stop(current_trace_id)
  280. finally:
  281. # 清理浏览器会话
  282. try:
  283. await kill_browser_session()
  284. except Exception:
  285. pass
  286. # 7. 输出结果
  287. if final_response:
  288. print()
  289. print("=" * 60)
  290. print("Agent 响应:")
  291. print("=" * 60)
  292. print(final_response)
  293. print("=" * 60)
  294. print()
  295. output_file = output_dir / "result.txt"
  296. with open(output_file, 'w', encoding='utf-8') as f:
  297. f.write(final_response)
  298. print(f"✓ 结果已保存到: {output_file}")
  299. print()
  300. # 可视化提示
  301. if current_trace_id:
  302. print("=" * 60)
  303. print("可视化 Step Tree:")
  304. print("=" * 60)
  305. print("1. 启动 API Server:")
  306. print(" python3 api_server.py")
  307. print()
  308. print("2. 浏览器访问:")
  309. print(" http://localhost:8000/api/traces")
  310. print()
  311. print(f"3. Trace ID: {current_trace_id}")
  312. print("=" * 60)
# Script entry point: when executed directly (not imported), run the
# main() coroutine to completion with asyncio.run.
if __name__ == "__main__":
    asyncio.run(main())