run.py 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503
"""
Example (enhanced edition).

Runs in Agent mode + Skills.

New features:
1. The run can be interrupted from the command line at any time
   (type 'p' to pause, 'q' to quit)
2. An intervention message can be inserted after pausing
3. An experience summary (reflection) can be triggered
4. The current GoalTree can be inspected
5. The framework layer automatically cleans up incomplete tool calls
6. An existing Trace can be resumed with --trace <ID>
"""
import argparse
import os
import sys
import select
import asyncio
from pathlib import Path

# Clash Verge TUN-mode compatibility: stop httpx/urllib from auto-detecting
# the system HTTP proxy. The TUN virtual NIC already takes over all traffic at
# the network layer, so the application must not go through an HTTP proxy as
# well; otherwise httpx picks up the macOS system proxy (127.0.0.1:7897) and
# fails with ConnectError.
# NOTE: this must run before the agent/LLM modules below are imported.
os.environ.setdefault("no_proxy", "*")

# Add the project root to the Python path so the `agent` package imports below
# resolve when this file is run directly as a script.
sys.path.insert(0, str(Path(__file__).parent.parent.parent))

from dotenv import load_dotenv

# Load variables from a .env file before the agent modules are imported.
load_dotenv()

from agent.llm.prompts import SimplePrompt
from agent.core.runner import AgentRunner, RunConfig
from agent.trace import (
    FileSystemTraceStore,
    Trace,
    Message,
)
from agent.llm import create_yescode_llm_call
  34. # ===== 非阻塞 stdin 检测 =====
  35. def check_stdin() -> str | None:
  36. """
  37. 非阻塞检查 stdin 是否有输入。
  38. 使用 select 轮询,不开后台线程,因此不会与交互菜单的 input() 抢 stdin。
  39. """
  40. ready, _, _ = select.select([sys.stdin], [], [], 0)
  41. if ready:
  42. line = sys.stdin.readline().strip().lower()
  43. if line in ('p', 'pause'):
  44. return 'pause'
  45. if line in ('q', 'quit'):
  46. return 'quit'
  47. return None
  48. # ===== 交互菜单 =====
  49. def _read_multiline() -> str:
  50. """
  51. 读取多行输入,以连续两次回车(空行)结束。
  52. 单次回车只是换行,不会提前终止输入。
  53. """
  54. print("\n请输入干预消息(连续输入两次回车结束):")
  55. lines: list[str] = []
  56. blank_count = 0
  57. while True:
  58. line = input()
  59. if line == "":
  60. blank_count += 1
  61. if blank_count >= 2:
  62. break
  63. lines.append("") # 保留单个空行
  64. else:
  65. blank_count = 0
  66. lines.append(line)
  67. # 去掉尾部多余空行
  68. while lines and lines[-1] == "":
  69. lines.pop()
  70. return "\n".join(lines)
  71. async def show_interactive_menu(
  72. runner: AgentRunner,
  73. trace_id: str,
  74. current_sequence: int,
  75. store: FileSystemTraceStore,
  76. ):
  77. """
  78. 显示交互式菜单,让用户选择操作。
  79. 进入本函数前不再有后台线程占用 stdin,所以 input() 能正常工作。
  80. """
  81. print("\n" + "=" * 60)
  82. print(" 执行已暂停")
  83. print("=" * 60)
  84. print("请选择操作:")
  85. print(" 1. 插入干预消息并继续")
  86. print(" 2. 触发经验总结(reflect)")
  87. print(" 3. 查看当前 GoalTree")
  88. print(" 4. 继续执行")
  89. print(" 5. 停止执行")
  90. print("=" * 60)
  91. while True:
  92. choice = input("请输入选项 (1-5): ").strip()
  93. if choice == "1":
  94. text = _read_multiline()
  95. if not text:
  96. print("未输入任何内容,取消操作")
  97. continue
  98. print(f"\n将插入干预消息并继续执行...")
  99. # 从 store 读取实际的 last_sequence,避免本地 current_sequence 过时
  100. live_trace = await store.get_trace(trace_id)
  101. actual_sequence = live_trace.last_sequence if live_trace and live_trace.last_sequence else current_sequence
  102. return {
  103. "action": "continue",
  104. "messages": [{"role": "user", "content": text}],
  105. "after_sequence": actual_sequence,
  106. }
  107. elif choice == "2":
  108. # 触发经验总结
  109. print("\n触发经验总结...")
  110. focus = input("请输入反思重点(可选,直接回车跳过): ").strip()
  111. from agent.trace.compaction import build_reflect_prompt
  112. # 保存当前 head_sequence
  113. trace = await store.get_trace(trace_id)
  114. saved_head = trace.head_sequence
  115. prompt = build_reflect_prompt()
  116. if focus:
  117. prompt += f"\n\n请特别关注:{focus}"
  118. print("正在生成反思...")
  119. reflect_cfg = RunConfig(trace_id=trace_id, max_iterations=1, tools=[])
  120. reflection_text = ""
  121. try:
  122. result = await runner.run_result(
  123. messages=[{"role": "user", "content": prompt}],
  124. config=reflect_cfg,
  125. )
  126. reflection_text = result.get("summary", "")
  127. finally:
  128. # 恢复 head_sequence(反思消息成为侧枝)
  129. await store.update_trace(trace_id, head_sequence=saved_head)
  130. # 追加到 experiences 文件
  131. if reflection_text:
  132. from datetime import datetime
  133. experiences_path = runner.experiences_path or "./.cache/experiences.md"
  134. os.makedirs(os.path.dirname(experiences_path), exist_ok=True)
  135. header = f"\n\n---\n\n## {trace_id} ({datetime.now().strftime('%Y-%m-%d %H:%M')})\n\n"
  136. with open(experiences_path, "a", encoding="utf-8") as f:
  137. f.write(header + reflection_text + "\n")
  138. print(f"\n反思已保存到: {experiences_path}")
  139. print("\n--- 反思内容 ---")
  140. print(reflection_text)
  141. print("--- 结束 ---\n")
  142. else:
  143. print("未生成反思内容")
  144. continue
  145. elif choice == "3":
  146. goal_tree = await store.get_goal_tree(trace_id)
  147. if goal_tree and goal_tree.goals:
  148. print("\n当前 GoalTree:")
  149. print(goal_tree.to_prompt())
  150. else:
  151. print("\n当前没有 Goal")
  152. continue
  153. elif choice == "4":
  154. print("\n继续执行...")
  155. return {"action": "continue"}
  156. elif choice == "5":
  157. print("\n停止执行...")
  158. return {"action": "stop"}
  159. else:
  160. print("无效选项,请重新输入")
  161. async def main():
  162. # 解析命令行参数
  163. parser = argparse.ArgumentParser(description="任务 (Agent 模式 + 交互增强)")
  164. parser.add_argument(
  165. "--trace", type=str, default=None,
  166. help="已有的 Trace ID,用于恢复继续执行(不指定则新建)",
  167. )
  168. args = parser.parse_args()
  169. # 路径配置
  170. base_dir = Path(__file__).parent
  171. project_root = base_dir.parent.parent
  172. prompt_path = base_dir / "test.prompt"
  173. output_dir = base_dir / "output_1"
  174. output_dir.mkdir(exist_ok=True)
  175. # Skills 目录(可选:用户自定义 skills)
  176. # 注意:内置 skills(agent/skills/core.md)会自动加载
  177. skills_dir = None # 或者指定自定义 skills 目录,如: project_root / "skills"
  178. print("=" * 60)
  179. print("mcp/skills 发现、获取、评价 分析任务 (Agent 模式 + 交互增强)")
  180. print("=" * 60)
  181. print()
  182. print("💡 交互提示:")
  183. print(" - 执行过程中输入 'p' 或 'pause' 暂停并进入交互模式")
  184. print(" - 执行过程中输入 'q' 或 'quit' 停止执行")
  185. print("=" * 60)
  186. print()
  187. # 1. 加载 prompt
  188. print("1. 加载 prompt 配置...")
  189. prompt = SimplePrompt(prompt_path)
  190. # 2. 构建消息(仅新建时使用,恢复时消息已在 trace 中)
  191. print("2. 构建任务消息...")
  192. messages = prompt.build_messages()
  193. # 3. 创建 Agent Runner(配置 skills)
  194. print("3. 创建 Agent Runner...")
  195. print(f" - Skills 目录: {skills_dir}")
  196. print(f" - 模型: {prompt.config.get('model', 'sonnet-4.5')}")
  197. store = FileSystemTraceStore(base_path=".trace")
  198. runner = AgentRunner(
  199. trace_store=store,
  200. llm_call=create_yescode_llm_call(model=f"claude-{prompt.config.get('model', 'sonnet-4.5')}"),
  201. skills_dir=skills_dir,
  202. debug=True
  203. )
  204. # 4. 判断是新建还是恢复
  205. resume_trace_id = args.trace
  206. if resume_trace_id:
  207. # 验证 trace 存在
  208. existing_trace = await store.get_trace(resume_trace_id)
  209. if not existing_trace:
  210. print(f"\n错误: Trace 不存在: {resume_trace_id}")
  211. sys.exit(1)
  212. print(f"4. 恢复已有 Trace: {resume_trace_id[:8]}...")
  213. print(f" - 状态: {existing_trace.status}")
  214. print(f" - 消息数: {existing_trace.total_messages}")
  215. print(f" - 任务: {existing_trace.task}")
  216. else:
  217. print(f"4. 启动新 Agent 模式...")
  218. print()
  219. final_response = ""
  220. current_trace_id = resume_trace_id
  221. current_sequence = 0
  222. should_exit = False
  223. try:
  224. # 恢复模式:不发送初始消息,只指定 trace_id 续跑
  225. if resume_trace_id:
  226. initial_messages = None # None = 未设置,触发早期菜单检查
  227. config = RunConfig(
  228. model=f"claude-{prompt.config.get('model', 'sonnet-4.5')}",
  229. temperature=float(prompt.config.get('temperature', 0.3)),
  230. max_iterations=1000,
  231. trace_id=resume_trace_id,
  232. )
  233. else:
  234. initial_messages = messages
  235. config = RunConfig(
  236. model=f"claude-{prompt.config.get('model', 'sonnet-4.5')}",
  237. temperature=float(prompt.config.get('temperature', 0.3)),
  238. max_iterations=1000,
  239. name="mcp/skills 发现、获取、评价 分析任务",
  240. )
  241. while not should_exit:
  242. # 如果是续跑,需要指定 trace_id
  243. if current_trace_id:
  244. config.trace_id = current_trace_id
  245. # 清理上一轮的响应,避免失败后显示旧内容
  246. final_response = ""
  247. # 如果 trace 已完成/失败且没有新消息,直接进入交互菜单
  248. # 注意:initial_messages 为 None 表示未设置(首次加载),[] 表示有意为空(用户选择"继续")
  249. if current_trace_id and initial_messages is None:
  250. check_trace = await store.get_trace(current_trace_id)
  251. if check_trace and check_trace.status in ("completed", "failed"):
  252. if check_trace.status == "completed":
  253. print(f"\n[Trace] ✅ 已完成")
  254. print(f" - Total messages: {check_trace.total_messages}")
  255. print(f" - Total cost: ${check_trace.total_cost:.4f}")
  256. else:
  257. print(f"\n[Trace] ❌ 已失败: {check_trace.error_message}")
  258. current_sequence = check_trace.head_sequence
  259. menu_result = await show_interactive_menu(
  260. runner, current_trace_id, current_sequence, store
  261. )
  262. if menu_result["action"] == "stop":
  263. break
  264. elif menu_result["action"] == "continue":
  265. new_messages = menu_result.get("messages", [])
  266. if new_messages:
  267. initial_messages = new_messages
  268. config.after_sequence = menu_result.get("after_sequence")
  269. else:
  270. # 无新消息:对 failed trace 意味着重试,对 completed 意味着继续
  271. initial_messages = []
  272. config.after_sequence = None
  273. continue
  274. break
  275. # 对 stopped/running 等非终态的 trace,直接续跑
  276. initial_messages = []
  277. print(f"{'▶️ 开始执行...' if not current_trace_id else '▶️ 继续执行...'}")
  278. # 执行 Agent
  279. paused = False
  280. try:
  281. async for item in runner.run(messages=initial_messages, config=config):
  282. # 检查用户中断
  283. cmd = check_stdin()
  284. if cmd == 'pause':
  285. # 暂停执行
  286. print("\n⏸️ 正在暂停执行...")
  287. if current_trace_id:
  288. await runner.stop(current_trace_id)
  289. # 等待一小段时间让 runner 处理 stop 信号
  290. await asyncio.sleep(0.5)
  291. # 显示交互菜单
  292. menu_result = await show_interactive_menu(
  293. runner, current_trace_id, current_sequence, store
  294. )
  295. if menu_result["action"] == "stop":
  296. should_exit = True
  297. paused = True
  298. break
  299. elif menu_result["action"] == "continue":
  300. # 检查是否有新消息需要插入
  301. new_messages = menu_result.get("messages", [])
  302. if new_messages:
  303. # 有干预消息,需要重新启动循环
  304. initial_messages = new_messages
  305. after_seq = menu_result.get("after_sequence")
  306. if after_seq is not None:
  307. config.after_sequence = after_seq
  308. paused = True
  309. break
  310. else:
  311. # 没有新消息,需要重启执行
  312. initial_messages = []
  313. config.after_sequence = None
  314. paused = True
  315. break
  316. elif cmd == 'quit':
  317. print("\n🛑 用户请求停止...")
  318. if current_trace_id:
  319. await runner.stop(current_trace_id)
  320. should_exit = True
  321. break
  322. # 处理 Trace 对象(整体状态变化)
  323. if isinstance(item, Trace):
  324. current_trace_id = item.trace_id
  325. if item.status == "running":
  326. print(f"[Trace] 开始: {item.trace_id[:8]}...")
  327. elif item.status == "completed":
  328. print(f"\n[Trace] ✅ 完成")
  329. print(f" - Total messages: {item.total_messages}")
  330. print(f" - Total tokens: {item.total_tokens}")
  331. print(f" - Total cost: ${item.total_cost:.4f}")
  332. elif item.status == "failed":
  333. print(f"\n[Trace] ❌ 失败: {item.error_message}")
  334. elif item.status == "stopped":
  335. print(f"\n[Trace] ⏸️ 已停止")
  336. # 处理 Message 对象(执行过程)
  337. elif isinstance(item, Message):
  338. current_sequence = item.sequence
  339. if item.role == "assistant":
  340. content = item.content
  341. if isinstance(content, dict):
  342. text = content.get("text", "")
  343. tool_calls = content.get("tool_calls")
  344. if text and not tool_calls:
  345. # 纯文本回复(最终响应)
  346. final_response = text
  347. print(f"\n[Response] Agent 回复:")
  348. print(text)
  349. elif text:
  350. preview = text[:150] + "..." if len(text) > 150 else text
  351. print(f"[Assistant] {preview}")
  352. if tool_calls:
  353. for tc in tool_calls:
  354. tool_name = tc.get("function", {}).get("name", "unknown")
  355. print(f"[Tool Call] 🛠️ {tool_name}")
  356. elif item.role == "tool":
  357. content = item.content
  358. if isinstance(content, dict):
  359. tool_name = content.get("tool_name", "unknown")
  360. print(f"[Tool Result] ✅ {tool_name}")
  361. if item.description:
  362. desc = item.description[:80] if len(item.description) > 80 else item.description
  363. print(f" {desc}...")
  364. except Exception as e:
  365. print(f"\n执行出错: {e}")
  366. import traceback
  367. traceback.print_exc()
  368. # paused → 菜单已在暂停时内联显示过
  369. if paused:
  370. if should_exit:
  371. break
  372. continue
  373. # quit → 直接退出
  374. if should_exit:
  375. break
  376. # Runner 退出(完成/失败/停止/异常)→ 显示交互菜单
  377. if current_trace_id:
  378. menu_result = await show_interactive_menu(
  379. runner, current_trace_id, current_sequence, store
  380. )
  381. if menu_result["action"] == "stop":
  382. break
  383. elif menu_result["action"] == "continue":
  384. new_messages = menu_result.get("messages", [])
  385. if new_messages:
  386. initial_messages = new_messages
  387. config.after_sequence = menu_result.get("after_sequence")
  388. else:
  389. initial_messages = []
  390. config.after_sequence = None
  391. continue
  392. break
  393. except KeyboardInterrupt:
  394. print("\n\n用户中断 (Ctrl+C)")
  395. if current_trace_id:
  396. await runner.stop(current_trace_id)
  397. # 6. 输出结果
  398. if final_response:
  399. print()
  400. print("=" * 60)
  401. print("Agent 响应:")
  402. print("=" * 60)
  403. print(final_response)
  404. print("=" * 60)
  405. print()
  406. # 7. 保存结果
  407. output_file = output_dir / "result.txt"
  408. with open(output_file, 'w', encoding='utf-8') as f:
  409. f.write(final_response)
  410. print(f"✓ 结果已保存到: {output_file}")
  411. print()
  412. # 可视化提示
  413. if current_trace_id:
  414. print("=" * 60)
  415. print("可视化 Step Tree:")
  416. print("=" * 60)
  417. print("1. 启动 API Server:")
  418. print(" python3 api_server.py")
  419. print()
  420. print("2. 浏览器访问:")
  421. print(" http://localhost:8000/api/traces")
  422. print()
  423. print(f"3. Trace ID: {current_trace_id}")
  424. print("=" * 60)
# Script entry point: run the async main() only when this file is executed
# directly, not when it is imported.
if __name__ == "__main__":
    asyncio.run(main())