run.py 24 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624
  1. """
  2. 示例(增强版)
  3. 使用 Agent 模式 + Skills
  4. 新增功能:
  5. 1. 支持命令行随时打断(输入 'p' 暂停,'q' 退出)
  6. 2. 暂停后可插入干预消息
  7. 3. 支持触发经验总结
  8. 4. 查看当前 GoalTree
  9. 5. 框架层自动清理不完整的工具调用
  10. 6. 支持通过 --trace <ID> 恢复已有 Trace 继续执行
  11. """
  12. import argparse
  13. import os
  14. import sys
  15. import select
  16. import asyncio
  17. from pathlib import Path
  18. # Clash Verge TUN 模式兼容:禁止 httpx/urllib 自动检测系统 HTTP 代理
  19. # TUN 虚拟网卡已在网络层接管所有流量,不需要应用层再走 HTTP 代理,
  20. # 否则 httpx 检测到 macOS 系统代理 (127.0.0.1:7897) 会导致 ConnectError
  21. os.environ.setdefault("no_proxy", "*")
  22. # 添加项目根目录到 Python 路径
  23. sys.path.insert(0, str(Path(__file__).parent.parent.parent))
  24. from dotenv import load_dotenv
  25. load_dotenv()
  26. from agent.llm.prompts import SimplePrompt
  27. from agent.core.runner import AgentRunner, RunConfig
  28. from agent.core.presets import AgentPreset, register_preset
  29. from agent.trace import (
  30. FileSystemTraceStore,
  31. Trace,
  32. Message,
  33. )
  34. from agent.llm import create_openrouter_llm_call
  35. from agent.tools import get_tool_registry
  36. os.environ.setdefault("no_proxy", "*")
  37. # ===== 非阻塞 stdin 检测 =====
  38. if sys.platform == 'win32':
  39. import msvcrt
  40. def check_stdin() -> str | None:
  41. """
  42. 跨平台非阻塞检查 stdin 输入。
  43. Windows: 使用 msvcrt.kbhit()
  44. macOS/Linux: 使用 select.select()
  45. """
  46. if sys.platform == 'win32':
  47. # 检查是否有按键按下
  48. if msvcrt.kbhit():
  49. # 读取按下的字符(msvcrt.getwch 是非阻塞读取宽字符)
  50. ch = msvcrt.getwch().lower()
  51. if ch == 'p':
  52. return 'pause'
  53. if ch == 'q':
  54. return 'quit'
  55. # 如果是其他按键,可以选择消耗掉或者忽略
  56. return None
  57. else:
  58. # Unix/Mac 逻辑
  59. ready, _, _ = select.select([sys.stdin], [], [], 0)
  60. if ready:
  61. line = sys.stdin.readline().strip().lower()
  62. if line in ('p', 'pause'):
  63. return 'pause'
  64. if line in ('q', 'quit'):
  65. return 'quit'
  66. return None
  67. # ===== 交互菜单 =====
  68. def _read_multiline() -> str:
  69. """
  70. 读取多行输入,以连续两次回车(空行)结束。
  71. 单次回车只是换行,不会提前终止输入。
  72. """
  73. print("\n请输入干预消息(连续输入两次回车结束):")
  74. lines: list[str] = []
  75. blank_count = 0
  76. while True:
  77. line = input()
  78. if line == "":
  79. blank_count += 1
  80. if blank_count >= 2:
  81. break
  82. lines.append("") # 保留单个空行
  83. else:
  84. blank_count = 0
  85. lines.append(line)
  86. # 去掉尾部多余空行
  87. while lines and lines[-1] == "":
  88. lines.pop()
  89. return "\n".join(lines)
  90. async def show_interactive_menu(
  91. runner: AgentRunner,
  92. trace_id: str,
  93. current_sequence: int,
  94. store: FileSystemTraceStore,
  95. ):
  96. """
  97. 显示交互式菜单,让用户选择操作。
  98. 进入本函数前不再有后台线程占用 stdin,所以 input() 能正常工作。
  99. """
  100. print("\n" + "=" * 60)
  101. print(" 执行已暂停")
  102. print("=" * 60)
  103. print("请选择操作:")
  104. print(" 1. 插入干预消息并继续")
  105. print(" 2. 触发经验总结(reflect)")
  106. print(" 3. 查看当前 GoalTree")
  107. print(" 4. 手动压缩上下文(compact)")
  108. print(" 5. 继续执行")
  109. print(" 6. 停止执行")
  110. print(" 7. 经验库瘦身(合并相似经验)")
  111. print("=" * 60)
  112. while True:
  113. choice = input("请输入选项 (1-7): ").strip()
  114. if choice == "1":
  115. text = _read_multiline()
  116. if not text:
  117. print("未输入任何内容,取消操作")
  118. continue
  119. print(f"\n将插入干预消息并继续执行...")
  120. # 从 store 读取实际的 last_sequence,避免本地 current_sequence 过时
  121. live_trace = await store.get_trace(trace_id)
  122. actual_sequence = live_trace.last_sequence if live_trace and live_trace.last_sequence else current_sequence
  123. return {
  124. "action": "continue",
  125. "messages": [{"role": "user", "content": text}],
  126. "after_sequence": actual_sequence,
  127. }
  128. elif choice == "2":
  129. # 触发经验总结
  130. print("\n触发经验总结...")
  131. focus = input("请输入反思重点(可选,直接回车跳过): ").strip()
  132. # 触发反思
  133. await perform_reflection(runner, store, trace_id, focus=focus)
  134. continue
  135. elif choice == "3":
  136. goal_tree = await store.get_goal_tree(trace_id)
  137. if goal_tree and goal_tree.goals:
  138. print("\n当前 GoalTree:")
  139. print(goal_tree.to_prompt())
  140. else:
  141. print("\n当前没有 Goal")
  142. continue
  143. elif choice == "4":
  144. # 手动压缩上下文
  145. print("\n正在执行上下文压缩(compact)...")
  146. try:
  147. goal_tree = await store.get_goal_tree(trace_id)
  148. trace = await store.get_trace(trace_id)
  149. if not trace:
  150. print("未找到 Trace,无法压缩")
  151. continue
  152. # 重建当前 history
  153. main_path = await store.get_main_path_messages(trace_id, trace.head_sequence)
  154. history = [msg.to_llm_dict() for msg in main_path]
  155. head_seq = main_path[-1].sequence if main_path else 0
  156. next_seq = head_seq + 1
  157. compact_config = RunConfig(trace_id=trace_id)
  158. new_history, new_head, new_seq = await runner._compress_history(
  159. trace_id=trace_id,
  160. history=history,
  161. goal_tree=goal_tree,
  162. config=compact_config,
  163. sequence=next_seq,
  164. head_seq=head_seq,
  165. )
  166. print(f"\n✅ 压缩完成: {len(history)} 条消息 → {len(new_history)} 条")
  167. except Exception as e:
  168. print(f"\n❌ 压缩失败: {e}")
  169. continue
  170. elif choice == "5":
  171. print("\n继续执行...")
  172. return {"action": "continue"}
  173. elif choice == "6":
  174. print("\n停止执行...")
  175. return {"action": "stop"}
  176. elif choice == "7":
  177. # 经验库瘦身
  178. print("\n正在执行经验库瘦身...")
  179. from agent.tools.builtin.experience import slim_experiences
  180. try:
  181. result = await slim_experiences()
  182. print(f"\n{result}")
  183. except Exception as e:
  184. print(f"\n经验库瘦身失败: {e}")
  185. continue
  186. else:
  187. print("无效选项,请重新输入")
  188. async def perform_reflection(runner: AgentRunner, store: FileSystemTraceStore, trace_id: str, focus: str = ""):
  189. """执行经验总结并保存(带结构化 YAML 解析)"""
  190. from agent.trace.compaction import build_reflect_prompt
  191. import re as _re2
  192. import uuid as _uuid2
  193. from datetime import datetime
  194. trace = await store.get_trace(trace_id)
  195. if not trace:
  196. return
  197. saved_head = trace.head_sequence
  198. prompt = build_reflect_prompt()
  199. if focus:
  200. prompt += f"\n\n请特别关注:{focus}"
  201. print("正在生成反思...")
  202. reflect_cfg = RunConfig(trace_id=trace_id, max_iterations=1, tools=[])
  203. reflection_text = ""
  204. try:
  205. result = await runner.run_result(
  206. messages=[{"role": "user", "content": prompt}],
  207. config=reflect_cfg,
  208. )
  209. reflection_text = result.get("summary", "")
  210. finally:
  211. # 恢复 head_sequence(反思消息成为侧枝,不污染主对话)
  212. await store.update_trace(trace_id, head_sequence=saved_head)
  213. # 追加到 experiences 文件
  214. if reflection_text:
  215. experiences_path = runner.experiences_path or "./.cache/experiences_restore.md"
  216. os.makedirs(os.path.dirname(experiences_path), exist_ok=True)
  217. pattern = r"-\s*\[(?P<tags>.*?)\]\s*(?P<content>.*)"
  218. matches = list(_re2.finditer(pattern, reflection_text))
  219. structured_entries = []
  220. for match in matches:
  221. tags_str = match.group("tags")
  222. content = match.group("content")
  223. intent_match = _re2.search(r"intent:\s*(.*?)(?:,|$)", tags_str, _re2.IGNORECASE)
  224. state_match = _re2.search(r"state:\s*(.*?)(?:,|$)", tags_str, _re2.IGNORECASE)
  225. intents = [i.strip() for i in intent_match.group(1).split(",")] if intent_match and intent_match.group(1) else []
  226. states = [s.strip() for s in state_match.group(1).split(",")] if state_match and state_match.group(1) else []
  227. ex_id = f"ex_{datetime.now().strftime('%m%d%H%M')}_{_uuid2.uuid4().hex[:4]}"
  228. entry = f"---\nid: {ex_id}\ntrace_id: {trace_id}\ntags: {{intent: {intents}, state: {states}}}\nmetrics: {{helpful: 1, harmful: 0}}\ncreated_at: {datetime.now().strftime('%Y-%m-%d %H:%M:%S')}\n---\n- {content}\n- 经验ID: [{ex_id}]"
  229. structured_entries.append(entry)
  230. if structured_entries:
  231. final_output = "\n\n" + "\n\n".join(structured_entries)
  232. with open(experiences_path, "a", encoding="utf-8") as f:
  233. f.write(final_output)
  234. print(f"\n✅ 提取了 {len(structured_entries)} 条经验,已结构化并保存到: {experiences_path}")
  235. print("\n--- 反思内容(结构化后) ---")
  236. print(final_output.strip())
  237. print("--- 结束 ---\n")
  238. else:
  239. print("\n⚠️ 未能解析出符合格式的经验条目,已保存原始纯文本以供检查。")
  240. header = f"\n\n---\n\n## [Raw] {trace_id} ({datetime.now().strftime('%Y-%m-%d %H:%M')})\n\n"
  241. with open(experiences_path, "a", encoding="utf-8") as f:
  242. f.write(header + reflection_text + "\n")
  243. print(reflection_text)
  244. else:
  245. print("未生成反思内容")
  246. async def main():
  247. # 解析命令行参数
  248. parser = argparse.ArgumentParser(description="任务 (Agent 模式 + 交互增强)")
  249. parser.add_argument(
  250. "--trace", type=str, default=None,
  251. help="已有的 Trace ID,用于恢复继续执行(不指定则新建)",
  252. )
  253. args = parser.parse_args()
  254. # 路径配置
  255. base_dir = Path(__file__).parent
  256. project_root = base_dir.parent.parent
  257. prompt_path = base_dir / "production.prompt"
  258. output_dir = base_dir / "output_1"
  259. output_dir.mkdir(exist_ok=True)
  260. # 加载项目级 presets(examples/restore/presets.json)
  261. presets_path = base_dir / "presets.json"
  262. if presets_path.exists():
  263. import json
  264. with open(presets_path, "r", encoding="utf-8") as f:
  265. project_presets = json.load(f)
  266. for name, cfg in project_presets.items():
  267. register_preset(name, AgentPreset(**cfg))
  268. print(f" - 已加载项目 presets: {list(project_presets.keys())}")
  269. # Skills 目录(可选:用户自定义 skills)
  270. # 注意:内置 skills(agent/memory/skills/)会自动加载
  271. skills_dir = str(base_dir / "skills")
  272. print("=" * 60)
  273. print("mcp/skills 发现、获取、评价 分析任务 (Agent 模式 + 交互增强)")
  274. print("=" * 60)
  275. print()
  276. print("💡 交互提示:")
  277. print(" - 执行过程中输入 'p' 或 'pause' 暂停并进入交互模式")
  278. print(" - 执行过程中输入 'q' 或 'quit' 停止执行")
  279. print("=" * 60)
  280. print()
  281. # 1. 加载 prompt
  282. print("1. 加载 prompt 配置...")
  283. prompt = SimplePrompt(prompt_path)
  284. # 2. 构建消息(仅新建时使用,恢复时消息已在 trace 中)
  285. print("2. 构建任务消息...")
  286. messages = prompt.build_messages()
  287. # 3. 创建 Agent Runner(配置 skills)
  288. print("3. 创建 Agent Runner...")
  289. print(f" - Skills 目录: {skills_dir}")
  290. print(f" - 模型: {prompt.config.get('model', 'sonnet-4.5')}")
  291. # 加载自定义工具
  292. print(" - 加载自定义工具: nanobanana")
  293. import examples.how.tool # 导入自定义工具模块,触发 @tool 装饰器注册
  294. store = FileSystemTraceStore(base_path=".trace")
  295. runner = AgentRunner(
  296. trace_store=store,
  297. llm_call=create_openrouter_llm_call(model=f"anthropic/claude-{prompt.config.get('model', 'sonnet-4.5')}"),
  298. skills_dir=skills_dir,
  299. experiences_path="./.cache/experiences_restore.md",
  300. debug=True
  301. )
  302. # 4. 判断是新建还是恢复
  303. resume_trace_id = args.trace
  304. if resume_trace_id:
  305. # 验证 trace 存在
  306. existing_trace = await store.get_trace(resume_trace_id)
  307. if not existing_trace:
  308. print(f"\n错误: Trace 不存在: {resume_trace_id}")
  309. sys.exit(1)
  310. print(f"4. 恢复已有 Trace: {resume_trace_id[:8]}...")
  311. print(f" - 状态: {existing_trace.status}")
  312. print(f" - 消息数: {existing_trace.total_messages}")
  313. print(f" - 任务: {existing_trace.task}")
  314. else:
  315. print(f"4. 启动新 Agent 模式...")
  316. print()
  317. final_response = ""
  318. current_trace_id = resume_trace_id
  319. current_sequence = 0
  320. should_exit = False
  321. try:
  322. # 恢复模式:不发送初始消息,只指定 trace_id 续跑
  323. if resume_trace_id:
  324. initial_messages = None # None = 未设置,触发早期菜单检查
  325. config = RunConfig(
  326. model=f"claude-{prompt.config.get('model', 'sonnet-4.5')}",
  327. temperature=float(prompt.config.get('temperature', 0.3)),
  328. max_iterations=1000,
  329. trace_id=resume_trace_id,
  330. )
  331. else:
  332. initial_messages = messages
  333. config = RunConfig(
  334. model=f"claude-{prompt.config.get('model', 'sonnet-4.5')}",
  335. temperature=float(prompt.config.get('temperature', 0.3)),
  336. max_iterations=1000,
  337. name="社交媒体内容解构、建构、评估任务",
  338. enable_research_flow=True, # 显式启用研究流程
  339. )
  340. while not should_exit:
  341. # 如果是续跑,需要指定 trace_id
  342. if current_trace_id:
  343. config.trace_id = current_trace_id
  344. # 清理上一轮的响应,避免失败后显示旧内容
  345. final_response = ""
  346. # 如果 trace 已完成/失败且没有新消息,直接进入交互菜单
  347. # 注意:initial_messages 为 None 表示未设置(首次加载),[] 表示有意为空(用户选择"继续")
  348. if current_trace_id and initial_messages is None:
  349. check_trace = await store.get_trace(current_trace_id)
  350. if check_trace and check_trace.status in ("completed", "failed"):
  351. if check_trace.status == "completed":
  352. print(f"\n[Trace] ✅ 已完成")
  353. print(f" - Total messages: {check_trace.total_messages}")
  354. print(f" - Total cost: ${check_trace.total_cost:.4f}")
  355. else:
  356. print(f"\n[Trace] ❌ 已失败: {check_trace.error_message}")
  357. current_sequence = check_trace.head_sequence
  358. menu_result = await show_interactive_menu(
  359. runner, current_trace_id, current_sequence, store
  360. )
  361. if menu_result["action"] == "stop":
  362. break
  363. elif menu_result["action"] == "continue":
  364. new_messages = menu_result.get("messages", [])
  365. if new_messages:
  366. initial_messages = new_messages
  367. config.after_sequence = menu_result.get("after_sequence")
  368. else:
  369. # 无新消息:对 failed trace 意味着重试,对 completed 意味着继续
  370. initial_messages = []
  371. config.after_sequence = None
  372. continue
  373. break
  374. # 对 stopped/running 等非终态的 trace,直接续跑
  375. initial_messages = []
  376. print(f"{'▶️ 开始执行...' if not current_trace_id else '▶️ 继续执行...'}")
  377. # 执行 Agent
  378. paused = False
  379. try:
  380. async for item in runner.run(messages=initial_messages, config=config):
  381. # 检查用户中断
  382. cmd = check_stdin()
  383. if cmd == 'pause':
  384. # 暂停执行
  385. print("\n⏸️ 正在暂停执行...")
  386. if current_trace_id:
  387. await runner.stop(current_trace_id)
  388. # 等待一小段时间让 runner 处理 stop 信号
  389. await asyncio.sleep(0.5)
  390. # 显示交互菜单
  391. menu_result = await show_interactive_menu(
  392. runner, current_trace_id, current_sequence, store
  393. )
  394. if menu_result["action"] == "stop":
  395. should_exit = True
  396. paused = True
  397. break
  398. elif menu_result["action"] == "continue":
  399. # 检查是否有新消息需要插入
  400. new_messages = menu_result.get("messages", [])
  401. if new_messages:
  402. # 有干预消息,需要重新启动循环
  403. initial_messages = new_messages
  404. after_seq = menu_result.get("after_sequence")
  405. if after_seq is not None:
  406. config.after_sequence = after_seq
  407. paused = True
  408. break
  409. else:
  410. # 没有新消息,需要重启执行
  411. initial_messages = []
  412. config.after_sequence = None
  413. paused = True
  414. break
  415. elif cmd == 'quit':
  416. print("\n🛑 用户请求停止...")
  417. if current_trace_id:
  418. await runner.stop(current_trace_id)
  419. should_exit = True
  420. break
  421. # 处理 Trace 对象(整体状态变化)
  422. if isinstance(item, Trace):
  423. current_trace_id = item.trace_id
  424. if item.status == "running":
  425. print(f"[Trace] 开始: {item.trace_id[:8]}...")
  426. elif item.status == "completed":
  427. print(f"\n[Trace] ✅ 完成")
  428. print(f" - Total messages: {item.total_messages}")
  429. print(f" - Total tokens: {item.total_tokens}")
  430. print(f" - Total cost: ${item.total_cost:.4f}")
  431. elif item.status == "failed":
  432. print(f"\n[Trace] ❌ 失败: {item.error_message}")
  433. elif item.status == "stopped":
  434. print(f"\n[Trace] ⏸️ 已停止")
  435. # 处理 Message 对象(执行过程)
  436. elif isinstance(item, Message):
  437. current_sequence = item.sequence
  438. if item.role == "assistant":
  439. content = item.content
  440. if isinstance(content, dict):
  441. text = content.get("text", "")
  442. tool_calls = content.get("tool_calls")
  443. if text and not tool_calls:
  444. # 纯文本回复(最终响应)
  445. final_response = text
  446. print(f"\n[Response] Agent 回复:")
  447. print(text)
  448. elif text:
  449. preview = text[:150] + "..." if len(text) > 150 else text
  450. print(f"[Assistant] {preview}")
  451. if tool_calls:
  452. for tc in tool_calls:
  453. tool_name = tc.get("function", {}).get("name", "unknown")
  454. print(f"[Tool Call] 🛠️ {tool_name}")
  455. elif item.role == "tool":
  456. content = item.content
  457. if isinstance(content, dict):
  458. tool_name = content.get("tool_name", "unknown")
  459. print(f"[Tool Result] ✅ {tool_name}")
  460. if item.description:
  461. desc = item.description[:80] if len(item.description) > 80 else item.description
  462. print(f" {desc}...")
  463. except Exception as e:
  464. print(f"\n执行出错: {e}")
  465. import traceback
  466. traceback.print_exc()
  467. # paused → 菜单已在暂停时内联显示过
  468. if paused:
  469. if should_exit:
  470. break
  471. continue
  472. # quit → 直接退出
  473. if should_exit:
  474. break
  475. # Runner 退出(完成/失败/停止/异常)→ 显示交互菜单
  476. if current_trace_id:
  477. # 🌟 新增:自动触发反思的生命周期钩子
  478. check_trace = await store.get_trace(current_trace_id)
  479. if check_trace and check_trace.status in ("completed", "failed"):
  480. print(f"\n⚙️ 任务已结束 (状态: {check_trace.status}),正在自动触发经验总结...")
  481. # 如果是失败状态,自动带上针对性的 focus 提示
  482. auto_focus = "本次任务执行失败了,请重点反思失败的原因、踩坑点以及未来应如何避免。" if check_trace.status == "failed" else ""
  483. await perform_reflection(runner, store, current_trace_id, focus=auto_focus)
  484. # 自动反思结束后,依然弹出菜单,让用户决定是彻底退出(6)还是查看总结(3)
  485. menu_result = await show_interactive_menu(
  486. runner, current_trace_id, current_sequence, store
  487. )
  488. if menu_result["action"] == "stop":
  489. break
  490. elif menu_result["action"] == "continue":
  491. new_messages = menu_result.get("messages", [])
  492. if new_messages:
  493. initial_messages = new_messages
  494. config.after_sequence = menu_result.get("after_sequence")
  495. else:
  496. initial_messages = []
  497. config.after_sequence = None
  498. continue
  499. break
  500. except KeyboardInterrupt:
  501. print("\n\n用户中断 (Ctrl+C)")
  502. if current_trace_id:
  503. await runner.stop(current_trace_id)
  504. # 6. 输出结果
  505. if final_response:
  506. print()
  507. print("=" * 60)
  508. print("Agent 响应:")
  509. print("=" * 60)
  510. print(final_response)
  511. print("=" * 60)
  512. print()
  513. # 7. 保存结果
  514. output_file = output_dir / "result.txt"
  515. with open(output_file, 'w', encoding='utf-8') as f:
  516. f.write(final_response)
  517. print(f"✓ 结果已保存到: {output_file}")
  518. print()
  519. # 可视化提示
  520. if current_trace_id:
  521. print("=" * 60)
  522. print("可视化 Step Tree:")
  523. print("=" * 60)
  524. print("1. 启动 API Server:")
  525. print(" python3 api_server.py")
  526. print()
  527. print("2. 浏览器访问:")
  528. print(" http://localhost:8000/api/traces")
  529. print()
  530. print(f"3. Trace ID: {current_trace_id}")
  531. print("=" * 60)
  532. if __name__ == "__main__":
  533. asyncio.run(main())