run.py 6.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187
  1. """
  2. 浏览器调研示例 (增强版)
  3. 功能:
  4. 1. 使用 Agent 模式进行网络调研
  5. 2. 任务结束自动关闭浏览器并杀掉进程
  6. 3. 异常安全:即使程序崩溃也能清理环境
  7. """
  8. import os
  9. import sys
  10. import asyncio
  11. from pathlib import Path
  12. # 添加项目根目录到 Python 路径
  13. sys.path.insert(0, str(Path(__file__).parent.parent.parent))
  14. from dotenv import load_dotenv
  15. load_dotenv()
  16. import logging
  17. # 配置感知日志
  18. logging.basicConfig(level=logging.WARNING) # 默认 WARNING
  19. logging.getLogger("agent.core.message_manager").setLevel(logging.INFO) # 开启感知日志
  20. logging.getLogger("tools").setLevel(logging.INFO) # 开启工具日志
  21. from agent.llm.prompts import SimplePrompt
  22. from agent.core.runner import AgentRunner, RunConfig
  23. from agent.trace import (
  24. FileSystemTraceStore,
  25. Trace,
  26. Message,
  27. )
  28. from agent.llm import create_openrouter_llm_call
  29. # 导入浏览器清理工具
  30. from agent.tools.builtin.browser.baseClass import kill_browser_session, init_browser_session
  31. async def main():
  32. # 路径配置
  33. base_dir = Path(__file__).parent
  34. project_root = base_dir.parent.parent
  35. trace_dir = project_root / ".trace"
  36. prompt_path = base_dir / "test.prompt"
  37. output_dir = base_dir / "output"
  38. output_dir.mkdir(exist_ok=True)
  39. # Skills 目录
  40. skills_dir = None
  41. print("=" * 60)
  42. print("🚀 浏览器调研任务 (Agent 模式)")
  43. print("=" * 60)
  44. print()
  45. # 1. 加载 prompt
  46. print("1. 加载 prompt...")
  47. prompt = SimplePrompt(prompt_path)
  48. # 提取配置
  49. system_prompt = prompt._messages.get("system", "")
  50. user_task = prompt._messages.get("user", "")
  51. model_name = prompt.config.get('model', 'gemini-2.5-flash')
  52. temperature = float(prompt.config.get('temperature', 0.3))
  53. print(f" - 任务: {user_task[:80]}...")
  54. print(f" - 模型: {model_name}")
  55. # 2. 构建消息
  56. print("2. 构建任务消息...")
  57. messages = prompt.build_messages()
  58. # 3. 创建 Agent Runner
  59. print("3. 创建 Agent Runner...")
  60. runner = AgentRunner(
  61. trace_store=FileSystemTraceStore(base_path=str(trace_dir)),
  62. llm_call=create_openrouter_llm_call(model=f"google/{model_name}"),
  63. skills_dir=skills_dir,
  64. debug=True
  65. )
  66. final_response = ""
  67. current_trace_id = None
  68. # 4. Agent 模式执行(使用 try...finally 确保清理)
  69. try:
  70. print(f"4. 启动 Agent 模式执行...")
  71. print()
  72. async for item in runner.run(
  73. messages=messages,
  74. config=RunConfig(
  75. system_prompt=system_prompt,
  76. model=f"google/{model_name}",
  77. temperature=temperature,
  78. max_iterations=20,
  79. name=user_task[:50],
  80. ),
  81. ):
  82. # 处理 Trace 对象(整体状态变化)
  83. if isinstance(item, Trace):
  84. current_trace_id = item.trace_id
  85. if item.status == "running":
  86. print(f"[Trace] 开始: {item.trace_id[:8]}")
  87. elif item.status == "completed":
  88. print(f"[Trace] 完成")
  89. print(f" - Total tokens: {item.total_tokens}")
  90. print(f" - Total cost: ${item.total_cost:.4f}")
  91. elif item.status == "failed":
  92. print(f"[Trace] 失败: {item.error_message}")
  93. # 处理 Message 对象(执行过程)
  94. elif isinstance(item, Message):
  95. if item.role == "assistant":
  96. content = item.content
  97. if isinstance(content, dict):
  98. text = content.get("text", "")
  99. tool_calls = content.get("tool_calls")
  100. if text and not tool_calls:
  101. final_response = text
  102. print(f"[Response] Agent 给出最终回复")
  103. elif text:
  104. # 增加打印长度到 300,方便观察
  105. print(f"[Assistant] {text[:300]}...")
  106. if tool_calls:
  107. for tc in tool_calls:
  108. tool_name = tc.get("function", {}).get("name", "unknown")
  109. print(f"[Tool Call] 🛠️ {tool_name}")
  110. elif item.role == "tool":
  111. content = item.content
  112. if isinstance(content, dict):
  113. tool_name = content.get("tool_name", "unknown")
  114. print(f"[Tool Result] ✅ {tool_name}")
  115. if item.description:
  116. desc = item.description[:80] if len(item.description) > 80 else item.description
  117. print(f" {desc}...")
  118. # 5. 输出结果
  119. print()
  120. print("=" * 60)
  121. print("Final Agent Response:")
  122. print("=" * 60)
  123. print(final_response)
  124. print("=" * 60)
  125. print()
  126. # 6. 保存结果
  127. output_file = output_dir / "research_result.txt"
  128. with open(output_file, 'w', encoding='utf-8') as f:
  129. f.write(final_response)
  130. print(f"✓ 结果已保存到: {output_file}")
  131. except Exception as e:
  132. print(f"\n❌ 程序运行崩溃: {str(e)}")
  133. import traceback
  134. traceback.print_exc()
  135. finally:
  136. # --- 核心逻辑:无论成功失败,必须关闭浏览器进程 ---
  137. print("\n" + "·" * 40)
  138. print("🧹 正在清理浏览器环境,关闭 CDP 会话并终止进程...")
  139. try:
  140. # 强制杀掉浏览器进程,释放容器或本地端口
  141. await kill_browser_session()
  142. print("✅ 浏览器已安全关闭。")
  143. except Exception as cleanup_err:
  144. print(f"⚠️ 清理浏览器时出现错误: {cleanup_err}")
  145. print("·" * 40 + "\n")
  146. # 7. 可视化提示
  147. if current_trace_id:
  148. print("=" * 60)
  149. print("可视化 Step Tree:")
  150. print("=" * 60)
  151. print("1. 启动 API Server: python3 api_server.py")
  152. print(f"2. 访问: http://localhost:8000/api/traces")
  153. print(f"3. Trace ID: {current_trace_id}")
  154. print("=" * 60)
  155. if __name__ == "__main__":
  156. try:
  157. asyncio.run(main())
  158. except KeyboardInterrupt:
  159. print("\n🛑 用户手动终止 (KeyboardInterrupt),正在强制退出...")