run.py 6.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184
  1. """
  2. 浏览器调研示例 (增强版)
  3. 功能:
  4. 1. 使用 Agent 模式进行网络调研
  5. 2. 任务结束自动关闭浏览器并杀掉进程
  6. 3. 异常安全:即使程序崩溃也能清理环境
  7. """
  8. import os
  9. import sys
  10. import asyncio
  11. from pathlib import Path
  12. # 添加项目根目录到 Python 路径
  13. sys.path.insert(0, str(Path(__file__).parent.parent.parent))
  14. from dotenv import load_dotenv
  15. load_dotenv()
  16. import logging
  17. # 配置感知日志
  18. logging.basicConfig(level=logging.WARNING) # 默认 WARNING
  19. logging.getLogger("agent.core.message_manager").setLevel(logging.INFO) # 开启感知日志
  20. logging.getLogger("tools").setLevel(logging.INFO) # 开启工具日志
  21. from agent.llm.prompts import SimplePrompt
  22. from agent.core.runner import AgentRunner
  23. from agent.trace import (
  24. FileSystemTraceStore,
  25. Trace,
  26. Message,
  27. )
  28. from agent.llm import create_openrouter_llm_call
  29. # 导入浏览器清理工具
  30. from agent.tools.builtin.browser.baseClass import kill_browser_session
  31. async def main():
  32. # 路径配置
  33. base_dir = Path(__file__).parent
  34. project_root = base_dir.parent.parent
  35. prompt_path = base_dir / "test.prompt"
  36. output_dir = base_dir / "output"
  37. output_dir.mkdir(exist_ok=True)
  38. # Skills 目录
  39. skills_dir = None
  40. print("=" * 60)
  41. print("🚀 浏览器调研任务 (Agent 模式)")
  42. print("=" * 60)
  43. print()
  44. # 1. 加载 prompt
  45. print("1. 加载 prompt...")
  46. prompt = SimplePrompt(prompt_path)
  47. # 提取配置
  48. system_prompt = prompt._messages.get("system", "")
  49. user_task = prompt._messages.get("user", "")
  50. model_name = prompt.config.get('model', 'gemini-2.5-flash')
  51. temperature = float(prompt.config.get('temperature', 0.3))
  52. print(f" - 任务: {user_task[:80]}...")
  53. print(f" - 模型: {model_name}")
  54. # 2. 构建消息
  55. print("2. 构建任务消息...")
  56. messages = prompt.build_messages()
  57. # 3. 创建 Agent Runner
  58. print("3. 创建 Agent Runner...")
  59. runner = AgentRunner(
  60. trace_store=FileSystemTraceStore(base_path=str(trace_dir)),
  61. llm_call=create_openrouter_llm_call(model=f"google/{model_name}"),
  62. skills_dir=skills_dir,
  63. debug=True
  64. )
  65. final_response = ""
  66. current_trace_id = None
  67. # 4. Agent 模式执行(使用 try...finally 确保清理)
  68. try:
  69. print(f"4. 启动 Agent 模式执行...")
  70. print()
  71. async for item in runner.run(
  72. task=user_task,
  73. messages=messages,
  74. system_prompt=system_prompt,
  75. model=f"google/{model_name}",
  76. temperature=temperature,
  77. max_iterations=20,
  78. ):
  79. # 处理 Trace 对象(整体状态变化)
  80. if isinstance(item, Trace):
  81. current_trace_id = item.trace_id
  82. if item.status == "running":
  83. print(f"[Trace] 开始: {item.trace_id[:8]}")
  84. elif item.status == "completed":
  85. print(f"[Trace] 完成")
  86. print(f" - Total tokens: {item.total_tokens}")
  87. print(f" - Total cost: ${item.total_cost:.4f}")
  88. elif item.status == "failed":
  89. print(f"[Trace] 失败: {item.error_message}")
  90. # 处理 Message 对象(执行过程)
  91. elif isinstance(item, Message):
  92. if item.role == "assistant":
  93. content = item.content
  94. if isinstance(content, dict):
  95. text = content.get("text", "")
  96. tool_calls = content.get("tool_calls")
  97. if text and not tool_calls:
  98. final_response = text
  99. print(f"[Response] Agent 给出最终回复")
  100. elif text:
  101. # 增加打印长度到 300,方便观察
  102. print(f"[Assistant] {text[:300]}...")
  103. if tool_calls:
  104. for tc in tool_calls:
  105. tool_name = tc.get("function", {}).get("name", "unknown")
  106. print(f"[Tool Call] 🛠️ {tool_name}")
  107. elif item.role == "tool":
  108. content = item.content
  109. if isinstance(content, dict):
  110. tool_name = content.get("tool_name", "unknown")
  111. print(f"[Tool Result] ✅ {tool_name}")
  112. if item.description:
  113. desc = item.description[:80] if len(item.description) > 80 else item.description
  114. print(f" {desc}...")
  115. # 5. 输出结果
  116. print()
  117. print("=" * 60)
  118. print("Final Agent Response:")
  119. print("=" * 60)
  120. print(final_response)
  121. print("=" * 60)
  122. print()
  123. # 6. 保存结果
  124. output_file = output_dir / "research_result.txt"
  125. with open(output_file, 'w', encoding='utf-8') as f:
  126. f.write(final_response)
  127. print(f"✓ 结果已保存到: {output_file}")
  128. except Exception as e:
  129. print(f"\n❌ 程序运行崩溃: {str(e)}")
  130. import traceback
  131. traceback.print_exc()
  132. finally:
  133. # --- 核心逻辑:无论成功失败,必须关闭浏览器进程 ---
  134. print("\n" + "·" * 40)
  135. print("🧹 正在清理浏览器环境,关闭 CDP 会话并终止进程...")
  136. try:
  137. # 强制杀掉浏览器进程,释放容器或本地端口
  138. await kill_browser_session()
  139. print("✅ 浏览器已安全关闭。")
  140. except Exception as cleanup_err:
  141. print(f"⚠️ 清理浏览器时出现错误: {cleanup_err}")
  142. print("·" * 40 + "\n")
  143. # 7. 可视化提示
  144. if current_trace_id:
  145. print("=" * 60)
  146. print("可视化 Step Tree:")
  147. print("=" * 60)
  148. print("1. 启动 API Server: python3 api_server.py")
  149. print(f"2. 访问: http://localhost:8000/api/traces")
  150. print(f"3. Trace ID: {current_trace_id}")
  151. print("=" * 60)
  152. if __name__ == "__main__":
  153. try:
  154. asyncio.run(main())
  155. except KeyboardInterrupt:
  156. print("\n🛑 用户手动终止 (KeyboardInterrupt),正在强制退出...")