3 months ago · ee727bea75
--- a/agent/core/runner.py
+++ b/agent/core/runner.py
@@ -28,15 +28,54 @@ logger = logging.getLogger(__name__)
 
				 
			
 
				 # 内置工具列表（始终自动加载）
			
 
				 BUILTIN_TOOLS = [
			
 
				+    # 文件操作工具
			
 
				     "read_file",
			
 
				     "edit_file",
			
 
				     "write_file",
			
 
				     "glob_files",
			
 
				     "grep_content",
			
 
				+
			
 
				+    # 系统工具
			
 
				     "bash_command",
			
 
				+
			
 
				+    # 技能和目标管理
			
 
				     "skill",
			
 
				     "list_skills",
			
 
				     "goal",
			
 
				+
			
 
				+    # 搜索工具
			
 
				+    "search_posts",
			
 
				+    "get_search_suggestions",
			
 
				+
			
 
				+    # 沙箱工具
			
 
				+    "sandbox_create_environment",
			
 
				+    "sandbox_run_shell",
			
 
				+    "sandbox_rebuild_with_ports",
			
 
				+    "sandbox_destroy_environment",
			
 
				+
			
 
				+    # 浏览器工具
			
 
				+    "browser_navigate_to_url",
			
 
				+    "browser_search_web",
			
 
				+    "browser_go_back",
			
 
				+    "browser_wait",
			
 
				+    "browser_click_element",
			
 
				+    "browser_input_text",
			
 
				+    "browser_send_keys",
			
 
				+    "browser_upload_file",
			
 
				+    "browser_scroll_page",
			
 
				+    "browser_find_text",
			
 
				+    "browser_screenshot",
			
 
				+    "browser_switch_tab",
			
 
				+    "browser_close_tab",
			
 
				+    "browser_get_dropdown_options",
			
 
				+    "browser_select_dropdown_option",
			
 
				+    "browser_extract_content",
			
 
				+    "browser_get_page_html",
			
 
				+    "browser_get_selector_map",
			
 
				+    "browser_evaluate",
			
 
				+    "browser_ensure_login_with_cookies",
			
 
				+    "browser_wait_for_user_action",
			
 
				+    "browser_done",
			
 
				 ]
			
 
				 
			
 
				 
			
@@ -121,15 +160,6 @@ class AgentRunner:
 
				         trace_id = None
			
 
				         message_id = None
			
 
				 
			
 
				-        # 创建 Trace
			
 
				-        if trace and self.trace_store:
			
 
				-            trace_obj = Trace.create(
			
 
				-                mode="call",
			
 
				-                uid=uid,
			
 
				-                context={"model": model}
			
 
				-            )
			
 
				-            trace_id = await self.trace_store.create_trace(trace_obj)
			
 
				-
			
 
				         # 准备工具 Schema
			
 
				         tool_names = BUILTIN_TOOLS.copy()
			
 
				         if tools:
			
@@ -139,6 +169,17 @@ class AgentRunner:
 
				 
			
 
				         tool_schemas = self.tools.get_schemas(tool_names)
			
 
				 
			
 
				+        # 创建 Trace
			
 
				+        if trace and self.trace_store:
			
 
				+            trace_obj = Trace.create(
			
 
				+                mode="call",
			
 
				+                uid=uid,
			
 
				+                model=model,
			
 
				+                tools=tool_schemas,  # 保存工具定义
			
 
				+                llm_params=kwargs,  # 保存 LLM 参数
			
 
				+            )
			
 
				+            trace_id = await self.trace_store.create_trace(trace_obj)
			
 
				+
			
 
				         # 调用 LLM
			
 
				         result = await self.llm_call(
			
 
				             messages=messages,
			
@@ -155,7 +196,9 @@ class AgentRunner:
 
				                 sequence=1,
			
 
				                 goal_id=None,  # 单次调用没有 goal
			
 
				                 content={"text": result.get("content", ""), "tool_calls": result.get("tool_calls")},
			
 
				-                tokens=result.get("prompt_tokens", 0) + result.get("completion_tokens", 0),
			
 
				+                prompt_tokens=result.get("prompt_tokens", 0),
			
 
				+                completion_tokens=result.get("completion_tokens", 0),
			
 
				+                finish_reason=result.get("finish_reason"),
			
 
				                 cost=result.get("cost", 0),
			
 
				             )
			
 
				             message_id = await self.trace_store.add_message(msg)
			
@@ -223,6 +266,14 @@ class AgentRunner:
 
				         enable_memory = enable_memory if enable_memory is not None else self.config.enable_memory
			
 
				         auto_execute_tools = auto_execute_tools if auto_execute_tools is not None else self.config.auto_execute_tools
			
 
				 
			
 
				+        # 准备工具 Schema（提前准备，用于 Trace）
			
 
				+        tool_names = BUILTIN_TOOLS.copy()
			
 
				+        if tools:
			
 
				+            for tool in tools:
			
 
				+                if tool not in tool_names:
			
 
				+                    tool_names.append(tool)
			
 
				+        tool_schemas = self.tools.get_schemas(tool_names)
			
 
				+
			
 
				         # 创建 Trace
			
 
				         trace_id = self._generate_id()
			
 
				         trace_obj = Trace(
			
@@ -231,7 +282,9 @@ class AgentRunner:
 
				             task=task,
			
 
				             agent_type=agent_type,
			
 
				             uid=uid,
			
 
				-            context={"model": model, **kwargs},
			
 
				+            model=model,
			
 
				+            tools=tool_schemas,  # 保存工具定义
			
 
				+            llm_params=kwargs,  # 保存 LLM 参数
			
 
				             status="running"
			
 
				         )
			
 
				 
			
@@ -269,6 +322,9 @@ class AgentRunner:
 
				             if messages is None:
			
 
				                 messages = []
			
 
				 
			
 
				+            # 记录初始 system 和 user 消息到 trace
			
 
				+            sequence = 1
			
 
				+
			
 
				             if system_prompt:
			
 
				                 # 注入记忆和 skills 到 system prompt
			
 
				                 full_system = system_prompt
			
@@ -279,9 +335,35 @@ class AgentRunner:
 
				 
			
 
				                 messages = [{"role": "system", "content": full_system}] + messages
			
 
				 
			
 
				+                # 保存 system 消息
			
 
				+                if self.trace_store:
			
 
				+                    system_msg = Message.create(
			
 
				+                        trace_id=trace_id,
			
 
				+                        role="system",
			
 
				+                        sequence=sequence,
			
 
				+                        goal_id=None,  # 初始消息没有 goal
			
 
				+                        content=full_system,
			
 
				+                    )
			
 
				+                    await self.trace_store.add_message(system_msg)
			
 
				+                    yield system_msg
			
 
				+                    sequence += 1
			
 
				+
			
 
				             # 添加任务描述
			
 
				             messages.append({"role": "user", "content": task})
			
 
				 
			
 
				+            # 保存 user 消息（任务描述）
			
 
				+            if self.trace_store:
			
 
				+                user_msg = Message.create(
			
 
				+                    trace_id=trace_id,
			
 
				+                    role="user",
			
 
				+                    sequence=sequence,
			
 
				+                    goal_id=None,  # 初始消息没有 goal
			
 
				+                    content=task,
			
 
				+                )
			
 
				+                await self.trace_store.add_message(user_msg)
			
 
				+                yield user_msg
			
 
				+                sequence += 1
			
 
				+
			
 
				             # 获取 GoalTree
			
 
				             goal_tree = None
			
 
				             if self.trace_store:
			
@@ -291,18 +373,7 @@ class AgentRunner:
 
				                 from agent.tools.builtin.goal import set_goal_tree
			
 
				                 set_goal_tree(goal_tree)
			
 
				 
			
 
				-            # 准备工具 Schema
			
 
				-            tool_names = BUILTIN_TOOLS.copy()
			
 
				-            if tools:
			
 
				-                for tool in tools:
			
 
				-                    if tool not in tool_names:
			
 
				-                        tool_names.append(tool)
			
 
				-
			
 
				-            tool_schemas = self.tools.get_schemas(tool_names)
			
 
				-
			
 
				             # 执行循环
			
 
				-            sequence = 1
			
 
				-
			
 
				             for iteration in range(max_iterations):
			
 
				                 # 注入当前计划到 messages（如果有 goals）
			
 
				                 llm_messages = list(messages)
			
@@ -321,7 +392,10 @@ class AgentRunner:
 
				 
			
 
				                 response_content = result.get("content", "")
			
 
				                 tool_calls = result.get("tool_calls")
			
 
				-                step_tokens = result.get("prompt_tokens", 0) + result.get("completion_tokens", 0)
			
 
				+                finish_reason = result.get("finish_reason")
			
 
				+                prompt_tokens = result.get("prompt_tokens", 0)
			
 
				+                completion_tokens = result.get("completion_tokens", 0)
			
 
				+                step_tokens = prompt_tokens + completion_tokens
			
 
				                 step_cost = result.get("cost", 0)
			
 
				 
			
 
				                 # 获取当前 goal_id
			
@@ -334,7 +408,9 @@ class AgentRunner:
 
				                     sequence=sequence,
			
 
				                     goal_id=current_goal_id,
			
 
				                     content={"text": response_content, "tool_calls": tool_calls},
			
 
				-                    tokens=step_tokens,
			
 
				+                    prompt_tokens=prompt_tokens,
			
 
				+                    completion_tokens=completion_tokens,
			
 
				+                    finish_reason=finish_reason,
			
 
				                     cost=step_cost,
			
 
				                 )
			
 
				 
			
@@ -429,6 +505,7 @@ class AgentRunner:
 
				                 await self.trace_store.update_trace(
			
 
				                     trace_id,
			
 
				                     status="failed",
			
 
				+                    error_message=str(e),
			
 
				                     completed_at=datetime.now()
			
 
				                 )
			
 
				                 trace_obj = await self.trace_store.get_trace(trace_id)
			
--- a/agent/execution/fs_store.py
+++ b/agent/execution/fs_store.py
@@ -316,8 +316,17 @@ class FileSystemTraceStore:
 
				             trace.total_messages += 1
			
 
				             trace.last_sequence = max(trace.last_sequence, message.sequence)
			
 
				 
			
 
				+            # 累计 tokens（拆分）
			
 
				+            if message.prompt_tokens:
			
 
				+                trace.total_prompt_tokens += message.prompt_tokens
			
 
				+            if message.completion_tokens:
			
 
				+                trace.total_completion_tokens += message.completion_tokens
			
 
				+            # 向后兼容：也更新 total_tokens
			
 
				             if message.tokens:
			
 
				                 trace.total_tokens += message.tokens
			
 
				+            elif message.prompt_tokens or message.completion_tokens:
			
 
				+                trace.total_tokens += (message.prompt_tokens or 0) + (message.completion_tokens or 0)
			
 
				+
			
 
				             if message.cost:
			
 
				                 trace.total_cost += message.cost
			
 
				             if message.duration_ms:
			
@@ -329,6 +338,8 @@ class FileSystemTraceStore:
 
				                 total_messages=trace.total_messages,
			
 
				                 last_sequence=trace.last_sequence,
			
 
				                 total_tokens=trace.total_tokens,
			
 
				+                total_prompt_tokens=trace.total_prompt_tokens,
			
 
				+                total_completion_tokens=trace.total_completion_tokens,
			
 
				                 total_cost=trace.total_cost,
			
 
				                 total_duration_ms=trace.total_duration_ms
			
 
				             )
			
@@ -439,9 +450,7 @@ class FileSystemTraceStore:
 
				             if message_file.exists():
			
 
				                 try:
			
 
				                     data = json.loads(message_file.read_text())
			
 
				-                    if data.get("created_at"):
			
 
				-                        data["created_at"] = datetime.fromisoformat(data["created_at"])
			
 
				-                    return Message(**data)
			
 
				+                    return Message.from_dict(data)
			
 
				                 except Exception:
			
 
				                     pass
			
 
				 
			
@@ -461,9 +470,7 @@ class FileSystemTraceStore:
 
				         for message_file in messages_dir.glob("*.json"):
			
 
				             try:
			
 
				                 data = json.loads(message_file.read_text())
			
 
				-                if data.get("created_at"):
			
 
				-                    data["created_at"] = datetime.fromisoformat(data["created_at"])
			
 
				-                messages.append(Message(**data))
			
 
				+                messages.append(Message.from_dict(data))
			
 
				             except Exception:
			
 
				                 continue
			
 
				 
			
--- a/agent/execution/models.py
+++ b/agent/execution/models.py
@@ -41,21 +41,30 @@ class Trace:
 
				 
			
 
				     # 统计
			
 
				     total_messages: int = 0      # 消息总数（改名自 total_steps）
			
 
				-    total_tokens: int = 0
			
 
				+    total_tokens: int = 0        # 总 tokens（向后兼容，= prompt + completion）
			
 
				+    total_prompt_tokens: int = 0      # 总输入 tokens
			
 
				+    total_completion_tokens: int = 0  # 总输出 tokens
			
 
				     total_cost: float = 0.0
			
 
				-    total_duration_ms: int = 0  # 总耗时（毫秒）
			
 
				+    total_duration_ms: int = 0   # 总耗时（毫秒）
			
 
				 
			
 
				     # 进度追踪（head）
			
 
				     last_sequence: int = 0      # 最新 message 的 sequence
			
 
				     last_event_id: int = 0      # 最新事件 ID（用于 WS 续传）
			
 
				 
			
 
				-    # 上下文
			
 
				+    # 配置
			
 
				     uid: Optional[str] = None
			
 
				-    context: Dict[str, Any] = field(default_factory=dict)
			
 
				+    model: Optional[str] = None              # 默认模型
			
 
				+    tools: Optional[List[Dict]] = None       # 工具定义（整个 trace 共享）
			
 
				+    llm_params: Dict[str, Any] = field(default_factory=dict)  # LLM 参数（temperature 等）
			
 
				+    context: Dict[str, Any] = field(default_factory=dict)     # 其他元数据
			
 
				 
			
 
				     # 当前焦点 goal
			
 
				     current_goal_id: Optional[str] = None
			
 
				 
			
 
				+    # 结果
			
 
				+    result_summary: Optional[str] = None     # 执行结果摘要
			
 
				+    error_message: Optional[str] = None      # 错误信息
			
 
				+
			
 
				     # 时间
			
 
				     created_at: datetime = field(default_factory=datetime.now)
			
 
				     completed_at: Optional[datetime] = None
			
@@ -86,13 +95,20 @@ class Trace:
 
				             "status": self.status,
			
 
				             "total_messages": self.total_messages,
			
 
				             "total_tokens": self.total_tokens,
			
 
				+            "total_prompt_tokens": self.total_prompt_tokens,
			
 
				+            "total_completion_tokens": self.total_completion_tokens,
			
 
				             "total_cost": self.total_cost,
			
 
				             "total_duration_ms": self.total_duration_ms,
			
 
				             "last_sequence": self.last_sequence,
			
 
				             "last_event_id": self.last_event_id,
			
 
				             "uid": self.uid,
			
 
				+            "model": self.model,
			
 
				+            "tools": self.tools,
			
 
				+            "llm_params": self.llm_params,
			
 
				             "context": self.context,
			
 
				             "current_goal_id": self.current_goal_id,
			
 
				+            "result_summary": self.result_summary,
			
 
				+            "error_message": self.error_message,
			
 
				             "created_at": self.created_at.isoformat() if self.created_at else None,
			
 
				             "completed_at": self.completed_at.isoformat() if self.completed_at else None,
			
 
				         }
			
@@ -103,15 +119,17 @@ class Message:
 
				     """
			
 
				     执行消息 - Trace 中的 LLM 消息
			
 
				 
			
 
				-    对应 LLM API 消息格式（assistant/tool），通过 goal_id 关联 Goal。
			
 
				+    对应 LLM API 消息格式（system/user/assistant/tool），通过 goal_id 关联 Goal。
			
 
				 
			
 
				     description 字段自动生成规则：
			
 
				+    - system: 取 content 前 200 字符
			
 
				+    - user: 取 content 前 200 字符
			
 
				     - assistant: 优先取 content，若无 content 则生成 "tool call: XX, XX"
			
 
				     - tool: 使用 tool name
			
 
				     """
			
 
				     message_id: str
			
 
				     trace_id: str
			
 
				-    role: Literal["assistant", "tool"]   # 和 LLM API 一致
			
 
				+    role: Literal["system", "user", "assistant", "tool"]   # 和 LLM API 一致
			
 
				     sequence: int                        # 全局顺序
			
 
				     goal_id: Optional[str] = None        # 关联的 Goal 内部 ID（None = 还没有创建 Goal）
			
 
				     description: str = ""                # 消息描述（系统自动生成）
			
@@ -119,23 +137,46 @@ class Message:
 
				     content: Any = None                  # 消息内容（和 LLM API 格式一致）
			
 
				 
			
 
				     # 元数据
			
 
				-    tokens: Optional[int] = None
			
 
				+    prompt_tokens: Optional[int] = None  # 输入 tokens
			
 
				+    completion_tokens: Optional[int] = None  # 输出 tokens
			
 
				     cost: Optional[float] = None
			
 
				     duration_ms: Optional[int] = None
			
 
				     created_at: datetime = field(default_factory=datetime.now)
			
 
				 
			
 
				+    # LLM 响应信息（仅 role="assistant" 时使用）
			
 
				+    finish_reason: Optional[str] = None  # stop, length, tool_calls, content_filter 等
			
 
				+
			
 
				+    @property
			
 
				+    def tokens(self) -> int:
			
 
				+        """动态计算总 tokens（向后兼容）"""
			
 
				+        return (self.prompt_tokens or 0) + (self.completion_tokens or 0)
			
 
				+
			
 
				+    @classmethod
			
 
				+    def from_dict(cls, data: Dict[str, Any]) -> "Message":
			
 
				+        """从字典创建 Message（处理向后兼容）"""
			
 
				+        # 过滤掉已删除的字段
			
 
				+        filtered_data = {k: v for k, v in data.items() if k not in ["tokens", "available_tools"]}
			
 
				+
			
 
				+        # 解析 datetime
			
 
				+        if filtered_data.get("created_at") and isinstance(filtered_data["created_at"], str):
			
 
				+            filtered_data["created_at"] = datetime.fromisoformat(filtered_data["created_at"])
			
 
				+
			
 
				+        return cls(**filtered_data)
			
 
				+
			
 
				     @classmethod
			
 
				     def create(
			
 
				         cls,
			
 
				         trace_id: str,
			
 
				-        role: Literal["assistant", "tool"],
			
 
				+        role: Literal["system", "user", "assistant", "tool"],
			
 
				         sequence: int,
			
 
				         goal_id: Optional[str] = None,
			
 
				         content: Any = None,
			
 
				         tool_call_id: Optional[str] = None,
			
 
				-        tokens: Optional[int] = None,
			
 
				+        prompt_tokens: Optional[int] = None,
			
 
				+        completion_tokens: Optional[int] = None,
			
 
				         cost: Optional[float] = None,
			
 
				         duration_ms: Optional[int] = None,
			
 
				+        finish_reason: Optional[str] = None,
			
 
				     ) -> "Message":
			
 
				         """创建新的 Message，自动生成 description"""
			
 
				         description = cls._generate_description(role, content)
			
@@ -149,9 +190,11 @@ class Message:
 
				             content=content,
			
 
				             description=description,
			
 
				             tool_call_id=tool_call_id,
			
 
				-            tokens=tokens,
			
 
				+            prompt_tokens=prompt_tokens,
			
 
				+            completion_tokens=completion_tokens,
			
 
				             cost=cost,
			
 
				             duration_ms=duration_ms,
			
 
				+            finish_reason=finish_reason,
			
 
				         )
			
 
				 
			
 
				     @staticmethod
			
@@ -159,10 +202,24 @@ class Message:
 
				         """
			
 
				         自动生成 description
			
 
				 
			
 
				+        - system: 取 content 前 200 字符
			
 
				+        - user: 取 content 前 200 字符
			
 
				         - assistant: 优先取 content，若无 content 则生成 "tool call: XX, XX"
			
 
				         - tool: 使用 tool name
			
 
				         """
			
 
				-        if role == "assistant":
			
 
				+        if role == "system":
			
 
				+            # system 消息：直接截取文本
			
 
				+            if isinstance(content, str):
			
 
				+                return content[:200] + "..." if len(content) > 200 else content
			
 
				+            return "system prompt"
			
 
				+
			
 
				+        elif role == "user":
			
 
				+            # user 消息：直接截取文本
			
 
				+            if isinstance(content, str):
			
 
				+                return content[:200] + "..." if len(content) > 200 else content
			
 
				+            return "user message"
			
 
				+
			
 
				+        elif role == "assistant":
			
 
				             # assistant 消息：content 是字典，可能包含 text 和 tool_calls
			
 
				             if isinstance(content, dict):
			
 
				                 # 优先返回文本内容
			
@@ -213,9 +270,12 @@ class Message:
 
				             "tool_call_id": self.tool_call_id,
			
 
				             "content": self.content,
			
 
				             "description": self.description,
			
 
				-            "tokens": self.tokens,
			
 
				+            "tokens": self.tokens,  # 使用 @property 动态计算
			
 
				+            "prompt_tokens": self.prompt_tokens,
			
 
				+            "completion_tokens": self.completion_tokens,
			
 
				             "cost": self.cost,
			
 
				             "duration_ms": self.duration_ms,
			
 
				+            "finish_reason": self.finish_reason,
			
 
				             "created_at": self.created_at.isoformat() if self.created_at else None,
			
 
				         }
			
 
				 
			
--- a/agent/goal/models.py
+++ b/agent/goal/models.py
@@ -142,6 +142,13 @@ class GoalTree:
 
				                 return goal
			
 
				         return None
			
 
				 
			
 
				+    def find_by_display_id(self, display_id: str) -> Optional[Goal]:
			
 
				+        """按显示 ID 查找 Goal（如 "1", "2.1", "2.2"）"""
			
 
				+        for goal in self.goals:
			
 
				+            if self._generate_display_id(goal) == display_id:
			
 
				+                return goal
			
 
				+        return None
			
 
				+
			
 
				     def find_parent(self, goal_id: str) -> Optional[Goal]:
			
 
				         """查找指定 Goal 的父节点"""
			
 
				         goal = self.find(goal_id)
			
@@ -270,8 +277,15 @@ class GoalTree:
 
				         self.current_id = goal_id
			
 
				         return goal
			
 
				 
			
 
				-    def complete(self, goal_id: str, summary: str) -> Goal:
			
 
				-        """完成指定 Goal"""
			
 
				+    def complete(self, goal_id: str, summary: str, clear_focus: bool = True) -> Goal:
			
 
				+        """
			
 
				+        完成指定 Goal
			
 
				+
			
 
				+        Args:
			
 
				+            goal_id: 要完成的目标 ID
			
 
				+            summary: 完成总结
			
 
				+            clear_focus: 如果完成的是当前焦点，是否清除焦点（默认 True）
			
 
				+        """
			
 
				         goal = self.find(goal_id)
			
 
				         if not goal:
			
 
				             raise ValueError(f"Goal not found: {goal_id}")
			
@@ -279,8 +293,8 @@ class GoalTree:
 
				         goal.status = "completed"
			
 
				         goal.summary = summary
			
 
				 
			
 
				-        # 如果完成的是当前焦点，清除焦点
			
 
				-        if self.current_id == goal_id:
			
 
				+        # 如果完成的是当前焦点，根据参数决定是否清除焦点
			
 
				+        if clear_focus and self.current_id == goal_id:
			
 
				             self.current_id = None
			
 
				 
			
 
				         # 检查是否所有兄弟都完成了，如果是则自动完成父节点
			
--- a/agent/goal/tool.py
+++ b/agent/goal/tool.py
@@ -36,33 +36,23 @@ async def goal_tool(
 
				         under: 为指定目标添加子目标
			
 
				         done: 完成当前目标，值为 summary
			
 
				         abandon: 放弃当前目标，值为原因
			
 
				-        focus: 切换焦点到指定内部 id
			
 
				+        focus: 切换焦点到指定 ID
			
 
				 
			
 
				     Returns:
			
 
				         更新后的计划状态文本
			
 
				     """
			
 
				     changes = []
			
 
				 
			
 
				-    # 1. 处理 abandon（先处理，因为可能需要在 add 新目标前放弃旧的）
			
 
				-    if abandon is not None:
			
 
				-        if not tree.current_id:
			
 
				-            return "错误：没有当前目标可以放弃"
			
 
				-        goal = tree.abandon(tree.current_id, abandon)
			
 
				-        display_id = tree._generate_display_id(goal)
			
 
				-        changes.append(f"已放弃: {display_id}. {goal.description}")
			
 
				-
			
 
				-        # 推送事件
			
 
				-        if store and trace_id:
			
 
				-            print(f"[DEBUG] goal_tool: calling store.update_goal for abandon: goal_id={goal.id}")
			
 
				-            await store.update_goal(trace_id, goal.id, status="abandoned", summary=abandon)
			
 
				-        else:
			
 
				-            print(f"[DEBUG] goal_tool: skip event push (store={store}, trace_id={trace_id})")
			
 
				-
			
 
				-    # 2. 处理 done
			
 
				+    # 1. 处理 done（完成当前目标）
			
 
				     if done is not None:
			
 
				         if not tree.current_id:
			
 
				-            return "错误：没有当前目标可以完成"
			
 
				-        goal = tree.complete(tree.current_id, done)
			
 
				+            return f"错误：没有当前目标可以完成。当前焦点为空，请先使用 focus 参数切换到要完成的目标。\n\n当前计划：\n{tree.to_prompt()}"
			
 
				+
			
 
				+        # 完成当前目标
			
 
				+        # 如果同时指定了 focus，则不清空焦点（后面会切换到新目标）
			
 
				+        # 如果只有 done，则清空焦点
			
 
				+        clear_focus = (focus is None)
			
 
				+        goal = tree.complete(tree.current_id, done, clear_focus=clear_focus)
			
 
				         display_id = tree._generate_display_id(goal)
			
 
				         changes.append(f"已完成: {display_id}. {goal.description}")
			
 
				 
			
@@ -73,34 +63,39 @@ async def goal_tool(
 
				         else:
			
 
				             print(f"[DEBUG] goal_tool: skip event push (store={store}, trace_id={trace_id})")
			
 
				 
			
 
				-        # 检查是否有级联完成的父目标
			
 
				+        # 检查是否有级联完成的父目标（complete方法已经处理，这里只需要记录）
			
 
				         if goal.parent_id:
			
 
				             parent = tree.find(goal.parent_id)
			
 
				             if parent and parent.status == "completed":
			
 
				                 parent_display_id = tree._generate_display_id(parent)
			
 
				                 changes.append(f"自动完成: {parent_display_id}. {parent.description}（所有子目标已完成）")
			
 
				 
			
 
				-    # 3. 处理 focus（在 add 之前，这样 add 可以添加到新焦点下）
			
 
				+    # 2. 处理 focus（切换焦点到新目标）
			
 
				     if focus is not None:
			
 
				-        # focus 参数可以是内部 ID 或显示 ID
			
 
				-        # 先尝试作为内部 ID 查找
			
 
				-        goal = tree.find(focus)
			
 
				-
			
 
				-        # 如果找不到，尝试根据显示 ID 查找
			
 
				-        if not goal:
			
 
				-            # 通过遍历所有 goal 查找匹配的显示 ID
			
 
				-            for g in tree.goals:
			
 
				-                if tree._generate_display_id(g) == focus:
			
 
				-                    goal = g
			
 
				-                    break
			
 
				+        goal = tree.find_by_display_id(focus)
			
 
				 
			
 
				         if not goal:
			
 
				-            return f"错误：找不到目标 {focus}"
			
 
				+            return f"错误：找不到目标 {focus}\n\n当前计划：\n{tree.to_prompt()}"
			
 
				 
			
 
				         tree.focus(goal.id)
			
 
				         display_id = tree._generate_display_id(goal)
			
 
				         changes.append(f"切换焦点: {display_id}. {goal.description}")
			
 
				 
			
 
				+    # 3. 处理 abandon（放弃当前目标）
			
 
				+    if abandon is not None:
			
 
				+        if not tree.current_id:
			
 
				+            return f"错误：没有当前目标可以放弃。当前焦点为空。\n\n当前计划：\n{tree.to_prompt()}"
			
 
				+        goal = tree.abandon(tree.current_id, abandon)
			
 
				+        display_id = tree._generate_display_id(goal)
			
 
				+        changes.append(f"已放弃: {display_id}. {goal.description}")
			
 
				+
			
 
				+        # 推送事件
			
 
				+        if store and trace_id:
			
 
				+            print(f"[DEBUG] goal_tool: calling store.update_goal for abandon: goal_id={goal.id}")
			
 
				+            await store.update_goal(trace_id, goal.id, status="abandoned", summary=abandon)
			
 
				+        else:
			
 
				+            print(f"[DEBUG] goal_tool: skip event push (store={store}, trace_id={trace_id})")
			
 
				+
			
 
				     # 4. 处理 add
			
 
				     if add is not None:
			
 
				         # 检查 after 和 under 互斥
			
@@ -120,34 +115,20 @@ async def goal_tool(
 
				             # 确定添加位置
			
 
				             if after is not None:
			
 
				                 # 在指定 goal 后面添加（同层级）
			
 
				-                # after 参数可以是内部 ID 或显示 ID
			
 
				-                target_goal = tree.find(after)
			
 
				-                if not target_goal:
			
 
				-                    # 尝试根据显示 ID 查找
			
 
				-                    for g in tree.goals:
			
 
				-                        if tree._generate_display_id(g) == after:
			
 
				-                            target_goal = g
			
 
				-                            break
			
 
				+                target_goal = tree.find_by_display_id(after)
			
 
				 
			
 
				                 if not target_goal:
			
 
				-                    return f"错误：找不到目标 {after}"
			
 
				+                    return f"错误：找不到目标 {after}\n\n当前计划：\n{tree.to_prompt()}"
			
 
				 
			
 
				                 new_goals = tree.add_goals_after(target_goal.id, descriptions, reasons=reasons)
			
 
				                 changes.append(f"在 {tree._generate_display_id(target_goal)} 后面添加 {len(new_goals)} 个同级目标")
			
 
				 
			
 
				             elif under is not None:
			
 
				                 # 为指定 goal 添加子目标
			
 
				-                # under 参数可以是内部 ID 或显示 ID
			
 
				-                parent_goal = tree.find(under)
			
 
				-                if not parent_goal:
			
 
				-                    # 尝试根据显示 ID 查找
			
 
				-                    for g in tree.goals:
			
 
				-                        if tree._generate_display_id(g) == under:
			
 
				-                            parent_goal = g
			
 
				-                            break
			
 
				+                parent_goal = tree.find_by_display_id(under)
			
 
				 
			
 
				                 if not parent_goal:
			
 
				-                    return f"错误：找不到目标 {under}"
			
 
				+                    return f"错误：找不到目标 {under}\n\n当前计划：\n{tree.to_prompt()}"
			
 
				 
			
 
				                 new_goals = tree.add_goals(descriptions, reasons=reasons, parent_id=parent_goal.id)
			
 
				                 changes.append(f"在 {tree._generate_display_id(parent_goal)} 下添加 {len(new_goals)} 个子目标")
			
@@ -198,11 +179,11 @@ def create_goal_tool_schema() -> dict:
 
				 
			
 
				 - add: 添加目标（逗号分隔多个）
			
 
				 - reason: 创建理由（逗号分隔多个，与 add 一一对应）。说明为什么要做这些目标。
			
 
				-- after: 在指定目标后面添加（同层级）。可以是内部 ID 或显示 ID。
			
 
				-- under: 为指定目标添加子目标。可以是内部 ID 或显示 ID。如已有子目标，追加到最后。
			
 
				+- after: 在指定目标后面添加（同层级）。使用目标的 ID。
			
 
				+- under: 为指定目标添加子目标。使用目标的 ID。如已有子目标，追加到最后。
			
 
				 - done: 完成当前目标，值为 summary
			
 
				 - abandon: 放弃当前目标，值为原因（会触发 context 压缩）
			
 
				-- focus: 切换焦点到指定 id（可以是内部 ID 或显示 ID）
			
 
				+- focus: 切换焦点到指定目标。使用目标的 ID。
			
 
				 
			
 
				 位置控制（优先使用 after）：
			
 
				 - 不指定 after/under: 添加到当前 focus 下作为子目标（无 focus 时添加到顶层）
			
@@ -210,17 +191,22 @@ def create_goal_tool_schema() -> dict:
 
				 - under="X": 为目标 X 添加子目标
			
 
				 - after 和 under 不能同时指定
			
 
				 
			
 
				+执行顺序：
			
 
				+- done → focus → abandon → add
			
 
				+- 如果同时指定 done 和 focus，会先完成当前目标，再切换焦点到新目标
			
 
				+
			
 
				 示例：
			
 
				 - goal(add="分析代码, 实现功能, 测试") - 添加顶层目标
			
 
				 - goal(add="设计接口, 实现代码", under="2") - 为目标2添加子目标
			
 
				 - goal(add="编写文档", after="3") - 在目标3后面添加同级任务
			
 
				 - goal(add="集成测试", after="2.2") - 在目标2.2后面添加同级任务
			
 
				 - goal(done="发现用户模型在 models/user.py") - 完成当前目标
			
 
				+- goal(done="已完成调研", focus="2") - 完成当前目标，切换到目标2
			
 
				 - goal(abandon="方案A需要Redis，环境没有") - 放弃当前目标
			
 
				 
			
 
				-注意：内部 ID 是纯自增数字（"1", "2", "3"），显示 ID 是带层级的（"1", "2.1", "2.2"）。
			
 
				-所有 ID 参数都可以使用任意格式的 ID。
			
 
				-reason 应该与 add 的目标数量一致，如果数量不一致，缺少的 reason 将为空。
			
 
				+注意：
			
 
				+- 目标 ID 的格式为 "1", "2", "2.1", "2.2" 等，在计划视图中可以看到
			
 
				+- reason 应该与 add 的目标数量一致，如果数量不一致，缺少的 reason 将为空
			
 
				 """,
			
 
				         "parameters": {
			
 
				             "type": "object",
			
@@ -235,11 +221,11 @@ reason 应该与 add 的目标数量一致，如果数量不一致，缺少的 r
 
				                 },
			
 
				                 "after": {
			
 
				                     "type": "string",
			
 
				-                    "description": "在指定目标后面添加（同层级）。可以是内部 ID 或显示 ID。"
			
 
				+                    "description": "在指定目标后面添加（同层级）。使用目标的 ID，如 \"2\" 或 \"2.1\"。"
			
 
				                 },
			
 
				                 "under": {
			
 
				                     "type": "string",
			
 
				-                    "description": "为指定目标添加子目标。可以是内部 ID 或显示 ID。"
			
 
				+                    "description": "为指定目标添加子目标。使用目标的 ID，如 \"2\" 或 \"2.1\"。"
			
 
				                 },
			
 
				                 "done": {
			
 
				                     "type": "string",
			
@@ -251,7 +237,7 @@ reason 应该与 add 的目标数量一致，如果数量不一致，缺少的 r
 
				                 },
			
 
				                 "focus": {
			
 
				                     "type": "string",
			
 
				-                    "description": "切换焦点到指定 goal id（可以是内部 ID 或显示 ID）"
			
 
				+                    "description": "切换焦点到指定目标。使用目标的 ID，如 \"2\" 或 \"2.1\"。"
			
 
				                 }
			
 
				             },
			
 
				             "required": []
			
--- a/agent/llm/gemini.py
+++ b/agent/llm/gemini.py
@@ -327,6 +327,7 @@ def create_gemini_llm_call(
 
				                 "tool_calls": List[Dict] | None,
			
 
				                 "prompt_tokens": int,
			
 
				                 "completion_tokens": int,
			
 
				+                "finish_reason": str,
			
 
				                 "cost": float
			
 
				             }
			
 
				         """
			
@@ -375,14 +376,27 @@ def create_gemini_llm_call(
 
				         # 解析响应
			
 
				         content = ""
			
 
				         tool_calls = None
			
 
				+        finish_reason = "stop"  # 默认值
			
 
				 
			
 
				         candidates = gemini_resp.get("candidates", [])
			
 
				         if candidates:
			
 
				             candidate = candidates[0]
			
 
				 
			
 
				+            # 提取 finish_reason（Gemini -> OpenAI 格式映射）
			
 
				+            gemini_finish_reason = candidate.get("finishReason", "STOP")
			
 
				+            if gemini_finish_reason == "STOP":
			
 
				+                finish_reason = "stop"
			
 
				+            elif gemini_finish_reason == "MAX_TOKENS":
			
 
				+                finish_reason = "length"
			
 
				+            elif gemini_finish_reason in ("SAFETY", "RECITATION"):
			
 
				+                finish_reason = "content_filter"
			
 
				+            elif gemini_finish_reason == "MALFORMED_FUNCTION_CALL":
			
 
				+                finish_reason = "stop"  # 映射为 stop，但在 content 中包含错误信息
			
 
				+            else:
			
 
				+                finish_reason = gemini_finish_reason.lower()  # 保持原值，转小写
			
 
				+
			
 
				             # 检查是否有错误
			
 
				-            finish_reason = candidate.get("finishReason")
			
 
				-            if finish_reason == "MALFORMED_FUNCTION_CALL":
			
 
				+            if gemini_finish_reason == "MALFORMED_FUNCTION_CALL":
			
 
				                 # Gemini 返回了格式错误的函数调用
			
 
				                 # 提取 finishMessage 中的内容作为 content
			
 
				                 finish_message = candidate.get("finishMessage", "")
			
@@ -426,6 +440,7 @@ def create_gemini_llm_call(
 
				             "tool_calls": tool_calls,
			
 
				             "prompt_tokens": prompt_tokens,
			
 
				             "completion_tokens": completion_tokens,
			
 
				+            "finish_reason": finish_reason,
			
 
				             "cost": 0.0
			
 
				         }
			
 
				 
			
--- a/agent/llm/openrouter.py
+++ b/agent/llm/openrouter.py
@@ -32,6 +32,7 @@ async def openrouter_llm_call(
 
				             "tool_calls": List[Dict] | None,
			
 
				             "prompt_tokens": int,
			
 
				             "completion_tokens": int,
			
 
				+            "finish_reason": str,
			
 
				             "cost": float
			
 
				         }
			
 
				     """
			
@@ -85,6 +86,7 @@ async def openrouter_llm_call(
 
				 
			
 
				     content = message.get("content", "")
			
 
				     tool_calls = message.get("tool_calls")
			
 
				+    finish_reason = choice.get("finish_reason")  # stop, length, tool_calls, content_filter 等
			
 
				 
			
 
				     # 提取 usage
			
 
				     usage = result.get("usage", {})
			
@@ -99,6 +101,7 @@ async def openrouter_llm_call(
 
				         "tool_calls": tool_calls,
			
 
				         "prompt_tokens": prompt_tokens,
			
 
				         "completion_tokens": completion_tokens,
			
 
				+        "finish_reason": finish_reason,
			
 
				         "cost": cost
			
 
				     }
			
 
				 
			
--- a/agent/skills/core.md
+++ b/agent/skills/core.md
@@ -12,38 +12,56 @@ description: 核心系统能力，自动加载到 System Prompt
 
				 
			
 
				 ## 计划与执行
			
 
				 
			
 
				-对于复杂任务，你要先分析需求，并使用 `step` 工具来管理执行计划和进度。这一工具会形成一棵思维树。
			
 
				+对于复杂任务，你要先分析需求，并使用 `goal` 工具来管理执行计划和进度。这一工具会形成一棵目标树。
			
 
				 
			
 
				 ### 创建计划：拆分任务步骤，创建TODO
			
 
				 
			
 
				 ```
			
 
				-step(plan=["调研并确定方案", "执行方案", "评估结果"])
			
 
				+goal(add="调研并确定方案, 执行方案, 评估结果")
			
 
				 ```
			
 
				 
			
 
				-这将在当前节点下增加3个plan节点。你可以在执行过程中设置进一步的sub plan。
			
 
				+这将创建3个目标。你可以在执行过程中继续添加子目标。
			
 
				 
			
 
				 ### 开始执行
			
 
				 
			
 
				-聚焦到某个目标开始执行：
			
 
				+聚焦到某个目标开始执行（使用目标的 ID）：
			
 
				 
			
 
				 ```
			
 
				-step(focus="调研并确定方案")
			
 
				+goal(focus="1")
			
 
				+```
			
 
				+
			
 
				+目标的 ID 会显示在计划视图中，格式如 "1", "2", "2.1", "2.2" 等。
			
 
				+
			
 
				+### 完成目标
			
 
				+
			
 
				+完成当前目标并提供总结：
			
 
				+
			
 
				+```
			
 
				+goal(done="人物姿势的最佳提取工具是openpose")
			
 
				 ```
			
 
				 
			
 
				 ### 完成并切换
			
 
				 
			
 
				-完成当前目标，提供总结，切换到下一个：
			
 
				+先完成当前目标，再切换焦点到下一个：
			
 
				 
			
 
				 ```
			
 
				-step(complete=True, summary="人物姿势的最佳提取工具是openpose", focus="执行方案")
			
 
				+goal(done="人物姿势的最佳提取工具是openpose", focus="2")
			
 
				 ```
			
 
				 
			
 
				-### 查看进度
			
 
				+这会先完成当前正在执行的目标，然后切换焦点到目标 "2"。
			
 
				+
			
 
				+### 添加子目标
			
 
				 
			
 
				-查看当前执行进度：
			
 
				+为指定目标添加子目标：
			
 
				 
			
 
				 ```
			
 
				-read_progress()
			
 
				+goal(add="设计接口, 实现代码", under="2")
			
 
				+```
			
 
				+
			
 
				+在指定目标后面添加同级目标：
			
 
				+
			
 
				+```
			
 
				+goal(add="编写文档", after="2")
			
 
				 ```
			
 
				 
			
 
				 ### 使用规范
			
@@ -52,9 +70,38 @@ read_progress()
 
				 2. **summary 应简洁**：记录关键结论和发现，不要冗长
			
 
				 3. **计划可调整**：根据执行情况追加或跳过目标
			
 
				 4. **简单任务不需要计划**：单步操作直接执行即可
			
 
				+5. **使用 ID 进行定位**：focus、after、under 参数都使用目标的 ID（如 "1", "2.1"）
			
 
				 
			
 
				 ## 信息调研
			
 
				 
			
 
				-你可以通过联网搜索工具`search_posts`获取来自Github、小红书、微信公众号、知乎等渠道的信息。
			
 
				+你可以通过联网搜索工具`search_posts`获取来自Github、小红书、微信公众号、知乎等渠道的信息。对于需要深度交互的网页内容，使用浏览器工具进行操作。
			
 
				+
			
 
				+调研过程可能需要多次搜索，比如基于搜索结果中获得的启发或信息启动新的搜索，直到得到令人满意的答案。你可以使用`goal`工具管理搜索的过程，或者使用文档记录搜索的中间或最终结果。
			
 
				+
			
 
				+## 浏览器工具使用指南
			
 
				+
			
 
				+所有浏览器工具都以 `browser_` 为前缀。浏览器会话会持久化，无需每次重新启动。
			
 
				+
			
 
				+### 基本工作流程
			
 
				+
			
 
				+1. **页面导航**: 使用 `browser_navigate_to_url` 或 `browser_search_web` 到达目标页面
			
 
				+2. **等待加载**: 页面跳转后调用 `browser_wait(seconds=2)` 等待内容加载
			
 
				+3. **获取元素索引**: 调用 `browser_get_selector_map` 获取可交互元素的索引映射
			
 
				+4. **执行交互**: 使用 `browser_click_element`、`browser_input_text` 等工具操作页面
			
 
				+5. **提取内容**: 使用 `browser_extract_content` 或 `browser_get_page_html` 获取数据
			
 
				+
			
 
				+### 关键原则
			
 
				+
			
 
				+- **必须先获取索引**: 所有 `index` 参数都需要先通过 `browser_get_selector_map` 获取
			
 
				+- **操作后等待**: 任何可能触发页面变化的操作（点击、输入、滚动）后都要调用 `browser_wait`
			
 
				+- **优先用高级工具**: 优先使用 `browser_extract_content` 而不是手动解析HTML
			
 
				+- **登录处理**: 需要登录的网站使用 `browser_ensure_login_with_cookies(cookie_type="xhs")` 注入Cookie
			
 
				+- **复杂操作用JS**: 当标准工具无法满足时，使用 `browser_evaluate` 执行JavaScript代码
			
 
				+
			
 
				+### 工具分类
			
 
				 
			
 
				-调研过程可能需要多次搜索，比如基于搜索结果中获得的启发或信息启动新的搜索，直到得到令人满意的答案。你可以使用`step`工具管理搜索的过程，或者使用文档记录搜索的中间或最终结果。
			
 
				+**导航**: browser_navigate_to_url, browser_search_web, browser_go_back, browser_wait
			
 
				+**交互**: browser_click_element, browser_input_text, browser_send_keys, browser_upload_file
			
 
				+**视图**: browser_scroll_page, browser_find_text, browser_screenshot
			
 
				+**提取**: browser_extract_content, browser_get_page_html, browser_get_selector_map
			
 
				+**高级**: browser_evaluate, browser_ensure_login_with_cookies, browser_wait_for_user_action
			
--- a/agent/tools/builtin/__init__.py
+++ b/agent/tools/builtin/__init__.py
@@ -19,6 +19,9 @@ from agent.tools.builtin.search import search_posts, get_search_suggestions
 
				 from agent.tools.builtin.sandbox import (sandbox_create_environment, sandbox_run_shell,
			
 
				                                          sandbox_rebuild_with_ports,sandbox_destroy_environment)
			
 
				 
			
 
				+# 导入浏览器工具以触发注册
			
 
				+import agent.tools.builtin.browser  # noqa: F401
			
 
				+
			
 
				 __all__ = [
			
 
				     "read_file",
			
 
				     "edit_file",
			
--- a/agent/tools/builtin/browser/__init__.py
+++ b/agent/tools/builtin/browser/__init__.py
@@ -0,0 +1,101 @@
 
				+"""
			
 
				+浏览器工具 - Browser-Use 原生工具适配器
			
 
				+
			
 
				+基于 browser-use 实现的浏览器自动化工具集。
			
 
				+"""
			
 
				+
			
 
				+from agent.tools.builtin.browser.baseClass import (
			
 
				+    # 会话管理
			
 
				+    init_browser_session,
			
 
				+    get_browser_session,
			
 
				+    cleanup_browser_session,
			
 
				+    kill_browser_session,
			
 
				+
			
 
				+    # 导航类工具
			
 
				+    browser_navigate_to_url,
			
 
				+    browser_search_web,
			
 
				+    browser_go_back,
			
 
				+    browser_wait,
			
 
				+
			
 
				+    # 元素交互工具
			
 
				+    browser_click_element,
			
 
				+    browser_input_text,
			
 
				+    browser_send_keys,
			
 
				+    browser_upload_file,
			
 
				+
			
 
				+    # 滚动和视图工具
			
 
				+    browser_scroll_page,
			
 
				+    browser_find_text,
			
 
				+    browser_screenshot,
			
 
				+
			
 
				+    # 标签页管理工具
			
 
				+    browser_switch_tab,
			
 
				+    browser_close_tab,
			
 
				+
			
 
				+    # 下拉框工具
			
 
				+    browser_get_dropdown_options,
			
 
				+    browser_select_dropdown_option,
			
 
				+
			
 
				+    # 内容提取工具
			
 
				+    browser_extract_content,
			
 
				+    browser_get_page_html,
			
 
				+    browser_get_selector_map,
			
 
				+
			
 
				+    # JavaScript 执行工具
			
 
				+    browser_evaluate,
			
 
				+    browser_ensure_login_with_cookies,
			
 
				+
			
 
				+    # 等待用户操作
			
 
				+    browser_wait_for_user_action,
			
 
				+
			
 
				+    # 任务完成
			
 
				+    browser_done,
			
 
				+)
			
 
				+
			
 
				+__all__ = [
			
 
				+    # 会话管理
			
 
				+    'init_browser_session',
			
 
				+    'get_browser_session',
			
 
				+    'cleanup_browser_session',
			
 
				+    'kill_browser_session',
			
 
				+
			
 
				+    # 导航类工具
			
 
				+    'browser_navigate_to_url',
			
 
				+    'browser_search_web',
			
 
				+    'browser_go_back',
			
 
				+    'browser_wait',
			
 
				+
			
 
				+    # 元素交互工具
			
 
				+    'browser_click_element',
			
 
				+    'browser_input_text',
			
 
				+    'browser_send_keys',
			
 
				+    'browser_upload_file',
			
 
				+
			
 
				+    # 滚动和视图工具
			
 
				+    'browser_scroll_page',
			
 
				+    'browser_find_text',
			
 
				+    'browser_screenshot',
			
 
				+
			
 
				+    # 标签页管理工具
			
 
				+    'browser_switch_tab',
			
 
				+    'browser_close_tab',
			
 
				+
			
 
				+    # 下拉框工具
			
 
				+    'browser_get_dropdown_options',
			
 
				+    'browser_select_dropdown_option',
			
 
				+
			
 
				+    # 内容提取工具
			
 
				+    'browser_extract_content',
			
 
				+    'browser_get_page_html',
			
 
				+    'browser_get_selector_map',
			
 
				+
			
 
				+    # JavaScript 执行工具
			
 
				+    'browser_evaluate',
			
 
				+    'browser_ensure_login_with_cookies',
			
 
				+
			
 
				+    # 等待用户操作
			
 
				+    'browser_wait_for_user_action',
			
 
				+
			
 
				+    # 任务完成
			
 
				+    'browser_done',
			
 
				+]
			
--- a/agent/tools/builtin/browser/baseClass.py
+++ b/agent/tools/builtin/browser/baseClass.py
@@ -10,9 +10,29 @@ Native Browser-Use Tools Adapter
 
				 2. 状态自动保持 - 登录状态、Cookie、LocalStorage 等
			
 
				 3. 完整的底层访问 - 可以直接使用 CDP 协议
			
 
				 4. 性能优异 - 避免频繁创建/销毁浏览器实例
			
 
				+5. 多种浏览器类型 - 支持 local、cloud、container 三种模式
			
 
				+
			
 
				+支持的浏览器类型：
			
 
				+1. Local (本地浏览器):
			
 
				+   - 在本地运行 Chrome
			
 
				+   - 支持可视化调试
			
 
				+   - 速度最快
			
 
				+   - 示例: init_browser_session(browser_type="local")
			
 
				+
			
 
				+2. Cloud (云浏览器):
			
 
				+   - 在云端运行
			
 
				+   - 不占用本地资源
			
 
				+   - 适合生产环境
			
 
				+   - 示例: init_browser_session(browser_type="cloud")
			
 
				+
			
 
				+3. Container (容器浏览器):
			
 
				+   - 在独立容器中运行
			
 
				+   - 隔离性好
			
 
				+   - 支持预配置账户
			
 
				+   - 示例: init_browser_session(browser_type="container", container_url="https://example.com")
			
 
				 
			
 
				 使用方法：
			
 
				-1. 在 Agent 初始化时调用 init_browser_session()
			
 
				+1. 在 Agent 初始化时调用 init_browser_session() 并指定 browser_type
			
 
				 2. 使用各个工具函数执行浏览器操作
			
 
				 3. 任务结束时调用 cleanup_browser_session()
			
 
				 
			
@@ -27,6 +47,7 @@ import sys
 
				 import os
			
 
				 import json
			
 
				 import asyncio
			
 
				+import aiohttp
			
 
				 from typing import Optional, List, Dict, Any, Tuple
			
 
				 from pathlib import Path
			
 
				 from urllib.parse import urlparse
			
@@ -44,6 +65,12 @@ from browser_use.tools.service import Tools
 
				 from browser_use.agent.views import ActionResult
			
 
				 from browser_use.filesystem.file_system import FileSystem
			
 
				 
			
 
				+
			
 
				+# ============================================================
			
 
				+# 无需注册的内部辅助函数
			
 
				+# ============================================================
			
 
				+
			
 
				+
			
 
				 # ============================================================
			
 
				 # 全局浏览器会话管理
			
 
				 # ============================================================
			
@@ -53,52 +80,248 @@ _browser_session: Optional[BrowserSession] = None
 
				 _browser_tools: Optional[Tools] = None
			
 
				 _file_system: Optional[FileSystem] = None
			
 
				 
			
 
				+async def create_container(url: str, account_name: str = "liuwenwu") -> Dict[str, Any]:
			
 
				+    """
			
 
				+    创建浏览器容器并导航到指定URL
			
 
				+
			
 
				+    按照 test.md 的要求：
			
 
				+    1.1 调用接口创建容器
			
 
				+    1.2 调用接口创建窗口并导航到URL
			
 
				+
			
 
				+    Args:
			
 
				+        url: 要导航的URL地址
			
 
				+        account_name: 账户名称
			
 
				+
			
 
				+    Returns:
			
 
				+        包含容器信息的字典:
			
 
				+        - success: 是否成功
			
 
				+        - container_id: 容器ID
			
 
				+        - vnc: VNC访问URL
			
 
				+        - cdp: CDP协议URL（用于浏览器连接）
			
 
				+        - connection_id: 窗口连接ID
			
 
				+        - error: 错误信息（如果失败）
			
 
				+    """
			
 
				+    result = {
			
 
				+        "success": False,
			
 
				+        "container_id": None,
			
 
				+        "vnc": None,
			
 
				+        "cdp": None,
			
 
				+        "connection_id": None,
			
 
				+        "error": None
			
 
				+    }
			
 
				+
			
 
				+    try:
			
 
				+        async with aiohttp.ClientSession() as session:
			
 
				+            # 步骤1.1: 创建容器
			
 
				+            print("📦 步骤1.1: 创建容器...")
			
 
				+            create_url = "http://47.84.182.56:8200/api/v1/container/create"
			
 
				+            create_payload = {
			
 
				+                "auto_remove": True,
			
 
				+                "need_port_binding": True,
			
 
				+                "max_lifetime_seconds": 900
			
 
				+            }
			
 
				+
			
 
				+            async with session.post(create_url, json=create_payload) as resp:
			
 
				+                if resp.status != 200:
			
 
				+                    raise RuntimeError(f"创建容器失败: HTTP {resp.status}")
			
 
				+
			
 
				+                create_result = await resp.json()
			
 
				+                if create_result.get("code") != 0:
			
 
				+                    raise RuntimeError(f"创建容器失败: {create_result.get('msg')}")
			
 
				+
			
 
				+                data = create_result.get("data", {})
			
 
				+                result["container_id"] = data.get("container_id")
			
 
				+                result["vnc"] = data.get("vnc")
			
 
				+                result["cdp"] = data.get("cdp")
			
 
				+
			
 
				+                print(f"✅ 容器创建成功")
			
 
				+                print(f"   Container ID: {result['container_id']}")
			
 
				+                print(f"   VNC: {result['vnc']}")
			
 
				+                print(f"   CDP: {result['cdp']}")
			
 
				+
			
 
				+            # 等待容器内的浏览器启动
			
 
				+            print(f"\n⏳ 等待容器内浏览器启动...")
			
 
				+            await asyncio.sleep(5)
			
 
				+
			
 
				+            # 步骤1.2: 创建页面并导航
			
 
				+            print(f"\n📱 步骤1.2: 创建页面并导航到 {url}...")
			
 
				+
			
 
				+            page_create_url = "http://47.84.182.56:8200/api/v1/browser/page/create"
			
 
				+            page_payload = {
			
 
				+                "container_id": result["container_id"],
			
 
				+                "url": url,
			
 
				+                "account_name": account_name,
			
 
				+                "need_wait": True,
			
 
				+                "timeout": 30
			
 
				+            }
			
 
				+
			
 
				+            # 重试机制：最多尝试3次
			
 
				+            max_retries = 3
			
 
				+            page_created = False
			
 
				+            last_error = None
			
 
				+
			
 
				+            for attempt in range(max_retries):
			
 
				+                try:
			
 
				+                    if attempt > 0:
			
 
				+                        print(f"   重试 {attempt + 1}/{max_retries}...")
			
 
				+                        await asyncio.sleep(3)  # 重试前等待
			
 
				+
			
 
				+                    async with session.post(page_create_url, json=page_payload, timeout=aiohttp.ClientTimeout(total=60)) as resp:
			
 
				+                        if resp.status != 200:
			
 
				+                            response_text = await resp.text()
			
 
				+                            last_error = f"HTTP {resp.status}: {response_text[:200]}"
			
 
				+                            continue
			
 
				+
			
 
				+                        page_result = await resp.json()
			
 
				+                        if page_result.get("code") != 0:
			
 
				+                            last_error = f"{page_result.get('msg')}"
			
 
				+                            continue
			
 
				+
			
 
				+                        page_data = page_result.get("data", {})
			
 
				+                        result["connection_id"] = page_data.get("connection_id")
			
 
				+                        result["success"] = True
			
 
				+                        page_created = True
			
 
				+
			
 
				+                        print(f"✅ 页面创建成功")
			
 
				+                        print(f"   Connection ID: {result['connection_id']}")
			
 
				+                        break
			
 
				+
			
 
				+                except asyncio.TimeoutError:
			
 
				+                    last_error = "请求超时"
			
 
				+                    continue
			
 
				+                except aiohttp.ClientError as e:
			
 
				+                    last_error = f"网络错误: {str(e)}"
			
 
				+                    continue
			
 
				+                except Exception as e:
			
 
				+                    last_error = f"未知错误: {str(e)}"
			
 
				+                    continue
			
 
				+
			
 
				+            if not page_created:
			
 
				+                raise RuntimeError(f"创建页面失败（尝试{max_retries}次后）: {last_error}")
			
 
				+
			
 
				+    except Exception as e:
			
 
				+        result["error"] = str(e)
			
 
				+        print(f"❌ 错误: {str(e)}")
			
 
				+
			
 
				+    return result
			
 
				 
			
 
				 async def init_browser_session(
			
 
				+    browser_type: str = "local",
			
 
				     headless: bool = False,
			
 
				-    user_data_dir: Optional[str] = None,
			
 
				+    url: Optional[str] = None,
			
 
				     profile_name: str = "default",
			
 
				+    user_data_dir: Optional[str] = None,
			
 
				     browser_profile: Optional[BrowserProfile] = None,
			
 
				-    use_cloud: bool = False,
			
 
				     **kwargs
			
 
				 ) -> tuple[BrowserSession, Tools]:
			
 
				     """
			
 
				-    初始化全局浏览器会话
			
 
				+    初始化全局浏览器会话 - 支持三种浏览器类型
			
 
				 
			
 
				     Args:
			
 
				+        browser_type: 浏览器类型 ("local", "cloud", "container")
			
 
				         headless: 是否无头模式
			
 
				-        user_data_dir: 用户数据目录（用于保存登录状态）
			
 
				-        profile_name: 配置文件名称
			
 
				-        browser_profile: BrowserProfile 对象（用于预设 cookies 等）
			
 
				-        use_cloud: 是否使用云浏览器（默认 False，使用本地浏览器）
			
 
				+        url: 初始访问URL（可选）
			
 
				+             - local/cloud: 初始化后会自动导航到此URL
			
 
				+             - container: 必需，容器启动时访问的URL
			
 
				+        profile_name: 配置文件/账户名称（默认 "default"）
			
 
				+                     - local: 用于创建用户数据目录路径
			
 
				+                     - cloud: 云浏览器配置ID
			
 
				+                     - container: 容器账户名称
			
 
				+        user_data_dir: 用户数据目录（仅 local 模式，高级用法）
			
 
				+                      如果提供则覆盖 profile_name 生成的路径
			
 
				+        browser_profile: BrowserProfile 对象（通用，高级用法）
			
 
				+                        用于预设 cookies 等
			
 
				         **kwargs: 其他 BrowserSession 参数
			
 
				 
			
 
				     Returns:
			
 
				         (BrowserSession, Tools) 元组
			
 
				+
			
 
				+    Examples:
			
 
				+        # 本地浏览器
			
 
				+        browser, tools = await init_browser_session(
			
 
				+            browser_type="local",
			
 
				+            url="https://www.baidu.com"  # 可选
			
 
				+        )
			
 
				+
			
 
				+        # 云浏览器
			
 
				+        browser, tools = await init_browser_session(
			
 
				+            browser_type="cloud",
			
 
				+            profile_name="my_cloud_profile"  # 可选
			
 
				+        )
			
 
				+
			
 
				+        # 容器浏览器
			
 
				+        browser, tools = await init_browser_session(
			
 
				+            browser_type="container",
			
 
				+            url="https://www.xiaohongshu.com",  # 必需
			
 
				+            profile_name="my_account"  # 可选
			
 
				+        )
			
 
				     """
			
 
				     global _browser_session, _browser_tools, _file_system
			
 
				 
			
 
				     if _browser_session is not None:
			
 
				         return _browser_session, _browser_tools
			
 
				 
			
 
				-    # 设置用户数据目录（持久化登录状态）
			
 
				-    if user_data_dir is None and profile_name and not use_cloud:
			
 
				-        user_data_dir = str(Path.home() / ".browser_use" / "profiles" / profile_name)
			
 
				-        Path(user_data_dir).mkdir(parents=True, exist_ok=True)
			
 
				+    # 验证 browser_type
			
 
				+    valid_types = ["local", "cloud", "container"]
			
 
				+    if browser_type not in valid_types:
			
 
				+        raise ValueError(f"无效的 browser_type: {browser_type}，必须是 {valid_types} 之一")
			
 
				 
			
 
				-    # 创建浏览器会话
			
 
				+    # 创建浏览器会话参数
			
 
				     session_params = {
			
 
				         "headless": headless,
			
 
				     }
			
 
				 
			
 
				-    if use_cloud:
			
 
				-        # 云浏览器模式
			
 
				-        session_params["use_cloud"] = True
			
 
				+    # === Container 模式 ===
			
 
				+    if browser_type == "container":
			
 
				+        print("🐳 使用容器浏览器模式")
			
 
				+
			
 
				+        # container 模式必须提供 URL
			
 
				+        if not url:
			
 
				+            url = "about:blank"  # 使用默认空白页
			
 
				+            print("⚠️  未提供 url 参数，使用默认空白页")
			
 
				+
			
 
				+        # 创建容器并获取 CDP URL
			
 
				+        print(f"📦 正在创建容器...")
			
 
				+        container_info = await create_container(
			
 
				+            url=url,
			
 
				+            account_name=profile_name
			
 
				+        )
			
 
				+
			
 
				+        if not container_info["success"]:
			
 
				+            raise RuntimeError(f"容器创建失败: {container_info['error']}")
			
 
				+
			
 
				+        cdp_url = container_info["cdp"]
			
 
				+        print(f"✅ 容器创建成功")
			
 
				+        print(f"   CDP URL: {cdp_url}")
			
 
				+        print(f"   Container ID: {container_info['container_id']}")
			
 
				+        print(f"   Connection ID: {container_info.get('connection_id')}")
			
 
				+
			
 
				+        # 使用容器的 CDP URL 连接
			
 
				+        session_params["cdp_url"] = cdp_url
			
 
				+
			
 
				+        # 等待容器完全启动
			
 
				+        print("⏳ 等待容器浏览器启动...")
			
 
				+        await asyncio.sleep(3)
			
 
				+
			
 
				+    # === Cloud 模式 ===
			
 
				+    elif browser_type == "cloud":
			
 
				         print("🌐 使用云浏览器模式")
			
 
				-    else:
			
 
				-        # 本地浏览器模式
			
 
				+        session_params["use_cloud"] = True
			
 
				+
			
 
				+        # profile_name 作为云配置ID
			
 
				+        if profile_name and profile_name != "default":
			
 
				+            session_params["cloud_profile_id"] = profile_name
			
 
				+
			
 
				+    # === Local 模式 ===
			
 
				+    else:  # local
			
 
				+        print("💻 使用本地浏览器模式")
			
 
				         session_params["is_local"] = True
			
 
				 
			
 
				+        # 设置用户数据目录（持久化登录状态）
			
 
				+        if user_data_dir is None and profile_name:
			
 
				+            user_data_dir = str(Path.home() / ".browser_use" / "profiles" / profile_name)
			
 
				+            Path(user_data_dir).mkdir(parents=True, exist_ok=True)
			
 
				+
			
 
				         # macOS 上显式指定 Chrome 路径
			
 
				         import platform
			
 
				         if platform.system() == "Darwin":  # macOS
			
@@ -110,13 +333,14 @@ async def init_browser_session(
 
				         if user_data_dir:
			
 
				             session_params["user_data_dir"] = user_data_dir
			
 
				 
			
 
				-    # 只在有值时才添加 browser_profile
			
 
				+    # 只在有值时才添加 browser_profile (适用于所有模式)
			
 
				     if browser_profile:
			
 
				         session_params["browser_profile"] = browser_profile
			
 
				 
			
 
				     # 合并其他参数
			
 
				     session_params.update(kwargs)
			
 
				 
			
 
				+    # 创建浏览器会话
			
 
				     _browser_session = BrowserSession(**session_params)
			
 
				 
			
 
				     # 启动浏览器
			
@@ -132,6 +356,13 @@ async def init_browser_session(
 
				     base_dir.mkdir(parents=True, exist_ok=True)
			
 
				     _file_system = FileSystem(base_dir=str(base_dir))
			
 
				 
			
 
				+    print("✅ 浏览器会话初始化成功")
			
 
				+
			
 
				+    # 如果是 local 或 cloud 模式且提供了 URL，导航到该 URL
			
 
				+    if browser_type in ["local", "cloud"] and url:
			
 
				+        print(f"🔗 导航到: {url}")
			
 
				+        await _browser_tools.navigate(url=url, browser_session=_browser_session)
			
 
				+
			
 
				     return _browser_session, _browser_tools
			
 
				 
			
 
				 
			
@@ -318,12 +549,16 @@ def _fetch_profile_id(cookie_type: str) -> Optional[str]:
 
				         return None
			
 
				 
			
 
				 
			
 
				+# ============================================================
			
 
				+# 需要注册的工具
			
 
				+# ============================================================
			
 
				+
			
 
				 # ============================================================
			
 
				 # 导航类工具 (Navigation Tools)
			
 
				 # ============================================================
			
 
				 
			
 
				 @tool()
			
 
				-async def navigate_to_url(url: str, new_tab: bool = False) -> ToolResult:
			
 
				+async def browser_navigate_to_url(url: str, new_tab: bool = False) -> ToolResult:
			
 
				     """
			
 
				     导航到指定的 URL
			
 
				     Navigate to a specific URL
			
@@ -363,7 +598,7 @@ async def navigate_to_url(url: str, new_tab: bool = False) -> ToolResult:
 
				 
			
 
				 
			
 
				 @tool()
			
 
				-async def search_web(query: str, engine: str = "google") -> ToolResult:
			
 
				+async def browser_search_web(query: str, engine: str = "google") -> ToolResult:
			
 
				     """
			
 
				     使用搜索引擎搜索
			
 
				     Search the web using a search engine
			
@@ -400,7 +635,7 @@ async def search_web(query: str, engine: str = "google") -> ToolResult:
 
				 
			
 
				 
			
 
				 @tool()
			
 
				-async def go_back() -> ToolResult:
			
 
				+async def browser_go_back() -> ToolResult:
			
 
				     """
			
 
				     返回到上一个页面
			
 
				     Go back to the previous page
			
@@ -427,7 +662,7 @@ async def go_back() -> ToolResult:
 
				 
			
 
				 
			
 
				 @tool()
			
 
				-async def wait(seconds: int = 3) -> ToolResult:
			
 
				+async def browser_wait(seconds: int = 3) -> ToolResult:
			
 
				     """
			
 
				     等待指定的秒数
			
 
				     Wait for a specified number of seconds
			
@@ -464,7 +699,7 @@ async def wait(seconds: int = 3) -> ToolResult:
 
				 # ============================================================
			
 
				 
			
 
				 @tool()
			
 
				-async def click_element(index: int) -> ToolResult:
			
 
				+async def browser_click_element(index: int) -> ToolResult:
			
 
				     """
			
 
				     通过索引点击页面元素
			
 
				     Click an element by index
			
@@ -501,7 +736,7 @@ async def click_element(index: int) -> ToolResult:
 
				 
			
 
				 
			
 
				 @tool()
			
 
				-async def input_text(index: int, text: str, clear: bool = True) -> ToolResult:
			
 
				+async def browser_input_text(index: int, text: str, clear: bool = True) -> ToolResult:
			
 
				     """
			
 
				     在指定元素中输入文本
			
 
				     Input text into an element
			
@@ -539,7 +774,7 @@ async def input_text(index: int, text: str, clear: bool = True) -> ToolResult:
 
				 
			
 
				 
			
 
				 @tool()
			
 
				-async def send_keys(keys: str) -> ToolResult:
			
 
				+async def browser_send_keys(keys: str) -> ToolResult:
			
 
				     """
			
 
				     发送键盘按键或快捷键
			
 
				     Send keyboard keys or shortcuts
			
@@ -579,7 +814,7 @@ async def send_keys(keys: str) -> ToolResult:
 
				 
			
 
				 
			
 
				 @tool()
			
 
				-async def upload_file(index: int, path: str) -> ToolResult:
			
 
				+async def browser_upload_file(index: int, path: str) -> ToolResult:
			
 
				     """
			
 
				     上传文件到文件输入元素
			
 
				     Upload a file to a file input element
			
@@ -624,7 +859,7 @@ async def upload_file(index: int, path: str) -> ToolResult:
 
				 # ============================================================
			
 
				 
			
 
				 @tool()
			
 
				-async def scroll_page(down: bool = True, pages: float = 1.0,
			
 
				+async def browser_scroll_page(down: bool = True, pages: float = 1.0,
			
 
				                      index: Optional[int] = None) -> ToolResult:
			
 
				     """
			
 
				     滚动页面或元素
			
@@ -665,7 +900,7 @@ async def scroll_page(down: bool = True, pages: float = 1.0,
 
				 
			
 
				 
			
 
				 @tool()
			
 
				-async def find_text(text: str) -> ToolResult:
			
 
				+async def browser_find_text(text: str) -> ToolResult:
			
 
				     """
			
 
				     查找页面中的文本并滚动到该位置
			
 
				     Find text on the page and scroll to it
			
@@ -701,7 +936,7 @@ async def find_text(text: str) -> ToolResult:
 
				 
			
 
				 
			
 
				 @tool()
			
 
				-async def screenshot() -> ToolResult:
			
 
				+async def browser_screenshot() -> ToolResult:
			
 
				     """
			
 
				     请求在下次观察中包含页面截图
			
 
				     Request a screenshot to be included in the next observation
			
@@ -738,7 +973,7 @@ async def screenshot() -> ToolResult:
 
				 # ============================================================
			
 
				 
			
 
				 @tool()
			
 
				-async def switch_tab(tab_id: str) -> ToolResult:
			
 
				+async def browser_switch_tab(tab_id: str) -> ToolResult:
			
 
				     """
			
 
				     切换到指定标签页
			
 
				     Switch to a different browser tab
			
@@ -773,7 +1008,7 @@ async def switch_tab(tab_id: str) -> ToolResult:
 
				 
			
 
				 
			
 
				 @tool()
			
 
				-async def close_tab(tab_id: str) -> ToolResult:
			
 
				+async def browser_close_tab(tab_id: str) -> ToolResult:
			
 
				     """
			
 
				     关闭指定标签页
			
 
				     Close a browser tab
			
@@ -812,7 +1047,7 @@ async def close_tab(tab_id: str) -> ToolResult:
 
				 # ============================================================
			
 
				 
			
 
				 @tool()
			
 
				-async def get_dropdown_options(index: int) -> ToolResult:
			
 
				+async def browser_get_dropdown_options(index: int) -> ToolResult:
			
 
				     """
			
 
				     获取下拉框的所有选项
			
 
				     Get options from a dropdown element
			
@@ -846,7 +1081,7 @@ async def get_dropdown_options(index: int) -> ToolResult:
 
				 
			
 
				 
			
 
				 @tool()
			
 
				-async def select_dropdown_option(index: int, text: str) -> ToolResult:
			
 
				+async def browser_select_dropdown_option(index: int, text: str) -> ToolResult:
			
 
				     """
			
 
				     选择下拉框选项
			
 
				     Select an option from a dropdown
			
@@ -886,7 +1121,7 @@ async def select_dropdown_option(index: int, text: str) -> ToolResult:
 
				 # ============================================================
			
 
				 
			
 
				 @tool()
			
 
				-async def extract_content(query: str, extract_links: bool = False,
			
 
				+async def browser_extract_content(query: str, extract_links: bool = False,
			
 
				                          start_from_char: int = 0) -> ToolResult:
			
 
				     """
			
 
				     使用 LLM 从页面提取结构化数据
			
@@ -934,7 +1169,7 @@ async def extract_content(query: str, extract_links: bool = False,
 
				 
			
 
				 
			
 
				 @tool()
			
 
				-async def get_page_html() -> ToolResult:
			
 
				+async def browser_get_page_html() -> ToolResult:
			
 
				     """
			
 
				     获取当前页面的完整 HTML
			
 
				     Get the full HTML of the current page
			
@@ -996,7 +1231,7 @@ async def get_page_html() -> ToolResult:
 
				 
			
 
				 
			
 
				 @tool()
			
 
				-async def get_selector_map() -> ToolResult:
			
 
				+async def browser_get_selector_map() -> ToolResult:
			
 
				     """
			
 
				     获取当前页面的元素索引映射
			
 
				     Get the selector map of interactive elements on the current page
			
@@ -1052,7 +1287,7 @@ async def get_selector_map() -> ToolResult:
 
				 # ============================================================
			
 
				 
			
 
				 @tool()
			
 
				-async def evaluate(code: str) -> ToolResult:
			
 
				+async def browser_evaluate(code: str) -> ToolResult:
			
 
				     """
			
 
				     在页面中执行 JavaScript 代码
			
 
				     Execute JavaScript code in the page context
			
@@ -1094,7 +1329,7 @@ async def evaluate(code: str) -> ToolResult:
 
				 
			
 
				 
			
 
				 @tool()
			
 
				-async def ensure_login_with_cookies(cookie_type: str, url: str = "https://www.xiaohongshu.com") -> ToolResult:
			
 
				+async def browser_ensure_login_with_cookies(cookie_type: str, url: str = "https://www.xiaohongshu.com") -> ToolResult:
			
 
				     """
			
 
				     检查登录状态并在需要时注入 cookies
			
 
				     """
			
@@ -1190,7 +1425,7 @@ async def ensure_login_with_cookies(cookie_type: str, url: str = "https://www.xi
 
				 # ============================================================
			
 
				 
			
 
				 @tool()
			
 
				-async def wait_for_user_action(message: str = "Please complete the action in browser",
			
 
				+async def browser_wait_for_user_action(message: str = "Please complete the action in browser",
			
 
				                                timeout: int = 300) -> ToolResult:
			
 
				     """
			
 
				     等待用户在浏览器中完成操作（如登录）
			
@@ -1262,7 +1497,7 @@ async def wait_for_user_action(message: str = "Please complete the action in bro
 
				 # ============================================================
			
 
				 
			
 
				 @tool()
			
 
				-async def done(text: str, success: bool = True,
			
 
				+async def browser_done(text: str, success: bool = True,
			
 
				               files_to_display: Optional[List[str]] = None) -> ToolResult:
			
 
				     """
			
 
				     标记任务完成并返回最终消息
			
@@ -1300,138 +1535,6 @@ async def done(text: str, success: bool = True,
 
				         )
			
 
				 
			
 
				 
			
 
				-# ============================================================
			
 
				-# 容器管理工具 (Container Management Tools)
			
 
				-# ============================================================
			
 
				-
			
 
				-import aiohttp
			
 
				-
			
 
				-async def create_container(url: str, account_name: str = "liuwenwu") -> Dict[str, Any]:
			
 
				-    """
			
 
				-    创建浏览器容器并导航到指定URL
			
 
				-
			
 
				-    按照 test.md 的要求：
			
 
				-    1.1 调用接口创建容器
			
 
				-    1.2 调用接口创建窗口并导航到URL
			
 
				-
			
 
				-    Args:
			
 
				-        url: 要导航的URL地址
			
 
				-        account_name: 账户名称
			
 
				-
			
 
				-    Returns:
			
 
				-        包含容器信息的字典:
			
 
				-        - success: 是否成功
			
 
				-        - container_id: 容器ID
			
 
				-        - vnc: VNC访问URL
			
 
				-        - cdp: CDP协议URL（用于浏览器连接）
			
 
				-        - connection_id: 窗口连接ID
			
 
				-        - error: 错误信息（如果失败）
			
 
				-    """
			
 
				-    result = {
			
 
				-        "success": False,
			
 
				-        "container_id": None,
			
 
				-        "vnc": None,
			
 
				-        "cdp": None,
			
 
				-        "connection_id": None,
			
 
				-        "error": None
			
 
				-    }
			
 
				-
			
 
				-    try:
			
 
				-        async with aiohttp.ClientSession() as session:
			
 
				-            # 步骤1.1: 创建容器
			
 
				-            print("📦 步骤1.1: 创建容器...")
			
 
				-            create_url = "http://47.84.182.56:8200/api/v1/container/create"
			
 
				-            create_payload = {
			
 
				-                "auto_remove": True,
			
 
				-                "need_port_binding": True,
			
 
				-                "max_lifetime_seconds": 900
			
 
				-            }
			
 
				-
			
 
				-            async with session.post(create_url, json=create_payload) as resp:
			
 
				-                if resp.status != 200:
			
 
				-                    raise RuntimeError(f"创建容器失败: HTTP {resp.status}")
			
 
				-
			
 
				-                create_result = await resp.json()
			
 
				-                if create_result.get("code") != 0:
			
 
				-                    raise RuntimeError(f"创建容器失败: {create_result.get('msg')}")
			
 
				-
			
 
				-                data = create_result.get("data", {})
			
 
				-                result["container_id"] = data.get("container_id")
			
 
				-                result["vnc"] = data.get("vnc")
			
 
				-                result["cdp"] = data.get("cdp")
			
 
				-
			
 
				-                print(f"✅ 容器创建成功")
			
 
				-                print(f"   Container ID: {result['container_id']}")
			
 
				-                print(f"   VNC: {result['vnc']}")
			
 
				-                print(f"   CDP: {result['cdp']}")
			
 
				-
			
 
				-            # 等待容器内的浏览器启动
			
 
				-            print(f"\n⏳ 等待容器内浏览器启动...")
			
 
				-            await asyncio.sleep(5)
			
 
				-
			
 
				-            # 步骤1.2: 创建页面并导航
			
 
				-            print(f"\n📱 步骤1.2: 创建页面并导航到 {url}...")
			
 
				-
			
 
				-            page_create_url = "http://47.84.182.56:8200/api/v1/browser/page/create"
			
 
				-            page_payload = {
			
 
				-                "container_id": result["container_id"],
			
 
				-                "url": url,
			
 
				-                "account_name": account_name,
			
 
				-                "need_wait": True,
			
 
				-                "timeout": 30
			
 
				-            }
			
 
				-
			
 
				-            # 重试机制：最多尝试3次
			
 
				-            max_retries = 3
			
 
				-            page_created = False
			
 
				-            last_error = None
			
 
				-
			
 
				-            for attempt in range(max_retries):
			
 
				-                try:
			
 
				-                    if attempt > 0:
			
 
				-                        print(f"   重试 {attempt + 1}/{max_retries}...")
			
 
				-                        await asyncio.sleep(3)  # 重试前等待
			
 
				-
			
 
				-                    async with session.post(page_create_url, json=page_payload, timeout=aiohttp.ClientTimeout(total=60)) as resp:
			
 
				-                        if resp.status != 200:
			
 
				-                            response_text = await resp.text()
			
 
				-                            last_error = f"HTTP {resp.status}: {response_text[:200]}"
			
 
				-                            continue
			
 
				-
			
 
				-                        page_result = await resp.json()
			
 
				-                        if page_result.get("code") != 0:
			
 
				-                            last_error = f"{page_result.get('msg')}"
			
 
				-                            continue
			
 
				-
			
 
				-                        page_data = page_result.get("data", {})
			
 
				-                        result["connection_id"] = page_data.get("connection_id")
			
 
				-                        result["success"] = True
			
 
				-                        page_created = True
			
 
				-
			
 
				-                        print(f"✅ 页面创建成功")
			
 
				-                        print(f"   Connection ID: {result['connection_id']}")
			
 
				-                        break
			
 
				-
			
 
				-                except asyncio.TimeoutError:
			
 
				-                    last_error = "请求超时"
			
 
				-                    continue
			
 
				-                except aiohttp.ClientError as e:
			
 
				-                    last_error = f"网络错误: {str(e)}"
			
 
				-                    continue
			
 
				-                except Exception as e:
			
 
				-                    last_error = f"未知错误: {str(e)}"
			
 
				-                    continue
			
 
				-
			
 
				-            if not page_created:
			
 
				-                raise RuntimeError(f"创建页面失败（尝试{max_retries}次后）: {last_error}")
			
 
				-
			
 
				-    except Exception as e:
			
 
				-        result["error"] = str(e)
			
 
				-        print(f"❌ 错误: {str(e)}")
			
 
				-
			
 
				-    return result
			
 
				-
			
 
				-
			
 
				 # ============================================================
			
 
				 # 导出所有工具函数（供外部使用）
			
 
				 # ============================================================
			
@@ -1444,45 +1547,42 @@ __all__ = [
 
				     'kill_browser_session',
			
 
				 
			
 
				     # 导航类工具
			
 
				-    'navigate_to_url',
			
 
				-    'search_web',
			
 
				-    'go_back',
			
 
				-    'wait',
			
 
				+    'browser_navigate_to_url',
			
 
				+    'browser_search_web',
			
 
				+    'browser_go_back',
			
 
				+    'browser_wait',
			
 
				 
			
 
				     # 元素交互工具
			
 
				-    'click_element',
			
 
				-    'input_text',
			
 
				-    'send_keys',
			
 
				-    'upload_file',
			
 
				+    'browser_click_element',
			
 
				+    'browser_input_text',
			
 
				+    'browser_send_keys',
			
 
				+    'browser_upload_file',
			
 
				 
			
 
				     # 滚动和视图工具
			
 
				-    'scroll_page',
			
 
				-    'find_text',
			
 
				-    'screenshot',
			
 
				+    'browser_scroll_page',
			
 
				+    'browser_find_text',
			
 
				+    'browser_screenshot',
			
 
				 
			
 
				     # 标签页管理工具
			
 
				-    'switch_tab',
			
 
				-    'close_tab',
			
 
				+    'browser_switch_tab',
			
 
				+    'browser_close_tab',
			
 
				 
			
 
				     # 下拉框工具
			
 
				-    'get_dropdown_options',
			
 
				-    'select_dropdown_option',
			
 
				+    'browser_get_dropdown_options',
			
 
				+    'browser_select_dropdown_option',
			
 
				 
			
 
				     # 内容提取工具
			
 
				-    'extract_content',
			
 
				-    'get_page_html',
			
 
				-    'get_selector_map',
			
 
				+    'browser_extract_content',
			
 
				+    'browser_get_page_html',
			
 
				+    'browser_get_selector_map',
			
 
				 
			
 
				     # JavaScript 执行工具
			
 
				-    'evaluate',
			
 
				-    'ensure_login_with_cookies',
			
 
				+    'browser_evaluate',
			
 
				+    'browser_ensure_login_with_cookies',
			
 
				 
			
 
				     # 等待用户操作
			
 
				-    'wait_for_user_action',
			
 
				+    'browser_wait_for_user_action',
			
 
				 
			
 
				     # 任务完成
			
 
				-    'done',
			
 
				-
			
 
				-    # 容器管理
			
 
				-    'create_container',
			
 
				+    'browser_done',
			
 
				 ]
			
--- a/agent/tools/builtin/goal.py
+++ b/agent/tools/builtin/goal.py
@@ -40,13 +40,14 @@ async def goal(
 
				         reason: 创建理由（逗号分隔多个，与 add 一一对应）。说明为什么要做这些目标。
			
 
				         done: 完成当前目标，值为 summary
			
 
				         abandon: 放弃当前目标，值为原因（会触发 context 压缩）
			
 
				-        focus: 切换焦点到指定 id（可以是内部 ID 或显示 ID）
			
 
				+        focus: 切换焦点到指定 ID（如 "1", "2.1", "2.2"）
			
 
				         context: 工具执行上下文（包含 store 和 trace_id）
			
 
				 
			
 
				     Examples:
			
 
				         goal(add="分析代码, 实现功能, 测试", reason="了解现有结构, 完成需求, 确保质量")
			
 
				         goal(focus="2", add="设计接口, 实现代码", reason="明确API规范, 编写核心逻辑")
			
 
				         goal(done="发现用户模型在 models/user.py")
			
 
				+        goal(done="已完成调研", focus="2")
			
 
				         goal(abandon="方案A需要Redis，环境没有", add="实现方案B", reason="使用现有技术栈")
			
 
				 
			
 
				     Returns:
			
--- a/docs/ref/skills.md
+++ b/docs/ref/skills.md
@@ -0,0 +1,31 @@
 
				+Skill structure
			
 
				+Every Skill requires a SKILL.md file with YAML frontmatter:
			
 
				+
			
 
				+---
			
 
				+name: your-skill-name
			
 
				+description: Brief description of what this Skill does and when to use it
			
 
				+---
			
 
				+
			
 
				+# Your Skill Name
			
 
				+
			
 
				+## Instructions
			
 
				+[Clear, step-by-step guidance for Claude to follow]
			
 
				+
			
 
				+## Examples
			
 
				+[Concrete examples of using this Skill]
			
 
				+Required fields: name and description
			
 
				+
			
 
				+Field requirements:
			
 
				+
			
 
				+name:
			
 
				+
			
 
				+Maximum 64 characters
			
 
				+Must contain only lowercase letters, numbers, and hyphens
			
 
				+Cannot contain XML tags
			
 
				+Cannot contain reserved words: "anthropic", "claude"
			
 
				+description:
			
 
				+
			
 
				+Must be non-empty
			
 
				+Maximum 1024 characters
			
 
				+Cannot contain XML tags
			
 
				+The description should include both what the Skill does and when Claude should use it. For complete authoring guidance, see the best practices guide.
			
--- a/examples/cloud_browser_demo_db.py
+++ b/examples/cloud_browser_demo_db.py
@@ -22,11 +22,11 @@ from agent.tools.builtin.browser.baseClass import (
 
				     init_browser_session,
			
 
				     cleanup_browser_session,
			
 
				     kill_browser_session,
			
 
				-    navigate_to_url,
			
 
				-    scroll_page,
			
 
				-    evaluate,
			
 
				-    wait,
			
 
				-    get_page_html,
			
 
				+    browser_navigate_to_url,
			
 
				+    browser_scroll_page,
			
 
				+    browser_evaluate,
			
 
				+    browser_wait,
			
 
				+    browser_get_page_html,
			
 
				     _fetch_cookie_row,
			
 
				     _fetch_profile_id,
			
 
				     _normalize_cookies,
			
@@ -102,10 +102,10 @@ async def example_xhs_fitness_search(cookie_type: str = "xhs") -> dict:
 
				 
			
 
				             # 访问首页
			
 
				             print("\n🏠 访问小红书首页...")
			
 
				-            nav_result = await navigate_to_url("https://www.xiaohongshu.com")
			
 
				+            nav_result = await browser_navigate_to_url("https://www.xiaohongshu.com")
			
 
				             if nav_result.error:
			
 
				                 raise RuntimeError(nav_result.error)
			
 
				-            await wait(3)
			
 
				+            await browser_wait(3)
			
 
				 
			
 
				             # 注入 Cookie（如果有）
			
 
				             if cookie_row:
			
@@ -119,7 +119,7 @@ async def example_xhs_fitness_search(cookie_type: str = "xhs") -> dict:
 
				                         print(f"✅ 成功注入 {len(cookies)} 个 Cookie")
			
 
				                         # 刷新页面使 Cookie 生效
			
 
				                         await navigate_to_url("https://www.xiaohongshu.com")
			
 
				-                        await wait(2)
			
 
				+                        await browser_wait(2)
			
 
				                     else:
			
 
				                         print("⚠️  Cookie 解析失败")
			
 
				                 else:
			
@@ -127,20 +127,20 @@ async def example_xhs_fitness_search(cookie_type: str = "xhs") -> dict:
 
				 
			
 
				             # 访问搜索页面
			
 
				             print(f"\n🔗 访问搜索页面: {keyword}")
			
 
				-            nav_result = await navigate_to_url(search_url)
			
 
				+            nav_result = await browser_navigate_to_url(search_url)
			
 
				             if nav_result.error:
			
 
				                 raise RuntimeError(nav_result.error)
			
 
				-            await wait(8)
			
 
				+            await browser_wait(8)
			
 
				 
			
 
				             # 滚动页面
			
 
				             print("\n📜 滚动页面...")
			
 
				             for i in range(3):
			
 
				-                await scroll_page(down=True, pages=2.0)
			
 
				-                await wait(2)
			
 
				+                await browser_scroll_page(down=True, pages=2.0)
			
 
				+                await browser_wait(2)
			
 
				 
			
 
				             # 提取数据
			
 
				             print("\n🔍 提取数据...")
			
 
				-            html_result = await get_page_html()
			
 
				+            html_result = await browser_get_page_html()
			
 
				             if html_result.error:
			
 
				                 raise RuntimeError(html_result.error)
			
 
				             html = html_result.metadata.get("html", "")
			
@@ -223,7 +223,7 @@ async def example_xhs_fitness_search(cookie_type: str = "xhs") -> dict:
 
				             extract_js = extract_js.replace("__KEYWORD__", json.dumps(keyword, ensure_ascii=False))
			
 
				 
			
 
				             async def run_extract() -> dict:
			
 
				-                result = await evaluate(extract_js)
			
 
				+                result = await browser_evaluate(extract_js)
			
 
				                 if result.error:
			
 
				                     raise RuntimeError(result.error)
			
 
				                 output = result.output
			
@@ -253,7 +253,7 @@ async def example_xhs_fitness_search(cookie_type: str = "xhs") -> dict:
 
				                     }
			
 
				 
			
 
				                 if isinstance(data, dict) and data.get("count", 0) == 0:
			
 
				-                    html_result = await get_page_html()
			
 
				+                    html_result = await browser_get_page_html()
			
 
				                     if html_result.error:
			
 
				                         raise RuntimeError(html_result.error)
			
 
				                     html = html_result.metadata.get("html", "")
			
--- a/examples/research/run.py
+++ b/examples/research/run.py
@@ -0,0 +1,164 @@
 
				+"""
			
 
				+浏览器调研示例
			
 
				+
			
 
				+使用 Agent 模式 + 浏览器工具进行网络调研
			
 
				+"""
			
 
				+
			
 
				+import os
			
 
				+import sys
			
 
				+import asyncio
			
 
				+from pathlib import Path
			
 
				+
			
 
				+# 添加项目根目录到 Python 路径
			
 
				+sys.path.insert(0, str(Path(__file__).parent.parent.parent))
			
 
				+
			
 
				+from dotenv import load_dotenv
			
 
				+load_dotenv()
			
 
				+
			
 
				+from agent.llm.prompts import SimplePrompt
			
 
				+from agent.core.runner import AgentRunner
			
 
				+from agent.execution import (
			
 
				+    FileSystemTraceStore,
			
 
				+    Trace,
			
 
				+    Message,
			
 
				+)
			
 
				+from agent.llm import create_openrouter_llm_call
			
 
				+
			
 
				+
			
 
				+async def main():
			
 
				+    # 路径配置
			
 
				+    base_dir = Path(__file__).parent
			
 
				+    project_root = base_dir.parent.parent
			
 
				+    prompt_path = base_dir / "test.prompt"
			
 
				+    output_dir = base_dir / "output"
			
 
				+    output_dir.mkdir(exist_ok=True)
			
 
				+
			
 
				+    # Skills 目录（可选：用户自定义 skills）
			
 
				+    # 注意：内置 skills（agent/skills/core.md）会自动加载
			
 
				+    skills_dir = None  # 或者指定自定义 skills 目录，如: project_root / "skills"
			
 
				+
			
 
				+    print("=" * 60)
			
 
				+    print("浏览器调研任务 (Agent 模式)")
			
 
				+    print("=" * 60)
			
 
				+    print()
			
 
				+
			
 
				+    # 1. 加载 prompt
			
 
				+    print("1. 加载 prompt...")
			
 
				+    prompt = SimplePrompt(prompt_path)
			
 
				+
			
 
				+    # 提取配置
			
 
				+    system_prompt = prompt._messages.get("system", "")
			
 
				+    user_task = prompt._messages.get("user", "")
			
 
				+    model_name = prompt.config.get('model', 'gemini-2.5-flash')
			
 
				+    temperature = float(prompt.config.get('temperature', 0.3))
			
 
				+
			
 
				+    print(f"   - 任务: {user_task[:80]}...")
			
 
				+    print(f"   - 模型: {model_name}")
			
 
				+
			
 
				+    # 2. 构建消息
			
 
				+    print("2. 构建任务消息...")
			
 
				+    messages = prompt.build_messages()
			
 
				+
			
 
				+    # 3. 创建 Agent Runner（配置 skills 和浏览器工具）
			
 
				+    print("3. 创建 Agent Runner...")
			
 
				+    print(f"   - Skills 目录: {skills_dir}")
			
 
				+    print(f"   - 模型: {model_name} (via OpenRouter)")
			
 
				+
			
 
				+    # 使用 OpenRouter 的 Gemini 模型
			
 
				+    runner = AgentRunner(
			
 
				+        trace_store=FileSystemTraceStore(base_path=".trace"),
			
 
				+        llm_call=create_openrouter_llm_call(model=f"google/{model_name}"),
			
 
				+        skills_dir=skills_dir,
			
 
				+        debug=True  # 启用 debug，输出到 .trace/
			
 
				+    )
			
 
				+
			
 
				+    # 4. Agent 模式执行
			
 
				+    print(f"4. 启动 Agent 模式...")
			
 
				+    print()
			
 
				+
			
 
				+    final_response = ""
			
 
				+    current_trace_id = None
			
 
				+
			
 
				+    async for item in runner.run(
			
 
				+        task=user_task,
			
 
				+        messages=messages,
			
 
				+        system_prompt=system_prompt,
			
 
				+        model=f"google/{model_name}",
			
 
				+        temperature=temperature,
			
 
				+        max_iterations=20,  # 调研任务可能需要更多迭代
			
 
				+    ):
			
 
				+        # 处理 Trace 对象（整体状态变化）
			
 
				+        if isinstance(item, Trace):
			
 
				+            current_trace_id = item.trace_id
			
 
				+            if item.status == "running":
			
 
				+                print(f"[Trace] 开始: {item.trace_id[:8]}")
			
 
				+            elif item.status == "completed":
			
 
				+                print(f"[Trace] 完成")
			
 
				+                print(f"  - Total messages: {item.total_messages}")
			
 
				+                print(f"  - Total tokens: {item.total_tokens}")
			
 
				+                print(f"  - Total cost: ${item.total_cost:.4f}")
			
 
				+            elif item.status == "failed":
			
 
				+                print(f"[Trace] 失败: {item.error_message}")
			
 
				+
			
 
				+        # 处理 Message 对象（执行过程）
			
 
				+        elif isinstance(item, Message):
			
 
				+            if item.role == "assistant":
			
 
				+                content = item.content
			
 
				+                if isinstance(content, dict):
			
 
				+                    text = content.get("text", "")
			
 
				+                    tool_calls = content.get("tool_calls")
			
 
				+
			
 
				+                    if text and not tool_calls:
			
 
				+                        # 纯文本回复（最终响应）
			
 
				+                        final_response = text
			
 
				+                        print(f"[Response] Agent 完成")
			
 
				+                    elif text:
			
 
				+                        print(f"[Assistant] {text[:100]}...")
			
 
				+
			
 
				+                    if tool_calls:
			
 
				+                        for tc in tool_calls:
			
 
				+                            tool_name = tc.get("function", {}).get("name", "unknown")
			
 
				+                            print(f"[Tool Call] {tool_name}")
			
 
				+
			
 
				+            elif item.role == "tool":
			
 
				+                content = item.content
			
 
				+                if isinstance(content, dict):
			
 
				+                    tool_name = content.get("tool_name", "unknown")
			
 
				+                    print(f"[Tool Result] {tool_name}")
			
 
				+                if item.description:
			
 
				+                    desc = item.description[:80] if len(item.description) > 80 else item.description
			
 
				+                    print(f"  {desc}...")
			
 
				+
			
 
				+    # 5. 输出结果
			
 
				+    print()
			
 
				+    print("=" * 60)
			
 
				+    print("Agent 响应:")
			
 
				+    print("=" * 60)
			
 
				+    print(final_response)
			
 
				+    print("=" * 60)
			
 
				+    print()
			
 
				+
			
 
				+    # 6. 保存结果
			
 
				+    output_file = output_dir / "research_result.txt"
			
 
				+    with open(output_file, 'w', encoding='utf-8') as f:
			
 
				+        f.write(final_response)
			
 
				+
			
 
				+    print(f"✓ 结果已保存到: {output_file}")
			
 
				+    print()
			
 
				+
			
 
				+    # 提示使用 API 可视化
			
 
				+    print("=" * 60)
			
 
				+    print("可视化 Step Tree:")
			
 
				+    print("=" * 60)
			
 
				+    print("1. 启动 API Server:")
			
 
				+    print("   python3 api_server.py")
			
 
				+    print()
			
 
				+    print("2. 浏览器访问:")
			
 
				+    print("   http://localhost:8000/api/traces")
			
 
				+    print()
			
 
				+    print(f"3. Trace ID: {current_trace_id}")
			
 
				+    print("=" * 60)
			
 
				+
			
 
				+
			
 
				+if __name__ == "__main__":
			
 
				+    asyncio.run(main())
			
--- a/examples/research/test.prompt
+++ b/examples/research/test.prompt
@@ -0,0 +1,11 @@
 
				+---
			
 
				+model: gemini-2.5-flash
			
 
				+temperature: 0.3
			
 
				+---
			
 
				+
			
 
				+$system$
			
 
				+你是最顶尖的AI助手，可以拆分并调用工具逐步解决复杂问题。
			
 
				+
			
 
				+$user$
			
 
				+使用浏览器帮我做个调研：一张图片中的构图可以如何表示？我希望寻找一些构图特征的表示方法。
			
 
				+注意使用explore工具，在合适的时候调用多个分支并行探索。
			
--- a/examples/test_tools_baidu.py
+++ b/examples/test_tools_baidu.py
@@ -10,11 +10,11 @@ sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
 
				 
			
 
				 from agent.tools.builtin.browser.baseClass import (
			
 
				     init_browser_session,
			
 
				-    navigate_to_url,
			
 
				-    wait,
			
 
				-    get_page_html,
			
 
				-    evaluate,
			
 
				-    scroll_page,
			
 
				+    browser_navigate_to_url,
			
 
				+    browser_wait,
			
 
				+    browser_get_page_html,
			
 
				+    browser_evaluate,
			
 
				+    browser_scroll_page,
			
 
				     cleanup_browser_session,
			
 
				 )
			
 
				 
			
@@ -30,15 +30,15 @@ async def run_task():
 
				     try:
			
 
				         await init_browser_session(headless=False, profile_name="baidu_profile")
			
 
				 
			
 
				-        await navigate_to_url("https://www.baidu.com")
			
 
				-        await wait(seconds=2)
			
 
				+        await browser_navigate_to_url("https://www.baidu.com")
			
 
				+        await browser_wait(seconds=2)
			
 
				 
			
 
				         keyword = "Python 教程"
			
 
				         search_url = f"https://www.baidu.com/s?wd={quote(keyword)}"
			
 
				-        await navigate_to_url(search_url)
			
 
				-        await wait(seconds=3)
			
 
				-        await scroll_page(down=True, pages=1.0)
			
 
				-        await wait(seconds=2)
			
 
				+        await browser_navigate_to_url(search_url)
			
 
				+        await browser_wait(seconds=3)
			
 
				+        await browser_scroll_page(down=True, pages=1.0)
			
 
				+        await browser_wait(seconds=2)
			
 
				 
			
 
				         extract_js = """
			
 
				         (function(){
			
@@ -84,7 +84,7 @@ async def run_task():
 
				         })()
			
 
				         """
			
 
				 
			
 
				-        result = await evaluate(code=extract_js)
			
 
				+        result = await browser_evaluate(code=extract_js)
			
 
				         output = result.output
			
 
				         if output.startswith("Result: "):
			
 
				             output = output[8:]
			
@@ -103,7 +103,7 @@ async def run_task():
 
				         with open(json_file, "w", encoding="utf-8") as f:
			
 
				             json.dump(data, f, ensure_ascii=False, indent=2)
			
 
				 
			
 
				-        html_result = await get_page_html()
			
 
				+        html_result = await browser_get_page_html()
			
 
				         html_content = html_result.metadata.get("html", "")
			
 
				         page_url = html_result.metadata.get("url", "")
			
 
				         page_title = html_result.metadata.get("title", "")
			
--- a/examples/test_xhs_container.py
+++ b/examples/test_xhs_container.py
@@ -1,12 +1,10 @@
 
				 """
			
 
				 小红书容器测试脚本
			
 
				-根据 test.md 要求实现：
			
 
				-1. 创建容器并导航到小红书
			
 
				-2. 初始化浏览器会话
			
 
				-3. 切换到指定窗口
			
 
				-4. 搜索健身
			
 
				-5. 随机进入一个详情页
			
 
				-6. 获取详情页的HTML和iframe并保存到output
			
 
				+演示容器浏览器的使用：
			
 
				+1. 初始化容器浏览器（自动创建容器并连接）
			
 
				+2. 搜索健身
			
 
				+3. 随机进入一个详情页
			
 
				+4. 获取详情页的HTML和iframe并保存到output
			
 
				 """
			
 
				 
			
 
				 import sys
			
@@ -25,14 +23,14 @@ project_root = Path(__file__).parent.parent
 
				 sys.path.insert(0, str(project_root))
			
 
				 
			
 
				 from agent.tools.builtin.browser.baseClass import (
			
 
				-    create_container,
			
 
				     init_browser_session,
			
 
				     cleanup_browser_session,
			
 
				-    navigate_to_url,
			
 
				-    scroll_page,
			
 
				-    evaluate,
			
 
				-    wait,
			
 
				-    get_page_html,
			
 
				+    browser_navigate_to_url,
			
 
				+    browser_scroll_page,
			
 
				+    browser_evaluate,
			
 
				+    browser_wait,
			
 
				+    browser_get_page_html,
			
 
				+    browser_switch_tab,
			
 
				 )
			
 
				 
			
 
				 
			
@@ -52,83 +50,41 @@ async def test_xhs_container():
 
				     output_dir.mkdir(parents=True, exist_ok=True)
			
 
				 
			
 
				     try:
			
 
				-        # 步骤1: 创建容器并导航到小红书
			
 
				-        container_info = await create_container(url="https://www.xiaohongshu.com")
			
 
				-
			
 
				-        if not container_info["success"]:
			
 
				-            raise RuntimeError(f"容器创建失败: {container_info['error']}")
			
 
				-
			
 
				-        cdp_url = container_info["cdp"]
			
 
				-        container_id = container_info["container_id"]
			
 
				-        connection_id = container_info.get("connection_id")
			
 
				-
			
 
				-        print(f"\n📋 容器信息:")
			
 
				-        print(f"   CDP URL: {cdp_url}")
			
 
				-        print(f"   Container ID: {container_id}")
			
 
				-        print(f"   Connection ID: {connection_id}")
			
 
				-
			
 
				-        # 等待容器完全启动
			
 
				-        print(f"\n⏳ 等待容器启动...")
			
 
				-        await asyncio.sleep(3)
			
 
				-
			
 
				-        # 步骤2: 初始化浏览器会话
			
 
				-        print(f"\n🌐 初始化浏览器会话...")
			
 
				+        # 初始化容器浏览器（一步完成）
			
 
				+        print(f"\n🚀 初始化容器浏览器...")
			
 
				         browser, tools = await init_browser_session(
			
 
				-            headless=True,
			
 
				-            cdp_url=cdp_url
			
 
				+            browser_type="container",
			
 
				+            url="https://www.xiaohongshu.com",  # 容器启动时访问的URL
			
 
				+            headless=True
			
 
				         )
			
 
				 
			
 
				-        if browser is None or tools is None:
			
 
				-            raise RuntimeError("浏览器初始化失败")
			
 
				-
			
 
				-        print("✅ 浏览器会话初始化成功")
			
 
				-
			
 
				-        # 步骤3: 如果有 connection_id，切换到对应窗口
			
 
				-        if connection_id:
			
 
				-            print(f"\n🔄 切换到窗口: {connection_id}")
			
 
				-            await wait(2)
			
 
				-
			
 
				-            # 获取当前浏览器状态
			
 
				-            try:
			
 
				-                state = await browser.get_browser_state_summary(cached=False)
			
 
				-                print(f"   当前标签页数: {len(state.tabs)}")
			
 
				-                for tab in state.tabs:
			
 
				-                    print(f"   - Tab ID: {tab.target_id[-4:]}, URL: {tab.url}")
			
 
				-
			
 
				-                # 尝试切换到 connection_id 对应的标签页
			
 
				-                # connection_id 可能是完整ID，取最后4位
			
 
				-                from agent.tools.builtin.browser.baseClass import switch_tab
			
 
				-                await switch_tab(connection_id[-4:] if len(connection_id) > 4 else connection_id)
			
 
				-                await wait(2)
			
 
				-                print(f"✅ 已切换到窗口")
			
 
				-            except Exception as e:
			
 
				-                print(f"⚠️  切换窗口警告: {str(e)[:100]}")
			
 
				-                print(f"   将继续使用当前窗口")
			
 
				+        print("✅ 容器浏览器初始化成功")
			
 
				 
			
 
				-        await wait(3)
			
 
				+        # 等待页面完全加载
			
 
				+        await browser_wait(3)
			
 
				 
			
 
				-        # 步骤4: 搜索健身
			
 
				+        # 步骤1: 搜索健身
			
 
				         print(f"\n🔍 搜索关键词: {keyword}")
			
 
				         try:
			
 
				-            nav_result = await navigate_to_url(search_url)
			
 
				+            nav_result = await browser_navigate_to_url(search_url)
			
 
				             if nav_result.error:
			
 
				                 print(f"⚠️  导航警告: {nav_result.error[:100]}")
			
 
				         except Exception as e:
			
 
				             print(f"⚠️  导航异常: {str(e)[:100]}")
			
 
				 
			
 
				-        await wait(10)
			
 
				+        await browser_wait(10)
			
 
				 
			
 
				         # 滚动页面加载更多内容
			
 
				         print("\n📜 滚动页面...")
			
 
				         for i in range(2):
			
 
				-            await scroll_page(down=True, pages=2.0)
			
 
				-            await wait(2)
			
 
				+            await browser_scroll_page(down=True, pages=2.0)
			
 
				+            await browser_wait(2)
			
 
				 
			
 
				         # 提取搜索结果
			
 
				         print("\n🔍 提取搜索结果...")
			
 
				 
			
 
				         # 先保存HTML看看页面内容
			
 
				-        html_result = await get_page_html()
			
 
				+        html_result = await browser_get_page_html()
			
 
				         if not html_result.error:
			
 
				             html = html_result.metadata.get("html", "")
			
 
				             debug_html_path = output_dir / "search_page_debug.html"
			
@@ -155,7 +111,7 @@ async def test_xhs_container():
 
				         })()
			
 
				         """
			
 
				 
			
 
				-        eval_result = await evaluate(extract_js)
			
 
				+        eval_result = await browser_evaluate(extract_js)
			
 
				         if eval_result.error:
			
 
				             raise RuntimeError(f"提取搜索结果失败: {eval_result.error}")
			
 
				 
			
@@ -170,7 +126,7 @@ async def test_xhs_container():
 
				 
			
 
				         print(f"✅ 找到 {len(posts)} 个帖子")
			
 
				 
			
 
				-        # 步骤5: 随机进入一个详情页
			
 
				+        # 步骤2: 随机进入一个详情页
			
 
				         selected_post = random.choice(posts)
			
 
				         post_url = selected_post["link"]
			
 
				 
			
@@ -178,23 +134,23 @@ async def test_xhs_container():
 
				         print(f"🔗 访问帖子详情页: {post_url}")
			
 
				 
			
 
				         try:
			
 
				-            nav_result = await navigate_to_url(post_url)
			
 
				+            nav_result = await browser_navigate_to_url(post_url)
			
 
				             if nav_result.error:
			
 
				                 print(f"⚠️  导航警告: {nav_result.error[:100]}")
			
 
				         except Exception as e:
			
 
				             print(f"⚠️  导航异常: {str(e)[:100]}")
			
 
				 
			
 
				-        await wait(8)
			
 
				+        await browser_wait(8)
			
 
				 
			
 
				         # 滚动详情页
			
 
				         print("\n📜 滚动详情页...")
			
 
				         for i in range(3):
			
 
				-            await scroll_page(down=True, pages=1.5)
			
 
				-            await wait(2)
			
 
				+            await browser_scroll_page(down=True, pages=1.5)
			
 
				+            await browser_wait(2)
			
 
				 
			
 
				-        # 步骤6: 保存详情页HTML
			
 
				+        # 步骤3: 保存详情页HTML
			
 
				         print("\n💾 保存详情页 HTML...")
			
 
				-        html_result = await get_page_html()
			
 
				+        html_result = await browser_get_page_html()
			
 
				         if html_result.error:
			
 
				             print(f"⚠️  获取HTML失败: {html_result.error}")
			
 
				         else:
			
@@ -221,7 +177,7 @@ async def test_xhs_container():
 
				         })()
			
 
				         """
			
 
				 
			
 
				-        iframe_result = await evaluate(iframe_js)
			
 
				+        iframe_result = await browser_evaluate(iframe_js)
			
 
				         if not iframe_result.error:
			
 
				             iframe_output = iframe_result.output
			
 
				             if isinstance(iframe_output, str) and iframe_output.startswith("Result: "):
			
@@ -251,7 +207,7 @@ async def test_xhs_container():
 
				                         }})()
			
 
				                         """
			
 
				 
			
 
				-                        iframe_html_result = await evaluate(get_iframe_html_js)
			
 
				+                        iframe_html_result = await browser_evaluate(get_iframe_html_js)
			
 
				                         if not iframe_html_result.error:
			
 
				                             iframe_html = iframe_html_result.output
			
 
				                             if isinstance(iframe_html, str) and iframe_html.startswith("Result: "):