Просмотр исходного кода

添加了飞书消息返回,并将默认模型改成qwen3.5-flash

kevin.yang 3 дня назад
Родитель
Commit
9c6f9d6124

+ 3 - 3
agent/core/runner.py

@@ -100,7 +100,7 @@ class RunConfig:
     分为模型层参数(由上游 agent 或用户决定)和框架层参数(由系统注入)。
     """
     # --- 模型层参数 ---
-    model: str = "gpt-4o"
+    model: str = "qwen3.5-flash"
     temperature: float = 0.3
     max_iterations: int = 200
     tools: Optional[List[str]] = None          # None = 全部已注册工具
@@ -459,7 +459,7 @@ class AgentRunner:
     async def call(
         self,
         messages: List[Dict],
-        model: str = "gpt-4o",
+        model: str = "qwen3.5-flash",
         tools: Optional[List[str]] = None,
         uid: Optional[str] = None,
         trace: bool = True,
@@ -2521,7 +2521,7 @@ class AgentRunner:
                         {"role": "system", "content": TASK_NAME_GENERATION_SYSTEM_PROMPT},
                         {"role": "user", "content": raw_text[:2000]},
                     ],
-                    model="gpt-4o-mini",  # 使用便宜模型
+                    model="qwen3.5-flash",
                 )
                 title = result.get("content", "").strip()
                 if title and len(title) < 100:

+ 2 - 2
agent/tools/builtin/subagent.py

@@ -488,7 +488,7 @@ async def _run_agents(
             config=_make_run_config(
                 trace_id=cur_stid,
                 agent_type=agent_type or ("delegate" if single else "explore"),
-                model=parent_trace.model if parent_trace else "gpt-4o",
+                model=parent_trace.model if parent_trace else "qwen3.5-flash",
                 uid=parent_trace.uid if parent_trace else None,
                 tools=allowed_tools,
                 name=task_item[:50],
@@ -779,7 +779,7 @@ async def evaluate(
             config=_make_run_config(
                 trace_id=sub_trace_id,
                 agent_type="evaluate",
-                model=parent_trace.model if parent_trace else "gpt-4o",
+                model=parent_trace.model if parent_trace else "qwen3.5-flash",
                 uid=parent_trace.uid if parent_trace else None,
                 tools=allowed_tools,
                 name=f"评估: {goal_id}",

+ 3 - 3
agent/trace/run_api.py

@@ -61,7 +61,7 @@ class CreateRequest(BaseModel):
         ...,
         description="OpenAI SDK 格式的输入消息。可包含 system + user 消息;若无 system 消息则从 skills 自动构建",
     )
-    model: str = Field("gpt-4o", description="模型名称")
+    model: str = Field("qwen3.5-flash", description="模型名称")
     temperature: float = Field(0.3)
     max_iterations: int = Field(200)
     tools: Optional[List[str]] = Field(None, description="工具白名单(None = 全部)")
@@ -486,7 +486,7 @@ async def reflect_trace(trace_id: str, req: ReflectRequest):
     # 使用 force_side_branch 触发反思侧分支
     config = RunConfig(
         trace_id=trace_id,
-        model=trace.model or "gpt-4o",
+        model=trace.model or "qwen3.5-flash",
         force_side_branch=["reflection"],  # 使用列表格式
         max_iterations=20,  # 给侧分支足够的轮次
         enable_prompt_caching=True,
@@ -534,7 +534,7 @@ async def compact_trace(trace_id: str):
     # 使用 force_side_branch 触发压缩侧分支
     config = RunConfig(
         trace_id=trace_id,
-        model=trace.model or "gpt-4o",
+        model=trace.model or "qwen3.5-flash",
         force_side_branch=["compression"],  # 使用列表格式
         max_iterations=20,  # 给侧分支足够的轮次
         enable_prompt_caching=True,

+ 2 - 2
api_server.py

@@ -70,11 +70,11 @@ set_upload_trace_store(trace_store)
 # 如需启用 POST /api/traces(新建/运行/停止/反思),取消以下注释并配置 LLM:
 
 from agent.core.runner import AgentRunner
-from agent.llm import create_openrouter_llm_call
+from agent.llm import create_qwen_llm_call
 
 runner = AgentRunner(
     trace_store=trace_store,
-    llm_call=create_openrouter_llm_call(model="anthropic/claude-sonnet-4.5"),
+    llm_call=create_qwen_llm_call(model='qwen3.5-flash'),
 )
 set_runner(runner)
 

+ 246 - 5
gateway/core/channels/feishu/http_run_executor.py

@@ -1,14 +1,15 @@
 """
-飞书执行器:通过 HTTP 调用 Agent 的 ``run_api``(``POST /api/traces`` / ``POST /api/traces/{id}/run``)。
-
-按飞书 ``user_id``(与 ``DefaultUserIdentityResolver`` 一致)维护 API ``trace_id``,与首次创建 / 续跑语义对齐。
+飞书执行器:通过 HTTP 调用 Agent 的 ``run_api``,并在后台轮询 ``GET /api/traces/{id}/messages``
+将主路径上每一条 assistant 消息转发到飞书。
 """
 
 from __future__ import annotations
 
 import asyncio
 import logging
+import time
 import uuid
+from copy import copy
 from typing import Any
 
 import httpx
@@ -17,6 +18,14 @@ from gateway.core.channels.feishu.types import FeishuReplyContext, IncomingFeish
 
 logger = logging.getLogger(__name__)
 
+_TERMINAL_STATUSES = frozenset({"completed", "failed", "stopped"})
+
+# 同一 trace 仅一个轮询任务,避免并发重复推送
+_poll_tasks: dict[str, asyncio.Task[None]] = {}
+_poll_tasks_lock = asyncio.Lock()
+# trace_id → 已成功推送到飞书的 assistant sequence(跨多次 run,避免重复发送)
+_assistant_sent_sequences: dict[str, set[int]] = {}
+
 
 def _format_api_error(status_code: int, body_text: str) -> str:
     try:
@@ -58,8 +67,215 @@ def _append_feishu_context_block(
     return "\n".join(lines)
 
 
+def _assistant_wire_to_feishu_text(msg: dict[str, Any]) -> str | None:
+    """从 ``GET .../messages`` 返回的单条消息 dict 提取可发给用户的文本;无可展示内容则返回 None。"""
+    if msg.get("role") != "assistant":
+        return None
+    content = msg.get("content")
+    parts: list[str] = []
+
+    if isinstance(content, dict):
+        text = (content.get("text") or "").strip()
+        if text:
+            parts.append(text)
+        tool_calls = content.get("tool_calls")
+        if tool_calls:
+            desc = (msg.get("description") or "").strip()
+            parts.append(desc if desc else "[工具调用]")
+    elif isinstance(content, str) and content.strip():
+        parts.append(content.strip())
+    else:
+        desc = (msg.get("description") or "").strip()
+        if desc:
+            parts.append(desc)
+
+    if not parts:
+        return None
+    return "\n".join(parts)
+
+
+def _truncate_for_im(text: str, max_chars: int) -> str:
+    if len(text) <= max_chars:
+        return text
+    return text[: max_chars - 80] + "\n\n…(内容过长已截断)"
+
+
+def _message_sequence(msg: dict[str, Any]) -> int | None:
+    s = msg.get("sequence")
+    if s is None:
+        return None
+    if isinstance(s, int):
+        return s
+    if isinstance(s, float):
+        return int(s)
+    if isinstance(s, str):
+        try:
+            return int(s)
+        except ValueError:
+            return None
+    try:
+        return int(s)
+    except (TypeError, ValueError):
+        return None
+
+
async def _poll_assistants_to_feishu(
    *,
    agent_base_url: str,
    trace_id: str,
    reply_ctx: FeishuReplyContext,
    connector: Any,
    poll_interval: float,
    poll_request_timeout: float,
    terminal_grace_rounds: int,
    poll_max_seconds: float,
    max_text_chars: int,
) -> None:
    """Poll trace status and main-path messages; forward each not-yet-sent
    assistant message to Feishu in ``sequence`` order.

    Polls ``GET {base}/api/traces/{id}`` for status and
    ``GET {base}/api/traces/{id}/messages?mode=main_path`` for messages every
    ``poll_interval`` seconds.  Stops when the trace is gone (404), when the
    status has been terminal for ``terminal_grace_rounds`` consecutive rounds,
    or when ``poll_max_seconds`` (> 0) has elapsed.  Send failures are logged
    and the sequence is NOT marked sent, so delivery is retried next round.

    NOTE(review): ``_assistant_sent_sequences[trace_id]`` is never removed
    here, so the per-trace sent-set survives the poller — intentional for
    dedup across runs, but unbounded across distinct traces.
    """
    # Per-trace set of sequences already delivered (shared across pollers
    # of the same trace so a restarted run does not re-send old messages).
    if trace_id not in _assistant_sent_sequences:
        _assistant_sent_sequences[trace_id] = set()
    sent_sequences = _assistant_sent_sequences[trace_id]
    grace = 0  # consecutive rounds observed in a terminal status
    started = time.monotonic()
    base = agent_base_url.rstrip("/")

    try:
        while True:
            # Hard wall-clock cap; 0 (default) means poll indefinitely.
            if poll_max_seconds > 0 and (time.monotonic() - started) >= poll_max_seconds:
                logger.warning(
                    "feishu poll: trace_id=%s stopped by poll_max_seconds=%s",
                    trace_id,
                    poll_max_seconds,
                )
                break

            # Assume running when the status request fails, so transient
            # API errors do not end the poll prematurely.
            status = "running"
            try:
                # Fresh client per round keeps each iteration self-contained;
                # connections are closed even if an iteration errors out.
                async with httpx.AsyncClient(timeout=poll_request_timeout) as client:
                    tr = await client.get(f"{base}/api/traces/{trace_id}")
                    if tr.status_code == 404:
                        # Trace deleted or never existed — nothing to poll.
                        logger.warning("feishu poll: trace %s not found, stop", trace_id)
                        break
                    if tr.status_code >= 400:
                        logger.warning(
                            "feishu poll: GET trace failed status=%s body=%s",
                            tr.status_code,
                            tr.text[:300],
                        )
                    else:
                        data = tr.json()
                        trace_obj = data.get("trace") or {}
                        status = str(trace_obj.get("status") or "running")

                    # Even on a failed status fetch, still try to drain
                    # messages this round.
                    ms = await client.get(
                        f"{base}/api/traces/{trace_id}/messages",
                        params={"mode": "main_path"},
                    )
                    if ms.status_code != 200:
                        logger.warning(
                            "feishu poll: GET messages failed status=%s",
                            ms.status_code,
                        )
                    else:
                        payload = ms.json()
                        raw_list = payload.get("messages") or []
                        assistants = [
                            m
                            for m in raw_list
                            if isinstance(m, dict) and m.get("role") == "assistant"
                        ]
                        # Deliver in sequence order; missing sequences sort
                        # first (treated as 0) but are skipped below anyway.
                        assistants.sort(key=lambda m: (_message_sequence(m) or 0))

                        for m in assistants:
                            seq = _message_sequence(m)
                            if seq is None:
                                # Cannot dedup without a sequence — skip.
                                continue
                            if seq in sent_sequences:
                                continue
                            body = _assistant_wire_to_feishu_text(m)
                            if body is None:
                                # Nothing displayable; mark sent so it is
                                # not re-examined every round.
                                sent_sequences.add(seq)
                                continue
                            body = _truncate_for_im(body, max_text_chars)
                            try:
                                result = await connector.send_text(reply_ctx, body)
                                if result.get("ok"):
                                    # Only mark sent on confirmed delivery;
                                    # failures retry next round.
                                    sent_sequences.add(seq)
                                else:
                                    logger.error(
                                        "feishu poll: send_text failed seq=%s result=%s",
                                        seq,
                                        result,
                                    )
                            except Exception:
                                # Keep polling even if one send blows up.
                                logger.exception(
                                    "feishu poll: send_text exception seq=%s",
                                    seq,
                                )
            except httpx.RequestError as exc:
                # Network-level failure of the whole round — log and retry.
                logger.warning("feishu poll: request error trace_id=%s err=%s", trace_id, exc)

            if status in _TERMINAL_STATUSES:
                # Terminal status: allow a few extra rounds so messages
                # written right at completion are still picked up.
                grace += 1
                if grace >= terminal_grace_rounds:
                    break
            else:
                grace = 0

            await asyncio.sleep(poll_interval)
    finally:
        # Deregister only if this task is still the registered poller for
        # the trace (a newer task may have replaced it).
        cur = asyncio.current_task()
        async with _poll_tasks_lock:
            if _poll_tasks.get(trace_id) is cur:
                _poll_tasks.pop(trace_id, None)
+
+
def _schedule_assistant_poll(
    *,
    agent_base_url: str,
    trace_id: str,
    reply_context: FeishuReplyContext,
    connector: Any,
    poll_interval: float,
    poll_request_timeout: float,
    terminal_grace_rounds: int,
    poll_max_seconds: float,
    max_text_chars: int,
) -> None:
    """Keep at most one active polling task per trace.

    Must be called from the event-loop thread; when no loop is running the
    request is dropped silently (forwarding is best-effort).

    Fix: the previous implementation spawned a fire-and-forget ``_spawn``
    wrapper task and discarded its only reference (``_ = loop.create_task``),
    so the event loop's weak reference could let it be garbage-collected
    before it ever acquired the lock (documented asyncio pitfall).  Since
    this function runs in the loop thread and performs no ``await`` between
    the check and the set, the check-and-set on ``_poll_tasks`` is already
    atomic with respect to the single-threaded loop — no wrapper task or
    lock acquisition is needed, and ``_poll_tasks`` itself holds the strong
    reference that keeps the poller alive.
    """
    try:
        asyncio.get_running_loop()
    except RuntimeError:
        return

    existing = _poll_tasks.get(trace_id)
    if existing is not None and not existing.done():
        # A live poller already exists for this trace.
        return

    task = asyncio.create_task(
        _poll_assistants_to_feishu(
            agent_base_url=agent_base_url,
            trace_id=trace_id,
            reply_ctx=reply_context,
            connector=connector,
            poll_interval=poll_interval,
            poll_request_timeout=poll_request_timeout,
            terminal_grace_rounds=terminal_grace_rounds,
            poll_max_seconds=poll_max_seconds,
            max_text_chars=max_text_chars,
        )
    )
    # The registry entry is the strong reference keeping the task alive;
    # the poller deregisters itself in its own finally block.
    _poll_tasks[trace_id] = task
+
+
 class FeishuHttpRunApiExecutor:
-    """调用 ``agent/trace/run_api`` 暴露的 Trace HTTP API,触发后台 Agent 运行。"""
+    """调用 Agent Trace HTTP API,并可选轮询 assistant 消息转发到飞书。"""
 
     def __init__(
         self,
@@ -67,10 +283,16 @@ class FeishuHttpRunApiExecutor:
         base_url: str,
         timeout: float,
         identity_resolver: Any,
-        model: str = "gpt-4o",
+        model: str = "qwen3.5-flash",
         max_iterations: int = 200,
         temperature: float = 0.3,
         notify_on_submit: bool = True,
+        poll_assistant_messages: bool = True,
+        poll_interval_seconds: float = 1.0,
+        poll_request_timeout: float = 30.0,
+        poll_terminal_grace_rounds: int = 2,
+        poll_max_seconds: float = 0.0,
+        assistant_max_text_chars: int = 8000,
     ) -> None:
         self._base = base_url.rstrip("/")
         self._timeout = timeout
@@ -79,6 +301,12 @@ class FeishuHttpRunApiExecutor:
         self._max_iterations = max_iterations
         self._temperature = temperature
         self._notify = notify_on_submit
+        self._poll_assistants = poll_assistant_messages
+        self._poll_interval = poll_interval_seconds
+        self._poll_req_timeout = poll_request_timeout
+        self._poll_grace = poll_terminal_grace_rounds
+        self._poll_max_seconds = poll_max_seconds
+        self._assistant_max_chars = assistant_max_text_chars
         self._map_lock = asyncio.Lock()
         self._api_trace_by_user: dict[str, str] = {}
 
@@ -175,4 +403,17 @@ class FeishuHttpRunApiExecutor:
                 f"[Gateway] 已提交 Agent(API trace_id={resolved_id}),后台执行中。",
             )
 
+        if self._poll_assistants:
+            _schedule_assistant_poll(
+                agent_base_url=self._base,
+                trace_id=resolved_id,
+                reply_context=copy(reply_context),
+                connector=connector,
+                poll_interval=self._poll_interval,
+                poll_request_timeout=self._poll_req_timeout,
+                terminal_grace_rounds=self._poll_grace,
+                poll_max_seconds=self._poll_max_seconds,
+                max_text_chars=self._assistant_max_chars,
+            )
+
         return task_id

+ 22 - 2
gateway/core/channels/feishu/manager.py

@@ -26,10 +26,17 @@ class FeishuChannelConfig:
     dispatch_reactions: bool = False
     dispatch_card_actions: bool = False
     agent_api_base_url: str = "http://127.0.0.1:8000"
-    agent_run_model: str = "gpt-4o"
+    agent_run_model: str = "qwen3.5-flash"
     agent_run_max_iterations: int = 200
     agent_run_temperature: float = 0.3
     feishu_run_notify_on_submit: bool = True
+    # 轮询 Agent GET /api/traces/{id}/messages,逐条转发主路径 assistant 到飞书
+    poll_assistant_messages: bool = True
+    poll_interval_seconds: float = 1.0
+    poll_request_timeout: float = 30.0
+    poll_terminal_grace_rounds: int = 2
+    poll_max_seconds: float = 0.0
+    assistant_max_text_chars: int = 8000
 
 
 class FeishuChannelManager(ChannelRegistry):
@@ -54,6 +61,12 @@ class FeishuChannelManager(ChannelRegistry):
             max_iterations=self._config.agent_run_max_iterations,
             temperature=self._config.agent_run_temperature,
             notify_on_submit=self._config.feishu_run_notify_on_submit,
+            poll_assistant_messages=self._config.poll_assistant_messages,
+            poll_interval_seconds=self._config.poll_interval_seconds,
+            poll_request_timeout=self._config.poll_request_timeout,
+            poll_terminal_grace_rounds=self._config.poll_terminal_grace_rounds,
+            poll_max_seconds=self._config.poll_max_seconds,
+            assistant_max_text_chars=self._config.assistant_max_text_chars,
         )
         self._router = FeishuMessageRouter(
             connector=self._connector,
@@ -90,11 +103,18 @@ class FeishuChannelManager(ChannelRegistry):
                 dispatch_card_actions=os.getenv("CHANNELS_DISPATCH_CARD_ACTIONS", "false").lower()
                 in ("1", "true", "yes"),
                 agent_api_base_url=os.getenv("GATEWAY_AGENT_API_BASE_URL", "http://127.0.0.1:8000").strip(),
-                agent_run_model=os.getenv("FEISHU_AGENT_RUN_MODEL", "gpt-4o").strip(),
+                agent_run_model=os.getenv("FEISHU_AGENT_RUN_MODEL", "qwen3.5-flash").strip(),
                 agent_run_max_iterations=int(os.getenv("FEISHU_AGENT_RUN_MAX_ITERATIONS", "200")),
                 agent_run_temperature=float(os.getenv("FEISHU_AGENT_RUN_TEMPERATURE", "0.3")),
                 feishu_run_notify_on_submit=os.getenv("CHANNELS_FEISHU_RUN_NOTIFY", "true").lower()
                 in ("1", "true", "yes"),
+                poll_assistant_messages=os.getenv("FEISHU_AGENT_POLL_ASSISTANTS", "true").lower()
+                in ("1", "true", "yes"),
+                poll_interval_seconds=float(os.getenv("FEISHU_AGENT_POLL_INTERVAL", "1.0")),
+                poll_request_timeout=float(os.getenv("FEISHU_AGENT_POLL_REQUEST_TIMEOUT", "30")),
+                poll_terminal_grace_rounds=int(os.getenv("FEISHU_AGENT_POLL_GRACE_ROUNDS", "2")),
+                poll_max_seconds=float(os.getenv("FEISHU_AGENT_POLL_MAX_SECONDS", "0")),
+                assistant_max_text_chars=int(os.getenv("FEISHU_AGENT_ASSISTANT_MAX_CHARS", "8000")),
             )
         )