1 месяц назад · edb3a191a0
--- a/agent/tools/models.py
+++ b/agent/tools/models.py
@@ -6,6 +6,7 @@ Tool Models - 工具系统核心数据模型
 
				 2. ToolContext: 工具执行上下文（依赖注入）
			
 
				 """
			
 
				 
			
 
				+import json
			
 
				 from dataclasses import dataclass, field
			
 
				 from typing import Any, Dict, List, Optional, Protocol
			
 
				 
			
@@ -44,6 +45,9 @@ class ToolResult:
 
				 	# Token追踪（用于工具内部LLM调用）
			
 
				 	tool_usage: Optional[Dict[str, Any]] = None  # 格式：{"model": "...", "prompt_tokens": 100, "completion_tokens": 50, "cost": 0.0}
			
 
				 
			
 
				+	# 默认 metadata 不会进入对话；对批量画像等工具设为 True，将 metadata 序列化后追加给 LLM
			
 
				+	include_metadata_in_llm: bool = False
			
 
				+
			
 
				 	def to_llm_message(self, first_time: bool = True) -> str:
			
 
				 		"""
			
 
				 		转换为给 LLM 的消息
			
@@ -80,6 +84,12 @@ class ToolResult:
 
				 		if self.attachments:
			
 
				 			parts.append(f"\nAttachments: {', '.join(self.attachments)}")
			
 
				 
			
 
				+		if self.include_metadata_in_llm and self.metadata:
			
 
				+			parts.append(
			
 
				+				"## metadata (JSON)\n"
			
 
				+				+ json.dumps(self.metadata, ensure_ascii=False)
			
 
				+			)
			
 
				+
			
 
				 		return "\n\n".join(parts)
			
 
				 
			
 
				 
			
--- a/examples/content_finder/content_finder.md
+++ b/examples/content_finder/content_finder.md
@@ -20,8 +20,9 @@ $system$
 
				 - 抖音视频搜索（Tikhub）：`douyin_search_tikhub`
			
 
				 - 订阅账号作品搜索：`douyin_user_videos`
			
 
				 - 数据库作者检索（按搜索词找历史优质作者）：`find_authors_from_db`
			
 
				-- 作品画像获取：`get_content_fans_portrait`
			
 
				-- 作者画像获取：`get_account_fans_portrait`
			
 
				+- 批量画像（**筛选阶段优先**：一次调用拉齐多条内容画像并按规则账号兜底）：`batch_fetch_portraits`（参数 `candidates_json` 为 JSON 数组字符串）。工具返回的同一条 `tool` 消息正文末尾会附带 `## metadata (JSON)`（含 `results`）；同时会写入 `{OUTPUT_DIR}/{trace_id}/batch_portraits.json`，上下文丢失时用 `read_file` 读取该文件即可恢复结构化结果。
			
 
				+- 作品画像（单条）：`get_content_fans_portrait`
			
 
				+- 作者画像（单条兜底）：`get_account_fans_portrait`
			
 
				 - 过程记录：`think_and_plan`
			
 
				 - 存储结果至数据库：`store_results_mysql`
			
 
				 - 创建aigc计划：`create_crawler_plan_by_douyin_content_id`、`create_crawler_plan_by_douyin_account_id`
			
@@ -91,8 +92,8 @@ $system$
 
				 ```
			
 
				 
			
 
				 ### 筛选阶段必须按照 `content_filtering_strategy` 的步骤进行，对于**case出发**的搜索结果，满足6分即可输出不需要查看画像；其他结果按顺序查看画像
			
 
				-1. 先调用 `get_content_fans_portrait`，检查 `metadata.has_portrait`。
			
 
				-2. 若 `has_portrait=False`，如果是 `douyin_search` 或 `douyin_search_tikhub` 获取到的视频，再调用 `get_account_fans_portrait` 兜底，如果是`douyin_user_videos`则不需要再次调用`get_account_fans_portrait`。
			
 
				+1. **优先**对本轮待画像的候选列表调用一次 `batch_fetch_portraits`：在 `candidates_json` 中传入数组，每项含 `aweme_id`、可选 `author_sec_uid`；来自 `douyin_user_videos` 的条目设 `try_account_fallback: false`，来自 `douyin_search` / `douyin_search_tikhub` 的条目设 `true`（默认）。根据返回的 `metadata.results` 逐条读取 `content.has_portrait` / `account.has_portrait` 与 `portrait_data`（逻辑同原单条工具）。
			
 
				+2. 仅当批量不适用（例如单条补拉）时，再使用 `get_content_fans_portrait`，检查 `metadata.has_portrait`；若 `has_portrait=False` 且来源为搜索类视频，再调用 `get_account_fans_portrait` 兜底；`douyin_user_videos` 来源不调用账号兜底。
			
 
				 补充：`douyin_search` 失败后再调用 `douyin_search_tikhub` 作为兜底。
			
 
				 3. **不允许跳过画像获取直接输出**
			
 
				 
			
@@ -111,8 +112,8 @@ $system$
 
				 
			
 
				 ### 2.筛选阶段是否按规则执行
			
 
				 - 对于所有`基于case出发策略`的搜索结果，优先进行 **基础筛选**和**基于case出发策略筛选**，满足6分条件直接进入最终输出池，不需要调用画像数据。
			
 
				-- 其他策略获取的视频或达不到6分的视频，是否都已调用过 `get_content_fans_portrait(aweme_id)`？
			
 
				-- 对其中 `metadata.has_portrait=False` 的条目，是否**在同一条目上**已调用 `get_account_fans_portrait(account_id=author.sec_uid)` 作为兜底？
			
 
				+- 其他策略获取的视频或达不到6分的视频，是否已通过 **`batch_fetch_portraits`**（或等价的逐条 `get_content_fans_portrait`）获取内容画像？
			
 
				+- 对其中内容无有效画像、且来源为搜索类的条目，是否在批量结果中已包含账号兜底尝试，或已逐条调用 `get_account_fans_portrait`？（`douyin_user_videos` 来源不要求账号兜底。）
			
 
				 - **禁止**：仅因内容侧无画像就跳过账号画像、直接把 `portrait_data` 当空或来源标为 `none` 而未尝试账号接口（除非两次调用均失败且已在理由中说明）。
			
 
				 
			
 
				 ### 3.输出、校验、入库顺序是否正确
			
--- a/examples/content_finder/core.py
+++ b/examples/content_finder/core.py
@@ -79,6 +79,7 @@ from tools import (
 
				     douyin_user_videos,
			
 
				     get_content_fans_portrait,
			
 
				     get_account_fans_portrait,
			
 
				+    batch_fetch_portraits,
			
 
				     create_crawler_plan_by_douyin_content_id,
			
 
				     create_crawler_plan_by_douyin_account_id,
			
 
				     store_results_mysql,
			
@@ -91,7 +92,7 @@ from tools import (
 
				 logger = logging.getLogger(__name__)
			
 
				 
			
 
				 # 默认搜索词
			
 
				-DEFAULT_QUERY = "体制内,近亲繁殖"
			
 
				+DEFAULT_QUERY = "婆媳矛盾,反转式"
			
 
				 DEFAULT_DEMAND_ID = 1
			
 
				 
			
 
				 
			
@@ -174,6 +175,7 @@ async def run_agent(
 
				         "douyin_user_videos",
			
 
				         "get_content_fans_portrait",
			
 
				         "get_account_fans_portrait",
			
 
				+        "batch_fetch_portraits",
			
 
				         "find_authors_from_db",
			
 
				         "store_results_mysql",
			
 
				         "create_crawler_plan_by_douyin_content_id",
			
--- a/examples/content_finder/render_log_html.py
+++ b/examples/content_finder/render_log_html.py
@@ -68,6 +68,7 @@ TOOL_DESCRIPTION_MAP: dict[str, str] = {
 
				     "douyin_user_videos": "通过账号/作者 sec_uid 获取其历史作品列表。",
			
 
				     "get_content_fans_portrait": "获取视频点赞用户画像（热点宝），判断 metadata.has_portrait。",
			
 
				     "get_account_fans_portrait": "获取作者粉丝画像（热点宝），用于内容画像缺失兜底。",
			
 
				+    "batch_fetch_portraits": "批量获取多条内容画像并按规则账号兜底，一次工具调用返回 metadata.results。",
			
 
				     "store_results_mysql": "将 output.json 写入 MySQL（作者表与内容表）。",
			
 
				     "create_crawler_plan_by_douyin_content_id": "为入选视频生成 AIGC 爬取计划。",
			
 
				     "create_crawler_plan_by_douyin_account_id": "为入选账号生成 AIGC 爬取计划。",
			
--- a/examples/content_finder/server.py
+++ b/examples/content_finder/server.py
@@ -244,6 +244,7 @@ async def create_task(request: TaskRequest):
 
				                     "douyin_user_videos",
			
 
				                     "get_content_fans_portrait",
			
 
				                     "get_account_fans_portrait",
			
 
				+                    "batch_fetch_portraits",
			
 
				                     "store_results_mysql",
			
 
				                     "exec_summary",
			
 
				                 ]
			
--- a/examples/content_finder/skills/content_filtering_strategy.md
+++ b/examples/content_finder/skills/content_filtering_strategy.md
@@ -53,19 +53,19 @@ description: 内容筛选方法论
 
				 
			
 
				 ### 阶段3：画像匹配筛选
			
 
				 **分批处理**：先处理前 10 条候选内容，筛选后 >= M 则停止，不足再继续下一批。  
			
 
				-**并行限制**：每次最多并行调用 3 个画像工具。  
			
 
				-**停止条件**：已获取画像数量 >= M × 1.5 时，立即停止，进入下一阶段。
			
 
				-不要无限循环获取画像，避免陷入"一直获取画像"的状态
			
 
				+**批量画像（推荐）**：每一批内先整理本批待画像条目，**一次**调用 `batch_fetch_portraits(candidates_json=...)`（工具内顺序请求接口），用返回的 `metadata.results` 完成本批评估；避免对每条视频各打一轮「内容画像工具 + 可能账号画像工具」导致对话消息暴涨。单批条数不超过工具上限（30），超过则拆成多批多次 `batch_fetch_portraits`。  
			
 
				+**停止条件**：已获取画像数量 >= M × 1.5 时，立即停止，进入下一阶段。  
			
 
				+不要无限循环获取画像，避免陷入"一直获取画像"的状态。
			
 
				 
			
 
				 #### 画像获取优先级
			
 
				 
			
 
				 **优先级 1：内容点赞用户画像**
			
 
				-- 调用 `get_content_fans_portrait(content_id=aweme_id)`
			
 
				-- `metadata.has_portrait=True` → 从 `metadata.portrait_data` 评估，标注来源 `content_like`
			
 
				+- 批量：`batch_fetch_portraits` 返回中每条 `results[i].content.has_portrait` 与 `portrait_data`
			
 
				+- 单条兜底：`get_content_fans_portrait(content_id=aweme_id)`，`metadata.has_portrait=True` → 从 `metadata.portrait_data` 评估，标注来源 `content_like`
			
 
				 
			
 
				 **优先级 2：账号粉丝画像（兜底）**
			
 
				-- 如果 `has_portrait=False`，调用 `get_account_fans_portrait(account_id=author.sec_uid)`
			
 
				-- 有画像则评估，标注来源 `account_fans`
			
 
				+- 批量：同条目的 `results[i].account`（`attempted=true` 且 `has_portrait`）；仅当该条 `try_account_fallback` 为 true（搜索来源）时工具才会请求账号接口；`douyin_user_videos` 来源在 `candidates_json` 中对该条设 `try_account_fallback: false`
			
 
				+- 单条：若 `has_portrait=False`，调用 `get_account_fans_portrait(account_id=author.sec_uid)`；有画像则评估，标注来源 `account_fans`
			
 
				 
			
 
				 **优先级 3：无画像**
			
 
				 - 两者均无画像，仅基于热度和相关性评估，标注来源 `none`
			
--- a/examples/content_finder/skills/exec_summary_rows.md
+++ b/examples/content_finder/skills/exec_summary_rows.md
@@ -7,27 +7,23 @@ description: 仅在需要写入 process_trace.json 时，用于记录最终输
 
				 生成用于记录最终输出的每条视频的寻找过程的json
			
 
				 
			
 
				 ## 强约束（必须遵守）
			
 
				-1. **只基于入选内容**：只能对 `output.json.contents` 中出现的 `aweme_id` 生成 rows；不得输出任何不在 contents 的视频（包括淘汰候选/搜索过程中的视频）。
			
 
				+1. **视频选择**：只能对 `output.json.contents` 中出现的 `aweme_id` 生成 rows；不得输出任何不在 contents 的视频（包括淘汰候选/搜索过程中的视频）。
			
 
				 2. **rows 数量必须等于 contents 数量**：一条入选内容必须对应且仅对应一行 row。
			
 
				 3. **字段固定且统一**：每行 row 只允许包含下列 key（不得增删改名）：
			
 
				-   - `aweme_id`
			
 
				-   - `title`
			
 
				-   - `author_nickname`
			
 
				-   - `strategy_type`
			
 
				-   - `from_case_aweme_id`
			
 
				-   - `from_case_point`
			
 
				-   - `from_feature`
			
 
				-   - `search_keyword`
			
 
				-   - `channel`
			
 
				-   - `decision_basis`
			
 
				-   - `decision_notes`
			
 
				-   - `input_features`
			
 
				-4. **值使用中文枚举**：
			
 
				-   - `strategy_type`: `"case出发策略"` / `"特征出发策略"`
			
 
				-   - `channel`: `"抖音搜索"` / `"订阅账号"` / `"榜单"` / `"其他"`
			
 
				-   - `decision_basis`: `"内容画像匹配"` / `"作者画像匹配"` / `"需求筛选"` / `"画像缺失"` / `"其他"`
			
 
				+   - `aweme_id`：视频id
			
 
				+   - `title`：视频标题
			
 
				+   - `author_nickname`：作者名称。
			
 
				+   - `strategy_type`：寻找策略。"case出发" / "特征出发"。
			
 
				+   - `from_case_aweme_id`：case出发策略关联的内容id
			
 
				+   - `from_case_point`：case出发策略关联的灵感点。
			
 
				+   - `from_feature`：特征出发策略关联的特征词。
			
 
				+   - `search_keyword`：搜索词，即该内容来自哪个搜索词。
			
 
				+   - `channel`：寻找方式 "抖音搜索" / "索引榜单搜索" / "垂类推荐流" / "订阅账号作品搜索"
			
 
				+   - `decision_basis`：筛选的方式 "基于case出发策略筛选" / "内容点赞用户画像" / "账号粉丝画像" / "其他"
			
 
				+   - `decision_notes`：筛选的理由
			
 
				+   - `input_features`： Agent起始输入的特征词
			
 
				+4. **值使用中文枚举**
			
 
				 5. **input_features**：必须是 `list[str]`；默认从 `output.json.query` 按逗号拆分得到（兼容中文逗号）。
			
 
				-6. **允许为空的字段**：`from_case_aweme_id/from_case_point/from_feature` 若无法确定可为空字符串，但不能缺 key。
			
 
				 
			
 
				 ## 依据
			
 
				 - `output.json`（必须读取并以 `contents` 为准）
			
@@ -35,18 +31,6 @@ description: 仅在需要写入 process_trace.json 时，用于记录最终输
 
				   - `contents[]`：每条入选内容，含 `aweme_id/title/author_nickname/reason/portrait_data.source` 等
			
 
				 - `log.txt`：用于判断内容的 strategy_type(来自哪种策略)、from_case_point(来自哪个灵感点)、search_keyword(搜索词)与渠道等
			
 
				 
			
 
				-## 生成规则（建议优先级）
			
 
				-对每个 `content in output.json.contents`：
			
 
				-1. `aweme_id/title/author_nickname` 直接来自 content（必须与 contents 一致）
			
 
				-2. `decision_notes`：优先用 `content.reason`（入选理由）
			
 
				-3. `decision_basis`：
			
 
				-   - 若 `content.portrait_data.source == "content_like"` → `"内容画像匹配"`
			
 
				-   - 若 `== "account_fans"` → `"作者画像匹配"`
			
 
				-   - 否则 `"其他"`
			
 
				-4. `strategy_type/channel/search_keyword`：
			
 
				-   - 在`log.txt`/上下文找明确来源，按事实填（且用上面的中文枚举）
			
 
				-   - 否则 字段留空
			
 
				-5. `from_case_* / from_feature`：能确定就填；不确定可空串。
			
 
				 
			
 
				 ## 输出格式（必须严格）
			
 
				 只输出一个 JSON 对象（不要 Markdown、不要解释、不要多余文本）：
			
--- a/examples/content_finder/tools/__init__.py
+++ b/examples/content_finder/tools/__init__.py
@@ -5,7 +5,11 @@
 
				 from .douyin_search import douyin_search
			
 
				 from .douyin_search_tikhub import douyin_search_tikhub
			
 
				 from .douyin_user_videos import douyin_user_videos
			
 
				-from .hotspot_profile import get_content_fans_portrait, get_account_fans_portrait
			
 
				+from .hotspot_profile import (
			
 
				+    get_content_fans_portrait,
			
 
				+    get_account_fans_portrait,
			
 
				+    batch_fetch_portraits,
			
 
				+)
			
 
				 from .store_results_mysql import store_results_mysql
			
 
				 from .aigc_platform_api import create_crawler_plan_by_douyin_content_id, create_crawler_plan_by_douyin_account_id
			
 
				 from .think_and_plan import think_and_plan
			
@@ -19,6 +23,7 @@ __all__ = [
 
				     "douyin_user_videos",
			
 
				     "get_content_fans_portrait",
			
 
				     "get_account_fans_portrait",
			
 
				+    "batch_fetch_portraits",
			
 
				     "store_results_mysql",
			
 
				     "create_crawler_plan_by_douyin_content_id",
			
 
				     "create_crawler_plan_by_douyin_account_id",
			
--- a/examples/content_finder/tools/aigc_platform_api.py
+++ b/examples/content_finder/tools/aigc_platform_api.py
@@ -25,7 +25,7 @@ def _log_aigc_return(label: str, params: Dict[str, Any], r: ToolResult) -> ToolR
 
				     log_tool_call(label, params, format_tool_result_for_log(r))
			
 
				     return r
			
 
				 
			
 
				-CAN_NOT_CREATE_PLAN = False
			
 
				+CAN_NOT_CREATE_PLAN = True
			
 
				 
			
 
				 AIGC_BASE_URL = "https://aigc-api.aiddit.com"
			
 
				 CRAWLER_PLAN_CREATE_URL = f"{AIGC_BASE_URL}/aigc/crawler/plan/save"
			
--- a/examples/content_finder/tools/hotspot_profile.py
+++ b/examples/content_finder/tools/hotspot_profile.py
@@ -3,10 +3,12 @@
 
				 
			
 
				 调用内部爬虫服务获取账号/内容的粉丝画像。
			
 
				 """
			
 
				-import asyncio
			
 
				+import json
			
 
				 import logging
			
 
				+import os
			
 
				 import time
			
 
				-from typing import Optional, Dict, Any, List, Tuple
			
 
				+from pathlib import Path
			
 
				+from typing import Any, Dict, List, Optional, Tuple, TypedDict
			
 
				 
			
 
				 import requests
			
 
				 
			
@@ -17,11 +19,47 @@ logger = logging.getLogger(__name__)
 
				 
			
 
				 _LABEL_ACCOUNT = "工具调用：get_account_fans_portrait -> 抖音账号粉丝画像（热点宝）"
			
 
				 _LABEL_CONTENT = "工具调用：get_content_fans_portrait -> 内容点赞用户画像（热点宝）"
			
 
				+_LABEL_BATCH = "工具调用：batch_fetch_portraits -> 批量获取内容/账号画像（热点宝）"
			
 
				 
			
 
				+BATCH_MAX_ITEMS = 30
			
 
				+_BATCH_SNAPSHOT_NAME = "batch_portraits.json"
			
 
				 
			
 
				-def _log_return(label: str, params: Dict[str, Any], r: ToolResult) -> ToolResult:
			
 
				-    log_tool_call(label, params, format_tool_result_for_log(r))
			
 
				-    return r
			
 
				+
			
 
				def _repo_root_from_this_file() -> Path:
				    """Return the repository root derived from this module's location.

				    The module lives at examples/content_finder/tools/hotspot_profile.py,
				    so the fourth ancestor (``parents[3]``) of the resolved file path is
				    the repository root.
				    """
				    module_path = Path(__file__).resolve()
				    return module_path.parents[3]
			
 
				+
			
 
				+
			
 
				+def _resolve_output_dir_path() -> Path:
			
 
				+    raw = (os.getenv("OUTPUT_DIR") or ".cache/output").strip()
			
 
				+    p = Path(raw).expanduser()
			
 
				+    return p.resolve() if p.is_absolute() else (_repo_root_from_this_file() / p).resolve()
			
 
				+
			
 
				+
			
 
				def _persist_batch_portraits_json(
				    trace_id: Optional[str],
				    results: List[Dict[str, Any]],
				    count: int,
				) -> Optional[str]:
				    """Write batch portrait results to OUTPUT_DIR/<trace_id>/batch_portraits.json.

				    The snapshot is best-effort: it exists so the results can be re-read
				    from disk and inspected when debugging, so a failure here must never
				    break the calling tool.

				    Args:
				        trace_id: Directory name for this run; a falsy value skips the write.
				        results: Per-candidate result dictionaries to store.
				        count: Number stored alongside the results under the "count" key.

				    Returns:
				        The snapshot file path as a string, or None when ``trace_id`` is
				        missing or the snapshot could not be serialized or written.
				    """
				    if not trace_id:
				        return None
				    try:
				        # Serialize first so an unserializable payload does not leave an
				        # empty directory behind.
				        payload = json.dumps(
				            {"trace_id": trace_id, "count": count, "results": results},
				            ensure_ascii=False,
				            indent=2,
				        )
				        out_dir = _resolve_output_dir_path() / trace_id
				        out_dir.mkdir(parents=True, exist_ok=True)
				        path = out_dir / _BATCH_SNAPSHOT_NAME
				        path.write_text(payload, encoding="utf-8")
				    except (OSError, TypeError, ValueError) as e:
				        # TypeError/ValueError come from json.dumps (unserializable value,
				        # circular reference) or from encoding; treat them like I/O errors.
				        logger.warning("batch portrait snapshot write failed: %s", e)
				        return None
				    return str(path)
			
 
				 
			
 
				 
			
 
				 ACCOUNT_FANS_PORTRAIT_API = "http://crawapi.piaoquantv.com/crawler/dou_yin/re_dian_bao/account_fans_portrait"
			
@@ -29,6 +67,189 @@ CONTENT_FANS_PORTRAIT_API = "http://crawapi.piaoquantv.com/crawler/dou_yin/re_di
 
				 DEFAULT_TIMEOUT = 60.0
			
 
				 
			
 
				 
			
 
				+class _PortraitOk(TypedDict):
			
 
				+    output: str
			
 
				+    has_portrait: bool
			
 
				+    portrait_data: Dict[str, Any]
			
 
				+    raw_data: Any
			
 
				+
			
 
				+
			
 
				def _log_return(label: str, params: Dict[str, Any], r: ToolResult) -> ToolResult:
				    """Record a tool call in the log and pass the result through unchanged.

				    Args:
				        label: Label identifying the tool call in the log.
				        params: Parameters the tool was called with.
				        r: The tool result to log.

				    Returns:
				        The same ``r`` object, so the helper can wrap a ``return``.
				    """
				    formatted = format_tool_result_for_log(r)
				    log_tool_call(label, params, formatted)
				    return r
			
 
				+
			
 
				+
			
 
				+def _top_k(items: Dict[str, Any], k: int) -> List[Tuple[str, Any]]:
			
 
				+    def percent_value(entry: Tuple[str, Any]) -> float:
			
 
				+        metrics = entry[1] if isinstance(entry[1], dict) else {}
			
 
				+        return metrics.get("percentage")
			
 
				+
			
 
				+    return sorted(items.items(), key=percent_value, reverse=True)[:k]
			
 
				+
			
 
				+
			
 
				+def _format_portrait_summary(
			
 
				+    header_line: str,
			
 
				+    link_line: str,
			
 
				+    portrait: Dict[str, Any],
			
 
				+) -> str:
			
 
				+    summary_lines = [header_line, link_line, ""]
			
 
				+    for k, v in portrait.items():
			
 
				+        if not isinstance(v, dict):
			
 
				+            continue
			
 
				+        if k in ("省份", "城市"):
			
 
				+            summary_lines.append(f"【{k} TOP5】分布")
			
 
				+            items = _top_k(v, 5)
			
 
				+        else:
			
 
				+            summary_lines.append(f"【{k}】分布")
			
 
				+            items = v.items()
			
 
				+
			
 
				+        for name, metrics in items:
			
 
				+            ratio = metrics.get("percentage")
			
 
				+            tgi = metrics.get("preference")
			
 
				+            summary_lines.append(f"  {name}: {ratio} (偏好度: {tgi})")
			
 
				+        summary_lines.append("")
			
 
				+    return "\n".join(summary_lines)
			
 
				+
			
 
				+
			
 
				+def _validate_account_id(account_id: str) -> Optional[str]:
			
 
				+    if not account_id or not isinstance(account_id, str):
			
 
				+        return "account_id 参数无效：必须是非空字符串"
			
 
				+    if not account_id.startswith("MS4wLjABAAAA"):
			
 
				+        return (
			
 
				+            f"account_id 格式错误：必须以 MS4wLjABAAAA 开头，"
			
 
				+            f"当前值: {account_id[:min(20, len(account_id))]}..."
			
 
				+        )
			
 
				+    return None
			
 
				+
			
 
				+
			
 
				+def _validate_content_id(content_id: str) -> Optional[str]:
			
 
				+    if not content_id or not isinstance(content_id, str):
			
 
				+        return "content_id 参数无效：必须是非空字符串"
			
 
				+    if not content_id.isdigit():
			
 
				+        return f"content_id 格式错误：aweme_id 应该是纯数字，当前值: {content_id[:20]}..."
			
 
				+    if len(content_id) < 15 or len(content_id) > 25:
			
 
				+        return f"content_id 长度异常：期望 15-25 位数字，实际 {len(content_id)} 位"
			
 
				+    return None
			
 
				+
			
 
				+
			
 
				+def _dimension_flags(
			
 
				+    need_province: bool,
			
 
				+    need_city: bool,
			
 
				+    need_city_level: bool,
			
 
				+    need_gender: bool,
			
 
				+    need_age: bool,
			
 
				+    need_phone_brand: bool,
			
 
				+    need_phone_price: bool,
			
 
				+) -> Dict[str, bool]:
			
 
				+    return {
			
 
				+        "need_province": need_province,
			
 
				+        "need_city": need_city,
			
 
				+        "need_city_level": need_city_level,
			
 
				+        "need_gender": need_gender,
			
 
				+        "need_age": need_age,
			
 
				+        "need_phone_brand": need_phone_brand,
			
 
				+        "need_phone_price": need_phone_price,
			
 
				+    }
			
 
				+
			
 
				+
			
 
				def _sync_fetch_account_portrait(
				    account_id: str,
				    flags: Dict[str, bool],
				    request_timeout: float,
				) -> Tuple[Optional[str], Optional[_PortraitOk]]:
				    """Fetch the fans portrait of one account with a blocking HTTP POST.

				    Args:
				        account_id: Account id to query; validated before any request.
				        flags: ``need_*`` dimension switches merged into the request body.
				        request_timeout: Timeout in seconds passed to ``requests.post``.

				    Returns:
				        ``(error, None)`` when validation, the request, or response
				        handling fails; ``(None, result)`` on success. ``has_portrait`` is
				        True only when the portrait has at least one non-empty dict value.
				    """
				    err = _validate_account_id(account_id)
				    if err:
				        return err, None
				    payload = {"account_id": account_id, **flags}
				    try:
				        response = requests.post(
				            ACCOUNT_FANS_PORTRAIT_API,
				            json=payload,
				            headers={"Content-Type": "application/json"},
				            timeout=request_timeout,
				        )
				        response.raise_for_status()
				        data = response.json()
				        # Parsing and formatting stay inside the try so that a malformed
				        # payload is reported as an error string instead of propagating
				        # out of the tool.
				        if not isinstance(data, dict):
				            raise ValueError(f"unexpected response type: {type(data).__name__}")
				        data_block = data.get("data")
				        if not isinstance(data_block, dict):
				            data_block = {}
				        portrait = data_block.get("data")
				        if not isinstance(portrait, dict):
				            portrait = {}
				        header = f"账号 {account_id} 的粉丝画像"
				        link = (
				            f"画像链接：https://douhot.douyin.com/creator/detail?"
				            f"active_tab=creator_fans_portrait&creator_id={account_id}"
				        )
				        output = _format_portrait_summary(header, link, portrait)
				    except requests.exceptions.HTTPError as e:
				        return f"HTTP {e.response.status_code}: {e.response.text}", None
				    except requests.exceptions.Timeout:
				        return f"请求超时（{request_timeout}秒）", None
				    except requests.exceptions.RequestException as e:
				        return f"网络错误: {str(e)}", None
				    except Exception as e:
				        logger.error(
				            "account portrait request failed",
				            extra={"account_id": account_id, "error": str(e)},
				            exc_info=True,
				        )
				        return f"未知错误: {str(e)}", None

				    has_valid = any(isinstance(v, dict) and v for v in portrait.values())
				    return None, _PortraitOk(
				        output=output,
				        has_portrait=has_valid,
				        portrait_data=portrait,
				        raw_data=data,
				    )
			
 
				+
			
 
				+
			
 
				def _sync_fetch_content_portrait(
				    content_id: str,
				    flags: Dict[str, bool],
				    request_timeout: float,
				) -> Tuple[Optional[str], Optional[_PortraitOk]]:
				    """Fetch the liking-users portrait of one content item with a blocking HTTP POST.

				    Args:
				        content_id: Content id (aweme_id) to query; validated before any request.
				        flags: ``need_*`` dimension switches merged into the request body.
				        request_timeout: Timeout in seconds passed to ``requests.post``.

				    Returns:
				        ``(error, None)`` when validation, the request, or response
				        handling fails; ``(None, result)`` on success. ``has_portrait`` is
				        True only when the portrait has at least one non-empty dict value.
				    """
				    err = _validate_content_id(content_id)
				    if err:
				        return err, None
				    payload = {"content_id": content_id, **flags}
				    try:
				        response = requests.post(
				            CONTENT_FANS_PORTRAIT_API,
				            json=payload,
				            headers={"Content-Type": "application/json"},
				            timeout=request_timeout,
				        )
				        response.raise_for_status()
				        data = response.json()
				        # Parsing and formatting stay inside the try so that a malformed
				        # payload is reported as an error string instead of propagating
				        # out of the tool.
				        if not isinstance(data, dict):
				            raise ValueError(f"unexpected response type: {type(data).__name__}")
				        data_block = data.get("data")
				        if not isinstance(data_block, dict):
				            data_block = {}
				        portrait = data_block.get("data")
				        if not isinstance(portrait, dict):
				            portrait = {}
				        header = f"内容 {content_id} 的点赞用户画像"
				        link = (
				            f"画像链接：https://douhot.douyin.com/video/detail?"
				            f"active_tab=video_fans&video_id={content_id}"
				        )
				        output = _format_portrait_summary(header, link, portrait)
				    except requests.exceptions.HTTPError as e:
				        return f"HTTP {e.response.status_code}: {e.response.text}", None
				    except requests.exceptions.Timeout:
				        return f"请求超时（{request_timeout}秒）", None
				    except requests.exceptions.RequestException as e:
				        return f"网络错误: {str(e)}", None
				    except Exception as e:
				        logger.error(
				            "content portrait request failed",
				            extra={"content_id": content_id, "error": str(e)},
				            exc_info=True,
				        )
				        return f"未知错误: {str(e)}", None

				    has_valid = any(isinstance(v, dict) and v for v in portrait.values())
				    return None, _PortraitOk(
				        output=output,
				        has_portrait=has_valid,
				        portrait_data=portrait,
				        raw_data=data,
				    )
			
 
				+
			
 
				+
			
 
				 @tool(description="获取抖音账号粉丝画像（热点宝），支持选择画像维度")
			
 
				 async def get_account_fans_portrait(
			
 
				     account_id: str,
			
@@ -93,166 +314,55 @@ async def get_account_fans_portrait(
 
				         "need_phone_price": need_phone_price,
			
 
				         "timeout": timeout,
			
 
				     }
			
 
				-
			
 
				-    # 验证 account_id 格式
			
 
				-    if not account_id or not isinstance(account_id, str):
			
 
				-        logger.error("get_account_fans_portrait invalid account_id", extra={"account_id": account_id})
			
 
				-        return _log_return(
			
 
				-            _LABEL_ACCOUNT,
			
 
				-            call_params,
			
 
				-            ToolResult(
			
 
				-                title="账号粉丝画像获取失败",
			
 
				-                output="",
			
 
				-                error="account_id 参数无效：必须是非空字符串",
			
 
				-            ),
			
 
				-        )
			
 
				-
			
 
				-    if not account_id.startswith("MS4wLjABAAAA"):
			
 
				-        logger.error("get_account_fans_portrait invalid sec_uid format", extra={"account_id": account_id})
			
 
				+    flags = _dimension_flags(
			
 
				+        need_province,
			
 
				+        need_city,
			
 
				+        need_city_level,
			
 
				+        need_gender,
			
 
				+        need_age,
			
 
				+        need_phone_brand,
			
 
				+        need_phone_price,
			
 
				+    )
			
 
				+    request_timeout = timeout if timeout is not None else DEFAULT_TIMEOUT
			
 
				+    err, ok = _sync_fetch_account_portrait(account_id, flags, request_timeout)
			
 
				+    duration_ms = int((time.time() - start_time) * 1000)
			
 
				+
			
 
				+    if err:
			
 
				+        logger.error("get_account_fans_portrait failed", extra={"account_id": account_id, "error": err})
			
 
				         return _log_return(
			
 
				             _LABEL_ACCOUNT,
			
 
				             call_params,
			
 
				             ToolResult(
			
 
				                 title="账号粉丝画像获取失败",
			
 
				                 output="",
			
 
				-                error=f"account_id 格式错误：必须以 MS4wLjABAAAA 开头，当前值: {account_id[:min(20, len(account_id))]}...",
			
 
				+                error=err,
			
 
				             ),
			
 
				         )
			
 
				 
			
 
				-    # if len(account_id) < 70 or len(account_id) > 90:
			
 
				-    #     logger.error("get_account_fans_portrait invalid sec_uid length", extra={"account_id": account_id, "length": len(account_id)})
			
 
				-    #     return ToolResult(
			
 
				-    #         title="账号粉丝画像获取失败",
			
 
				-    #         output="",
			
 
				-    #         error=f"account_id 长度异常：期望 70-90 字符，实际 {len(account_id)} 字符。这可能是编造或截断的数据。",
			
 
				-    #     )
			
 
				-
			
 
				-    try:
			
 
				-        payload = {
			
 
				+    assert ok is not None
			
 
				+    logger.info(
			
 
				+        "get_account_fans_portrait completed",
			
 
				+        extra={
			
 
				             "account_id": account_id,
			
 
				-            "need_province": need_province,
			
 
				-            "need_city": need_city,
			
 
				-            "need_city_level": need_city_level,
			
 
				-            "need_gender": need_gender,
			
 
				-            "need_age": need_age,
			
 
				-            "need_phone_brand": need_phone_brand,
			
 
				-            "need_phone_price": need_phone_price,
			
 
				-        }
			
 
				-
			
 
				-        request_timeout = timeout if timeout is not None else DEFAULT_TIMEOUT
			
 
				-
			
 
				-        response = requests.post(
			
 
				-            ACCOUNT_FANS_PORTRAIT_API,
			
 
				-            json=payload,
			
 
				-            headers={"Content-Type": "application/json"},
			
 
				-            timeout=request_timeout
			
 
				-        )
			
 
				-        response.raise_for_status()
			
 
				-        data = response.json()
			
 
				-
			
 
				-        data_block = data.get("data", {}) if isinstance(data.get("data"), dict) else {}
			
 
				-        portrait = data_block.get("data", {}) if isinstance(data_block.get("data"), dict) else {}
			
 
				-
			
 
				-        # 格式化输出摘要
			
 
				-        summary_lines = [f"账号 {account_id} 的粉丝画像"]
			
 
				-        summary_lines.append(f"画像链接：https://douhot.douyin.com/creator/detail?active_tab=creator_fans_portrait&creator_id={account_id}")
			
 
				-        summary_lines.append("")
			
 
				-        for k, v in portrait.items():
			
 
				-            if not isinstance(v, dict):
			
 
				-                continue
			
 
				-            if k in ("省份", "城市"):
			
 
				-                summary_lines.append(f"【{k} TOP5】分布")
			
 
				-                items = _top_k(v, 5)
			
 
				-            else:
			
 
				-                summary_lines.append(f"【{k}】分布")
			
 
				-                items = v.items()
			
 
				-
			
 
				-            for name, metrics in items:
			
 
				-                ratio = metrics.get("percentage")
			
 
				-                tgi = metrics.get("preference")
			
 
				-                summary_lines.append(f"  {name}: {ratio} (偏好度: {tgi})")
			
 
				-            summary_lines.append("")
			
 
				-
			
 
				-        duration_ms = int((time.time() - start_time) * 1000)
			
 
				-        has_valid_portrait = bool(portrait and any(
			
 
				-            isinstance(v, dict) and v for v in portrait.values()
			
 
				-        ))
			
 
				-
			
 
				-        logger.info(
			
 
				-            "get_account_fans_portrait completed",
			
 
				-            extra={
			
 
				-                "account_id": account_id,
			
 
				-                "has_portrait": has_valid_portrait,
			
 
				-                "portrait_dimensions": list(portrait.keys()) if portrait else [],
			
 
				-                "duration_ms": duration_ms
			
 
				-            }
			
 
				-        )
			
 
				-
			
 
				-        return _log_return(
			
 
				-            _LABEL_ACCOUNT,
			
 
				-            call_params,
			
 
				-            ToolResult(
			
 
				-                title=f"账号粉丝画像: {account_id}",
			
 
				-                output="\n".join(summary_lines),
			
 
				-                long_term_memory=f"Fetched fans portrait for account '{account_id}'",
			
 
				-                metadata={
			
 
				-                    "raw_data": data,
			
 
				-                    "has_portrait": has_valid_portrait,
			
 
				-                    "portrait_data": portrait,
			
 
				-                },
			
 
				-            ),
			
 
				-        )
			
 
				-    except requests.exceptions.HTTPError as e:
			
 
				-        logger.error(
			
 
				-            "get_account_fans_portrait HTTP error",
			
 
				-            extra={
			
 
				-                "account_id": account_id,
			
 
				-                "status_code": e.response.status_code,
			
 
				-                "error": str(e)
			
 
				-            }
			
 
				-        )
			
 
				-        return _log_return(
			
 
				-            _LABEL_ACCOUNT,
			
 
				-            call_params,
			
 
				-            ToolResult(
			
 
				-                title="账号粉丝画像获取失败",
			
 
				-                output="",
			
 
				-                error=f"HTTP {e.response.status_code}: {e.response.text}",
			
 
				-            ),
			
 
				-        )
			
 
				-    except requests.exceptions.Timeout:
			
 
				-        logger.error("get_account_fans_portrait timeout", extra={"account_id": account_id, "timeout": request_timeout})
			
 
				-        return _log_return(
			
 
				-            _LABEL_ACCOUNT,
			
 
				-            call_params,
			
 
				-            ToolResult(
			
 
				-                title="账号粉丝画像获取失败",
			
 
				-                output="",
			
 
				-                error=f"请求超时（{request_timeout}秒）",
			
 
				-            ),
			
 
				-        )
			
 
				-    except requests.exceptions.RequestException as e:
			
 
				-        logger.error("get_account_fans_portrait network error", extra={"account_id": account_id, "error": str(e)})
			
 
				-        return _log_return(
			
 
				-            _LABEL_ACCOUNT,
			
 
				-            call_params,
			
 
				-            ToolResult(
			
 
				-                title="账号粉丝画像获取失败",
			
 
				-                output="",
			
 
				-                error=f"网络错误: {str(e)}",
			
 
				-            ),
			
 
				-        )
			
 
				-    except Exception as e:
			
 
				-        logger.error("get_account_fans_portrait unexpected error", extra={"account_id": account_id, "error": str(e)}, exc_info=True)
			
 
				-        return _log_return(
			
 
				-            _LABEL_ACCOUNT,
			
 
				-            call_params,
			
 
				-            ToolResult(
			
 
				-                title="账号粉丝画像获取失败",
			
 
				-                output="",
			
 
				-                error=f"未知错误: {str(e)}",
			
 
				-            ),
			
 
				-        )
			
 
				+            "has_portrait": ok["has_portrait"],
			
 
				+            "portrait_dimensions": list(ok["portrait_data"].keys()) if ok["portrait_data"] else [],
			
 
				+            "duration_ms": duration_ms,
			
 
				+        },
			
 
				+    )
			
 
				+    return _log_return(
			
 
				+        _LABEL_ACCOUNT,
			
 
				+        call_params,
			
 
				+        ToolResult(
			
 
				+            title=f"账号粉丝画像: {account_id}",
			
 
				+            output=ok["output"],
			
 
				+            long_term_memory=f"Fetched fans portrait for account '{account_id}'",
			
 
				+            metadata={
			
 
				+                "raw_data": ok["raw_data"],
			
 
				+                "has_portrait": ok["has_portrait"],
			
 
				+                "portrait_data": ok["portrait_data"],
			
 
				+            },
			
 
				+        ),
			
 
				+    )
			
 
				 
			
 
				 
			
 
				 @tool(description="获取抖音内容点赞用户画像（热点宝），支持选择画像维度")
			
@@ -320,176 +430,311 @@ async def get_content_fans_portrait(
 
				         "need_phone_price": need_phone_price,
			
 
				         "timeout": timeout,
			
 
				     }
			
 
				-
			
 
				-    # 验证 content_id 格式
			
 
				-    if not content_id or not isinstance(content_id, str):
			
 
				-        logger.error("get_content_fans_portrait invalid content_id", extra={"content_id": content_id})
			
 
				+    flags = _dimension_flags(
			
 
				+        need_province,
			
 
				+        need_city,
			
 
				+        need_city_level,
			
 
				+        need_gender,
			
 
				+        need_age,
			
 
				+        need_phone_brand,
			
 
				+        need_phone_price,
			
 
				+    )
			
 
				+    request_timeout = timeout if timeout is not None else DEFAULT_TIMEOUT
			
 
				+    err, ok = _sync_fetch_content_portrait(content_id, flags, request_timeout)
			
 
				+    duration_ms = int((time.time() - start_time) * 1000)
			
 
				+
			
 
				+    if err:
			
 
				+        logger.error("get_content_fans_portrait failed", extra={"content_id": content_id, "error": err})
			
 
				         return _log_return(
			
 
				             _LABEL_CONTENT,
			
 
				             call_params,
			
 
				             ToolResult(
			
 
				                 title="内容点赞用户画像获取失败",
			
 
				                 output="",
			
 
				-                error="content_id 参数无效：必须是非空字符串",
			
 
				+                error=err,
			
 
				             ),
			
 
				         )
			
 
				 
			
 
				-    # aweme_id 应该是纯数字字符串，长度约 19 位
			
 
				-    if not content_id.isdigit():
			
 
				-        logger.error("get_content_fans_portrait invalid aweme_id format", extra={"content_id": content_id})
			
 
				-        return _log_return(
			
 
				-            _LABEL_CONTENT,
			
 
				-            call_params,
			
 
				-            ToolResult(
			
 
				-                title="内容点赞用户画像获取失败",
			
 
				-                output="",
			
 
				-                error=f"content_id 格式错误：aweme_id 应该是纯数字，当前值: {content_id[:20]}...",
			
 
				-            ),
			
 
				-        )
			
 
				-
			
 
				-    if len(content_id) < 15 or len(content_id) > 25:
			
 
				-        logger.error("get_content_fans_portrait invalid aweme_id length", extra={"content_id": content_id, "length": len(content_id)})
			
 
				-        return _log_return(
			
 
				-            _LABEL_CONTENT,
			
 
				-            call_params,
			
 
				-            ToolResult(
			
 
				-                title="内容点赞用户画像获取失败",
			
 
				-                output="",
			
 
				-                error=f"content_id 长度异常：期望 15-25 位数字，实际 {len(content_id)} 位",
			
 
				-            ),
			
 
				-        )
			
 
				-
			
 
				-    try:
			
 
				-        payload = {
			
 
				+    assert ok is not None
			
 
				+    logger.info(
			
 
				+        "get_content_fans_portrait completed",
			
 
				+        extra={
			
 
				             "content_id": content_id,
			
 
				-            "need_province": need_province,
			
 
				-            "need_city": need_city,
			
 
				-            "need_city_level": need_city_level,
			
 
				-            "need_gender": need_gender,
			
 
				-            "need_age": need_age,
			
 
				-            "need_phone_brand": need_phone_brand,
			
 
				-            "need_phone_price": need_phone_price,
			
 
				-        }
			
 
				-
			
 
				-        request_timeout = timeout if timeout is not None else DEFAULT_TIMEOUT
			
 
				-
			
 
				-        response = requests.post(
			
 
				-            CONTENT_FANS_PORTRAIT_API,
			
 
				-            json=payload,
			
 
				-            headers={"Content-Type": "application/json"},
			
 
				-            timeout=request_timeout
			
 
				-        )
			
 
				-        response.raise_for_status()
			
 
				-        data = response.json()
			
 
				-
			
 
				-        data_block = data.get("data", {}) if isinstance(data.get("data"), dict) else {}
			
 
				-        portrait = data_block.get("data", {}) if isinstance(data_block.get("data"), dict) else {}
			
 
				+            "has_portrait": ok["has_portrait"],
			
 
				+            "portrait_dimensions": list(ok["portrait_data"].keys()) if ok["portrait_data"] else [],
			
 
				+            "duration_ms": duration_ms,
			
 
				+        },
			
 
				+    )
			
 
				+    return _log_return(
			
 
				+        _LABEL_CONTENT,
			
 
				+        call_params,
			
 
				+        ToolResult(
			
 
				+            title=f"内容点赞用户画像: {content_id}",
			
 
				+            output=ok["output"],
			
 
				+            long_term_memory=f"Fetched fans portrait for content '{content_id}'",
			
 
				+            metadata={
			
 
				+                "raw_data": ok["raw_data"],
			
 
				+                "has_portrait": ok["has_portrait"],
			
 
				+                "portrait_data": ok["portrait_data"],
			
 
				+            },
			
 
				+        ),
			
 
				+    )
			
 
				+
			
 
				+
			
 
				+@tool(
			
 
				+    description=(
			
 
				+        "批量获取多条候选视频的画像：工具内依次请求内容点赞画像；"
			
 
				+        "若无画像且允许兜底则再请求作者粉丝画像。一次调用返回所有条目，减少对话轮次。"
			
 
				+        "完整结构化结果在同一条 tool 消息的 metadata JSON 中，并写入 OUTPUT_DIR/<trace_id>/batch_portraits.json。"
			
 
				+    ),
			
 
				+    hidden_params=["context"],
			
 
				+)
			
 
				+async def batch_fetch_portraits(
			
 
				+    candidates_json: str,
			
 
				+    need_province: bool = False,
			
 
				+    need_city: bool = False,
			
 
				+    need_city_level: bool = False,
			
 
				+    need_gender: bool = False,
			
 
				+    need_age: bool = True,
			
 
				+    need_phone_brand: bool = False,
			
 
				+    need_phone_price: bool = False,
			
 
				+    timeout: Optional[float] = None,
			
 
				+    context: Optional[Dict[str, Any]] = None,
			
 
				+) -> ToolResult:
			
 
				+    """
			
 
				+    批量拉取内容画像并在规则允许时用账号画像兜底（单工具、多 HTTP 顺序请求）。
			
 
				 
			
 
				-        # 格式化输出摘要
			
 
				-        summary_lines = [f"内容 {content_id} 的点赞用户画像"]
			
 
				-        summary_lines.append(f"画像链接：https://douhot.douyin.com/video/detail?active_tab=video_fans&video_id={content_id}")
			
 
				-        summary_lines.append("")
			
 
				+    Args:
			
 
				+        candidates_json: JSON 数组字符串。每项为对象，字段：
			
 
				+            - aweme_id (必填): 视频 id
			
 
				+            - author_sec_uid (可选): 作者 sec_uid，兜底时需要
			
 
				+            - try_account_fallback (可选，默认 true): 为 false 时不请求账号画像
			
 
				+              （对应来自 douyin_user_videos 的条目，与单条工具规则一致）
			
 
				+        need_* / timeout: 与各单条画像工具一致
			
 
				 
			
 
				-        for k, v in portrait.items():
			
 
				-            if not isinstance(v, dict):
			
 
				-                continue
			
 
				-            if k in ("省份", "城市"):
			
 
				-                summary_lines.append(f"【{k} TOP5】分布")
			
 
				-                items = _top_k(v, 5)
			
 
				-            else:
			
 
				-                summary_lines.append(f"【{k}】分布")
			
 
				-                items = v.items()
			
 
				-
			
 
				-            for name, metrics in items:
			
 
				-                ratio = metrics.get("percentage")
			
 
				-                tgi = metrics.get("preference")
			
 
				-                summary_lines.append(f"  {name}: {ratio} (偏好度: {tgi})")
			
 
				-            summary_lines.append("")
			
 
				-
			
 
				-        duration_ms = int((time.time() - start_time) * 1000)
			
 
				-        has_valid_portrait = bool(portrait and any(
			
 
				-            isinstance(v, dict) and v for v in portrait.values()
			
 
				-        ))
			
 
				-
			
 
				-        logger.info(
			
 
				-            "get_content_fans_portrait completed",
			
 
				-            extra={
			
 
				-                "content_id": content_id,
			
 
				-                "has_portrait": has_valid_portrait,
			
 
				-                "portrait_dimensions": list(portrait.keys()) if portrait else [],
			
 
				-                "duration_ms": duration_ms
			
 
				-            }
			
 
				-        )
			
 
				+    Returns:
			
 
				+        ToolResult.output: 人类可读的分条摘要
			
 
				+        metadata.results: 与 candidates 顺序一致的列表，每项含 content / account 子对象；
			
 
				+            通过 ToolResult.include_metadata_in_llm 会进入本轮 tool 消息正文（JSON），无需从 log 猜测。
			
 
				+        metadata.snapshot_path: 落盘文件绝对路径（若写入成功）
			
 
				 
			
 
				+    Note:
			
 
				+        context 由 Runner 注入，含 trace_id，用于写入 batch_portraits.json。
			
 
				+    """
			
 
				+    call_params: Dict[str, Any] = {
			
 
				+        "candidates_json": candidates_json[:2000] + ("..." if len(candidates_json) > 2000 else ""),
			
 
				+        "need_age": need_age,
			
 
				+        "timeout": timeout,
			
 
				+    }
			
 
				+    raw = (candidates_json or "").strip()
			
 
				+    if not raw:
			
 
				         return _log_return(
			
 
				-            _LABEL_CONTENT,
			
 
				+            _LABEL_BATCH,
			
 
				             call_params,
			
 
				-            ToolResult(
			
 
				-                title=f"内容点赞用户画像: {content_id}",
			
 
				-                output="\n".join(summary_lines),
			
 
				-                long_term_memory=f"Fetched fans portrait for content '{content_id}'",
			
 
				-                metadata={
			
 
				-                    "raw_data": data,
			
 
				-                    "has_portrait": has_valid_portrait,
			
 
				-                    "portrait_data": portrait,
			
 
				-                },
			
 
				-            ),
			
 
				+            ToolResult(title="批量画像失败", output="", error="candidates_json 为空"),
			
 
				         )
			
 
				-    except requests.exceptions.HTTPError as e:
			
 
				-        logger.error(
			
 
				-            "get_content_fans_portrait HTTP error",
			
 
				-            extra={
			
 
				-                "content_id": content_id,
			
 
				-                "status_code": e.response.status_code,
			
 
				-                "error": str(e)
			
 
				-            }
			
 
				-        )
			
 
				-        return _log_return(
			
 
				-            _LABEL_CONTENT,
			
 
				-            call_params,
			
 
				-            ToolResult(
			
 
				-                title="内容点赞用户画像获取失败",
			
 
				-                output="",
			
 
				-                error=f"HTTP {e.response.status_code}: {e.response.text}",
			
 
				-            ),
			
 
				-        )
			
 
				-    except requests.exceptions.Timeout:
			
 
				-        logger.error("get_content_fans_portrait timeout", extra={"content_id": content_id, "timeout": request_timeout})
			
 
				+    try:
			
 
				+        parsed = json.loads(raw)
			
 
				+    except json.JSONDecodeError as e:
			
 
				         return _log_return(
			
 
				-            _LABEL_CONTENT,
			
 
				+            _LABEL_BATCH,
			
 
				             call_params,
			
 
				             ToolResult(
			
 
				-                title="内容点赞用户画像获取失败",
			
 
				+                title="批量画像失败",
			
 
				                 output="",
			
 
				-                error=f"请求超时（{request_timeout}秒）",
			
 
				+                error=f"candidates_json 不是合法 JSON: {e}",
			
 
				             ),
			
 
				         )
			
 
				-    except requests.exceptions.RequestException as e:
			
 
				-        logger.error("get_content_fans_portrait network error", extra={"content_id": content_id, "error": str(e)})
			
 
				+    if not isinstance(parsed, list):
			
 
				         return _log_return(
			
 
				-            _LABEL_CONTENT,
			
 
				+            _LABEL_BATCH,
			
 
				             call_params,
			
 
				-            ToolResult(
			
 
				-                title="内容点赞用户画像获取失败",
			
 
				-                output="",
			
 
				-                error=f"网络错误: {str(e)}",
			
 
				-            ),
			
 
				+            ToolResult(title="批量画像失败", output="", error="candidates_json 必须是 JSON 数组"),
			
 
				         )
			
 
				-    except Exception as e:
			
 
				-        logger.error("get_content_fans_portrait unexpected error", extra={"content_id": content_id, "error": str(e)}, exc_info=True)
			
 
				+    if len(parsed) > BATCH_MAX_ITEMS:
			
 
				         return _log_return(
			
 
				-            _LABEL_CONTENT,
			
 
				+            _LABEL_BATCH,
			
 
				             call_params,
			
 
				             ToolResult(
			
 
				-                title="内容点赞用户画像获取失败",
			
 
				+                title="批量画像失败",
			
 
				                 output="",
			
 
				-                error=f"未知错误: {str(e)}",
			
 
				+                error=f"条目数超过上限 {BATCH_MAX_ITEMS}，请分批调用",
			
 
				             ),
			
 
				         )
			
 
				 
			
 
				-def _top_k(items: Dict[str, Any], k: int) -> List[Tuple[str, Any]]:
			
 
				-    def percent_value(entry: Tuple[str, Any]) -> float:
			
 
				-        metrics = entry[1] if isinstance(entry[1], dict) else {}
			
 
				-        return metrics.get("percentage")
			
 
				+    flags = _dimension_flags(
			
 
				+        need_province,
			
 
				+        need_city,
			
 
				+        need_city_level,
			
 
				+        need_gender,
			
 
				+        need_age,
			
 
				+        need_phone_brand,
			
 
				+        need_phone_price,
			
 
				+    )
			
 
				+    request_timeout = timeout if timeout is not None else DEFAULT_TIMEOUT
			
 
				+
			
 
				+    results: List[Dict[str, Any]] = []
			
 
				+    output_chunks: List[str] = []
			
 
				+
			
 
				+    for idx, entry in enumerate(parsed):
			
 
				+        if not isinstance(entry, dict):
			
 
				+            results.append(
			
 
				+                {
			
 
				+                    "aweme_id": None,
			
 
				+                    "error": "条目不是对象",
			
 
				+                    "content": None,
			
 
				+                    "account": None,
			
 
				+                }
			
 
				+            )
			
 
				+            output_chunks.append(f"[{idx}] 跳过：条目不是 JSON 对象")
			
 
				+            continue
			
 
				+
			
 
				+        aweme_id = entry.get("aweme_id") or entry.get("content_id")
			
 
				+        author_sec = entry.get("author_sec_uid") or entry.get("account_id")
			
 
				+        try_fallback = entry.get("try_account_fallback", True)
			
 
				+        if isinstance(try_fallback, str):
			
 
				+            try_fallback = try_fallback.strip().lower() in ("1", "true", "yes")
			
 
				+
			
 
				+        if not aweme_id or not isinstance(aweme_id, str):
			
 
				+            results.append(
			
 
				+                {
			
 
				+                    "aweme_id": aweme_id,
			
 
				+                    "error": "缺少 aweme_id",
			
 
				+                    "content": None,
			
 
				+                    "account": None,
			
 
				+                }
			
 
				+            )
			
 
				+            output_chunks.append(f"[{idx}] 跳过：缺少 aweme_id")
			
 
				+            continue
			
 
				+
			
 
				+        item_result: Dict[str, Any] = {
			
 
				+            "aweme_id": aweme_id,
			
 
				+            "author_sec_uid": author_sec if isinstance(author_sec, str) else None,
			
 
				+            "try_account_fallback": bool(try_fallback),
			
 
				+            "content": None,
			
 
				+            "account": None,
			
 
				+            "error": None,
			
 
				+        }
			
 
				 
			
 
				-    return sorted(items.items(), key=percent_value, reverse=True)[:k]
			
 
				+        cerr, cok = _sync_fetch_content_portrait(aweme_id, flags, request_timeout)
			
 
				+        if cerr:
			
 
				+            item_result["content"] = {
			
 
				+                "ok": False,
			
 
				+                "error": cerr,
			
 
				+                "has_portrait": False,
			
 
				+                "portrait_data": {},
			
 
				+            }
			
 
				+        else:
			
 
				+            assert cok is not None
			
 
				+            item_result["content"] = {
			
 
				+                "ok": True,
			
 
				+                "error": None,
			
 
				+                "has_portrait": cok["has_portrait"],
			
 
				+                "portrait_data": cok["portrait_data"],
			
 
				+                "output": cok["output"],
			
 
				+            }
			
 
				+
			
 
				+        c_block = item_result["content"]
			
 
				+        content_has = bool(c_block and c_block.get("has_portrait"))
			
 
				+        need_account = bool(try_fallback) and not content_has
			
 
				+        if need_account:
			
 
				+            if not author_sec or not isinstance(author_sec, str):
			
 
				+                item_result["account"] = {
			
 
				+                    "attempted": False,
			
 
				+                    "skipped_reason": "缺少 author_sec_uid，无法账号兜底",
			
 
				+                    "has_portrait": False,
			
 
				+                    "portrait_data": {},
			
 
				+                }
			
 
				+            else:
			
 
				+                aerr, aok = _sync_fetch_account_portrait(author_sec, flags, request_timeout)
			
 
				+                if aerr:
			
 
				+                    item_result["account"] = {
			
 
				+                        "attempted": True,
			
 
				+                        "error": aerr,
			
 
				+                        "has_portrait": False,
			
 
				+                        "portrait_data": {},
			
 
				+                    }
			
 
				+                else:
			
 
				+                    assert aok is not None
			
 
				+                    item_result["account"] = {
			
 
				+                        "attempted": True,
			
 
				+                        "error": None,
			
 
				+                        "has_portrait": aok["has_portrait"],
			
 
				+                        "portrait_data": aok["portrait_data"],
			
 
				+                        "output": aok["output"],
			
 
				+                    }
			
 
				+        else:
			
 
				+            skip_reason = (
			
 
				+                "try_account_fallback 为 false（如 douyin_user_videos 来源）"
			
 
				+                if not try_fallback
			
 
				+                else "内容侧已有有效画像，无需账号兜底"
			
 
				+            )
			
 
				+            item_result["account"] = {
			
 
				+                "attempted": False,
			
 
				+                "skipped_reason": skip_reason,
			
 
				+                "has_portrait": False,
			
 
				+                "portrait_data": {},
			
 
				+            }
			
 
				+
			
 
				+        results.append(item_result)
			
 
				+        # 压缩每条在 output 中的篇幅
			
 
				+        c_part = item_result["content"] or {}
			
 
				+        a_part = item_result["account"] or {}
			
 
				+        line = (
			
 
				+            f"[{idx}] aweme_id={aweme_id} "
			
 
				+            f"content_has_portrait={c_part.get('has_portrait')} "
			
 
				+            f"account_attempted={a_part.get('attempted')} "
			
 
				+            f"account_has_portrait={a_part.get('has_portrait')}"
			
 
				+        )
			
 
				+        output_chunks.append(line)
			
 
				+
			
 
				+    full_text = "\n".join(output_chunks)
			
 
				+    trace_id = None
			
 
				+    if isinstance(context, dict):
			
 
				+        tid = context.get("trace_id")
			
 
				+        if isinstance(tid, str) and tid.strip():
			
 
				+            trace_id = tid.strip()
			
 
				+    snapshot_path = _persist_batch_portraits_json(trace_id, results, len(results))
			
 
				+
			
 
				+    out_display = (os.getenv("OUTPUT_DIR") or ".cache/output").strip()
			
 
				+    rel_hint = (
			
 
				+        f"{out_display}/{trace_id}/{_BATCH_SNAPSHOT_NAME}"
			
 
				+        if trace_id
			
 
				+        else f"{out_display}/<trace_id>/{_BATCH_SNAPSHOT_NAME}"
			
 
				+    )
			
 
				+    meta_hint = (
			
 
				+        "\n\n本条 tool 消息在标题与摘要后附有 ## metadata (JSON)，其中 results 含每条 "
			
 
				+        "content/account 的 has_portrait 与 portrait_data；若上下文被压缩，可用 read_file 读取："
			
 
				+        f" {rel_hint}"
			
 
				+        + (f"（本机路径: {snapshot_path}）" if snapshot_path else "")
			
 
				+    )
			
 
				+    output_body = full_text + meta_hint
			
 
				+
			
 
				+    logger.info(
			
 
				+        "batch_fetch_portraits completed",
			
 
				+        extra={
			
 
				+            "count": len(results),
			
 
				+            "candidates": len(parsed),
			
 
				+            "trace_id": trace_id,
			
 
				+            "snapshot_path": snapshot_path,
			
 
				+        },
			
 
				+    )
			
 
				+
			
 
				+    meta: Dict[str, Any] = {
			
 
				+        "results": results,
			
 
				+        "count": len(results),
			
 
				+    }
			
 
				+    if snapshot_path:
			
 
				+        meta["snapshot_path"] = snapshot_path
			
 
				+
			
 
				+    return _log_return(
			
 
				+        _LABEL_BATCH,
			
 
				+        call_params,
			
 
				+        ToolResult(
			
 
				+            title=f"批量画像完成 ({len(results)} 条)",
			
 
				+            output=output_body,
			
 
				+            long_term_memory=f"Batch portrait fetch for {len(results)} items",
			
 
				+            metadata=meta,
			
 
				+            include_metadata_in_llm=True,
			
 
				+        ),
			
 
				+    )
			
--- a/examples/content_finder/utils/tool_logging.py
+++ b/examples/content_finder/utils/tool_logging.py
@@ -39,6 +39,18 @@ def format_tool_result_for_log(result: Any) -> str:
 
				     md = getattr(result, "metadata", None)
			
 
				     if isinstance(md, dict) and md:
			
 
				         payload["metadata_keys"] = list(md.keys())
			
 
				+        # 批量画像等：log 里仅列 keys 会导致排障困难，附加 results 摘要（仍可能较长故截断）
			
 
				+        if "results" in md and isinstance(md["results"], list):
			
 
				+            try:
			
 
				+                rs = json.dumps(md["results"], ensure_ascii=False)
			
 
				+            except (TypeError, ValueError):
			
 
				+                rs = str(md["results"])
			
 
				+            max_rs = 24_000
			
 
				+            payload["metadata_results"] = (
			
 
				+                rs if len(rs) <= max_rs else rs[:max_rs] + "\n...(truncated)"
			
 
				+            )
			
 
				+        if isinstance(md.get("snapshot_path"), str):
			
 
				+            payload["snapshot_path"] = md["snapshot_path"]
			
 
				     return json.dumps(payload, ensure_ascii=False)