hai 1 semana · 0bb4664a90
--- a/examples/mode_workflow/stages/query_score.py
+++ b/examples/mode_workflow/stages/query_score.py
@@ -0,0 +1,184 @@
 
															+# -*- coding: utf-8 -*-
														
 
															+"""Query 正交格评分 · 对 judged_matrix 的 tier≥1 格(动作×类型)在当前维度上下文下用 Sonnet 打分,
														
 
															+挑出有意义、人话、有助于内容制作知识库目的的组合。结果原子写 .cache/query_score/<sel>.json。
														
 
															+
														
 
															+由 server.py /api/query_score 起子进程调;也可独立跑:
														
 
															+  python stages/query_score.py --tool-type AI --modality 图片 --suffix 怎么做 \
														
 
															+      --substance-path 表象,实体 --form-path 呈现,视觉 --sel adhoc --dry-run
														
 
															+"""
														
 
															+import argparse
														
 
															+import asyncio
														
 
															+import json
														
 
															+import re
														
 
															+import sys
														
 
															+from pathlib import Path
														
 
															+
														
 
															+PROJECT_ROOT = Path(__file__).resolve().parents[3]   # …/Agent
														
 
															+sys.path.insert(0, str(PROJECT_ROOT))
														
 
															+
														
 
															+from dotenv import load_dotenv
														
 
															+load_dotenv()
														
 
															+
														
 
															+HERE = Path(__file__).resolve().parent
														
 
															+MW = HERE.parent
														
 
															+MATRIX_FILE = MW / "reference" / "judged_matrix.json"
														
 
															+PROMPT_FILE = MW / "prompts" / "query_score_system.md"
														
 
															+CACHE_DIR = MW / ".cache" / "query_score"
														
 
															+DEFAULT_MODEL = "anthropic/claude-sonnet-4-6"
														
 
															+BATCH = 40
														
 
															+CONCURRENCY = 5
														
 
															+
														
 
															+
														
 
															+def _build_cells(matrix, tool_type, modality, suffix):
														
 
															+    """筛 tier≥1 格,产出 [{a_idx,t_idx,action,type,tier,query}]。
														
 
															+    query = [工具类型] 动作叶 类型叶 [模态] [后缀],"无"/空跳过。"""
														
 
															+    actions, types, grid = matrix["actions"], matrix["types"], matrix["matrix"]
														
 
															+    pre, mod, suf = (tool_type or "").strip(), (modality or "").strip(), (suffix or "").strip()
														
 
															+    cells = []
														
 
															+    for ai, arow in enumerate(grid):
														
 
															+        action = actions[ai]["name"]
														
 
															+        for ti, cell in enumerate(arow):
														
 
															+            if cell.get("tier", 0) < 1:
														
 
															+                continue
														
 
															+            typ = types[ti]["name"]
														
 
															+            parts = [p for p in (pre, action, typ, mod, suf) if p and p != "无"]
														
 
															+            cells.append({"a_idx": ai, "t_idx": ti, "action": action,
														
 
															+                          "type": typ, "tier": cell["tier"], "query": " ".join(parts)})
														
 
															+    return cells
														
 
															+
														
 
															+
														
 
															+def _build_user(batch, ctx):
														
 
															+    lines = [f'{i}. "{c["query"]}"   (动作={c["action"]} 类型={c["type"]} 内容树tier={c["tier"]})'
														
 
															+             for i, c in enumerate(batch)]
														
 
															+    sub = (ctx["substance"] or "无").replace(",", "›")
														
 
															+    form = (ctx["form"] or "无").replace(",", "›")
														
 
															+    return (f"【固定上下文(本批共享)】\n"
														
 
															+            f"工具类型: {ctx['tool_type'] or '无'}   模态: {ctx['modality'] or '无'}   后缀: {ctx['suffix'] or '无'}\n"
														
 
															+            f"(实质/形式不参与拼词，仅供理解领域定位: 实质路径={sub}  形式路径={form})\n\n"
														
 
															+            f"【候选列表】每条 = 动作 + 类型 + 上下文词拼成的 query:\n" + "\n".join(lines))
														
 
															+
														
 
															+
														
 
															+async def _call_with_retry(llm_call, messages, model, task_name, max_retries=3):
														
 
															+    """直接调 llm_call 并解析 JSON 数组(call_llm_with_retry 的正则只捕获 {…},不适用数组)。"""
														
 
															+    total_cost = 0.0
														
 
															+    last_err = None
														
 
															+    cur_messages = list(messages)
														
 
															+    for attempt in range(max_retries):
														
 
															+        if attempt > 0 and last_err:
														
 
															+            cur_messages = list(messages) + [
														
 
															+                {"role": "user",
														
 
															+                 "content": f"上次输出未通过校验：{last_err}\n请重新输出完整 JSON 数组，不含其他内容。"}]
														
 
															+            print(f"   [{task_name}] Retry {attempt}/{max_retries - 1}: {last_err[:80]}...")
														
 
															+        try:
														
 
															+            resp = await llm_call(messages=cur_messages, model=model,
														
 
															+                                  temperature=0.1, max_tokens=4000)
														
 
															+            cost = resp.get("cost") or 0.0
														
 
															+            total_cost += cost
														
 
															+            content = resp.get("content", "")
														
 
															+            if isinstance(content, list):
														
 
															+                first = content[0] if content else ""
														
 
															+                content = first.get("text", "") if isinstance(first, dict) else str(first)
														
 
															+            # 提取 JSON 数组(支持裸数组和 markdown 围栏包裹)
														
 
															+            arr_match = re.search(r"\[[\s\S]*\]", content)
														
 
															+            if not arr_match:
														
 
															+                last_err = "LLM 输出中未找到 JSON 数组"
														
 
															+                continue
														
 
															+            try:
														
 
															+                data = json.loads(arr_match.group())
														
 
															+            except json.JSONDecodeError as e:
														
 
															+                last_err = f"JSON 解析失败: {e}"
														
 
															+                continue
														
 
															+            if not isinstance(data, list):
														
 
															+                last_err = "需 JSON 数组"
														
 
															+                continue
														
 
															+            return data, total_cost
														
 
															+        except Exception as e:
														
 
															+            last_err = f"LLM 调用异常: {type(e).__name__}: {e}"
														
 
															+            print(f"   [{task_name}] Error: {last_err}")
														
 
															+    print(f"   [{task_name}] All {max_retries} attempts failed. Last error: {last_err}")
														
 
															+    return None, total_cost
														
 
															+
														
 
															+
														
 
															+async def _score_batch(batch, ctx, system, llm_call, model, sem):
														
 
															+    messages = [{"role": "system", "content": system},
														
 
															+                {"role": "user", "content": _build_user(batch, ctx)}]
														
 
															+    task_name = f"QueryScore[{batch[0]['query'][:12]}]"
														
 
															+    async with sem:
														
 
															+        data, cost = await _call_with_retry(llm_call, messages, model, task_name)
														
 
															+    out = {}
														
 
															+    for v in (data or []):
														
 
															+        if not isinstance(v, dict):
														
 
															+            continue
														
 
															+        i = v.get("idx")
														
 
															+        if not isinstance(i, int) or not (0 <= i < len(batch)):
														
 
															+            continue
														
 
															+        c = batch[i]
														
 
															+        try:
														
 
															+            score = round(float(v.get("natural")) * 0.4 + float(v.get("findable")) * 0.3
														
 
															+                          + float(v.get("useful")) * 0.3, 1)
														
 
															+        except (TypeError, ValueError):
														
 
															+            score = None
														
 
															+        out[f"{c['a_idx']}_{c['t_idx']}"] = {
														
 
															+            "query": c["query"], "natural": v.get("natural"), "findable": v.get("findable"),
														
 
															+            "useful": v.get("useful"), "keep": bool(v.get("keep")),
														
 
															+            "rewrite": (v.get("rewrite") or c["query"]), "reason": v.get("reason", ""),
														
 
															+            "score": score}
														
 
															+    return out, cost
														
 
															+
														
 
															+
														
 
															+async def run(args):
														
 
															+    matrix = json.loads(MATRIX_FILE.read_text(encoding="utf-8"))
														
 
															+    ctx = {"tool_type": args.tool_type, "modality": args.modality, "suffix": args.suffix,
														
 
															+           "substance": args.substance_path, "form": args.form_path}
														
 
															+    cells = _build_cells(matrix, args.tool_type, args.modality, args.suffix)
														
 
															+    if args.limit:
														
 
															+        cells = cells[:args.limit]
														
 
															+    print(f"📋 tier≥1 候选 {len(cells)} 格" + (f" (--limit {args.limit})" if args.limit else ""))
														
 
															+    if args.dry_run:
														
 
															+        for c in cells[:10]:
														
 
															+            print(f"  [{c['tier']}] {c['query']}")
														
 
															+        print(f"…共 {len(cells)} 格(dry-run,未调 LLM)")
														
 
															+        return 0
														
 
															+
														
 
															+    system = PROMPT_FILE.read_text(encoding="utf-8")
														
 
															+    from agent.llm.openrouter import create_openrouter_llm_call
														
 
															+    llm_call = create_openrouter_llm_call(model=args.model)
														
 
															+    sem = asyncio.Semaphore(CONCURRENCY)
														
 
															+    batches = [cells[i:i + BATCH] for i in range(0, len(cells), BATCH)]
														
 
															+    print(f"🤖 {len(batches)} 批 × ≤{BATCH} 格 · 并发 {CONCURRENCY} · 模型 {args.model}")
														
 
															+    results = await asyncio.gather(*[
														
 
															+        _score_batch(b, ctx, system, llm_call, args.model, sem) for b in batches])
														
 
															+    merged, cost = {}, 0.0
														
 
															+    for cmap, c in results:
														
 
															+        merged.update(cmap)
														
 
															+        cost += c
														
 
															+    kept = sum(1 for v in merged.values() if v.get("keep"))
														
 
															+    out = {"sel": ctx, "model": args.model, "kept": kept, "total": len(merged),
														
 
															+           "cost_usd": round(cost, 4), "cells": merged}
														
 
															+    CACHE_DIR.mkdir(parents=True, exist_ok=True)
														
 
															+    dest = CACHE_DIR / f"{args.sel}.json"
														
 
															+    tmp = dest.with_suffix(".tmp")
														
 
															+    tmp.write_text(json.dumps(out, ensure_ascii=False, indent=2), encoding="utf-8")
														
 
															+    tmp.replace(dest)   # 原子落盘,避免前端读到半截
														
 
															+    print(f"✅ 评分完成 {len(merged)} 格 · keep {kept} · ${cost:.4f} → {dest.name}")
														
 
															+    return 0
														
 
															+
														
 
															+
														
 
															+def main():
														
 
															+    p = argparse.ArgumentParser(description="Query 正交格评分(tier≥1 × 当前维度 → Sonnet 打分)")
														
 
															+    p.add_argument("--tool-type", default="")
														
 
															+    p.add_argument("--modality", default="")
														
 
															+    p.add_argument("--suffix", default="")
														
 
															+    p.add_argument("--substance-path", default="", help="实质祖先路径,逗号分隔(仅作上下文)")
														
 
															+    p.add_argument("--form-path", default="", help="形式祖先路径,逗号分隔(仅作上下文)")
														
 
															+    p.add_argument("--model", default=DEFAULT_MODEL)
														
 
															+    p.add_argument("--sel", default="adhoc", help="缓存文件名(server 传 sel_hash)")
														
 
															+    p.add_argument("--limit", type=int, default=None, help="只评前 N 格(调试)")
														
 
															+    p.add_argument("--dry-run", action="store_true", help="只拼词打印,不调 LLM、不落盘")
														
 
															+    p.add_argument("--force", action="store_true", help="(占位)缓存短路在 server 侧,本脚本恒重算")
														
 
															+    args = p.parse_args()
														
 
															+    raise SystemExit(asyncio.run(run(args)))
														
 
															+
														
 
															+
														
 
															+if __name__ == "__main__":
														
 
															+    main()