server.py 49 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031
  1. # -*- coding: utf-8 -*-
  2. """搜索评估案例查看 server。
  3. 沿用 图文排版搜索评估.html 的版式(卡片 + dialog 详情 + rubric 评分条),
  4. 数据实时扫描 runs_full/*/form_*.json —— runs_full 下每新增一个 q 文件夹,刷新即出现。
  5. 分页:query → 三种形式(A/B/C) → 三个渠道 三行从上到下。
  6. 用法:python server.py [port] 默认 8770,浏览器开 http://0.0.0.0:8770
  7. """
  8. import json, re, glob, sys, pathlib, subprocess, threading
  9. from datetime import datetime
  10. from http.server import BaseHTTPRequestHandler, ThreadingHTTPServer
  11. from urllib.parse import urlparse, parse_qs
  12. try: # Windows 控制台默认 cp1252,中文 print 会崩,统一切 utf-8
  13. sys.stdout.reconfigure(encoding="utf-8")
  14. except Exception:
  15. pass
  16. HERE = pathlib.Path(__file__).parent
  17. sys.path.insert(0, str(HERE))
  18. sys.path.insert(0, str(HERE.parent)) # fixed_query_eval:让兄弟模块 batch_extract_procedures 可 import
  19. PORT = int(sys.argv[1]) if len(sys.argv) > 1 else 8770
  20. PLAT = {"xhs": "小红书", "gzh": "公众号", "zhihu": "知乎", "x": "X", "bili": "B站", "douyin": "抖音",
  21. "sph": "视频号", "youtube": "YouTube", "github": "GitHub", "toutiao": "头条", "weibo": "微博"}
  22. KT = {"procedure": "工序", "step": "步骤", "tool": "工具"}
  23. # 从 taxonomy 取动作叶子/类型名,用于把 original_q 解析回原始维度(动作×类型 正交)
  24. # 路径优先级:search_eval/evaluation/(主源,IDE 编辑那份就是 runtime 实际读的)
  25. # → test_script/evaluation/(历史副本兜底)→ script/evaluation/(更老兜底)
  26. # 谁也找不到时整目录扫空,server 仍能起。
  27. EVALDIR = HERE / "evaluation"
  28. if not EVALDIR.exists():
  29. EVALDIR = HERE.parent.parent / "test_script" / "evaluation"
  30. if not EVALDIR.exists():
  31. EVALDIR = HERE.parent / "evaluation"
  32. try:
  33. _jm = json.load(open(EVALDIR / "judged_matrix.json", encoding="utf-8"))
  34. ACT_L1 = {a["name"]: a["l1"] for a in _jm["actions"]}
  35. ACTION_SET = set(ACT_L1)
  36. TYPE_SET = {t["name"] for t in _jm["types"]}
  37. ACTIONS_TAX = [{"name": a["name"], "l1": a["l1"], "l2": a.get("l2", "")} for a in _jm["actions"]]
  38. TYPES_TAX = [{"name": t["name"], "l1": t["l1"]} for t in _jm["types"]]
  39. # taxonomy 顺序沿用 judged_matrix(严格版);矩阵分值改用 type_action_scores(宽松版) —
  40. # 两份是同一组 27×50 cell 的独立 gemini judging,前者只 53 格到 tier3,后者 156 格到 score3
  41. _tas = json.load(open(EVALDIR / "type_action_scores.json", encoding="utf-8"))["scores"]
  42. _MATRIX = []
  43. for a in _jm["actions"]:
  44. row = []
  45. for t in _jm["types"]:
  46. rec = _tas.get(t["name"], {}).get(a["name"])
  47. row.append({"tier": rec["score"], "r": rec.get("reason", "")} if rec else {})
  48. _MATRIX.append(row)
  49. except Exception:
  50. ACT_L1, ACTION_SET, TYPE_SET, ACTIONS_TAX, TYPES_TAX, _MATRIX = {}, set(), set(), [], [], []
  51. ACTIVE_TASKS = {}
  52. ACTIVE_REEVALS = {}
  53. from batch_extract_procedures import _short_case, _source_to_dsl_input, _write_meta, _composite_score
  54. def run_extraction_task(q, folder_name, src_path, out_dir, engine, model):
  55. task_key = f"{q}/{folder_name}"
  56. log_path = out_dir / "_extract.log"
  57. try:
  58. out_dir.mkdir(parents=True, exist_ok=True)
  59. if engine == "cyber_runner":
  60. script_path = HERE / "procedure-dsl" / "run_cyber.py"
  61. else:
  62. script_path = HERE / "procedure-dsl" / "run_procedure_dsl.py"
  63. cmd = [
  64. sys.executable, "-u", str(script_path),
  65. str(src_path),
  66. "--out-dir", str(out_dir),
  67. "--model", model,
  68. "--max-turns", "300"
  69. ]
  70. if engine != "cyber_runner":
  71. cmd.extend(["--max-retries", "3"])
  72. flags = subprocess.CREATE_NEW_PROCESS_GROUP if sys.platform == "win32" else 0
  73. with open(log_path, "w", encoding="utf-8", buffering=1) as log_fh:
  74. proc = subprocess.Popen(cmd, stdout=log_fh, stderr=subprocess.STDOUT,
  75. cwd=str(HERE), creationflags=flags)
  76. ACTIVE_TASKS[task_key]["pid"] = proc.pid
  77. proc.wait()
  78. if proc.returncode == 0:
  79. try:
  80. import build_workflows
  81. build_workflows.write_one(q, folder_name, runs_dir=HERE / "runs_full")
  82. ACTIVE_TASKS[task_key]["status"] = "success"
  83. except Exception as ex:
  84. ACTIVE_TASKS[task_key]["status"] = "failed"
  85. ACTIVE_TASKS[task_key]["error"] = f"Workflow compilation failed: {ex}"
  86. with open(log_path, "a", encoding="utf-8") as f_err:
  87. f_err.write(f"\n[server error] Workflow compilation failed: {ex}\n")
  88. else:
  89. ACTIVE_TASKS[task_key]["status"] = "failed"
  90. ACTIVE_TASKS[task_key]["error"] = f"Runner failed with exit code {proc.returncode}"
  91. except Exception as e:
  92. ACTIVE_TASKS[task_key]["status"] = "failed"
  93. ACTIVE_TASKS[task_key]["error"] = str(e)
  94. try:
  95. with open(log_path, "a", encoding="utf-8") as f_err:
  96. f_err.write(f"\n[server error] Extraction failed: {e}\n")
  97. except Exception:
  98. pass
  99. # ── 工具解构(fixed_query_eval 新增)──────────────────────────────────────────────
  100. # 单次 LLM 调用(gemini-3.1-flash-lite)即可,比工序解构(多轮 agent)轻得多。
  101. # 仍走 subprocess(tool_extract.py),让 LLM 重依赖留在子进程,server 本身保持轻量。
  102. TOOL_TASKS = {} # {q: {"status", "case_ids", "error", "start_time"}}
  103. def run_tool_extraction_task(q, case_ids, force, model=None):
  104. log_path = HERE / "runs_full" / q / "tools" / "_extract.log"
  105. try:
  106. log_path.parent.mkdir(parents=True, exist_ok=True)
  107. cmd = [sys.executable, "-u", str(HERE / "tool_extract.py"),
  108. "--q", q, "--case-ids", ",".join(case_ids)]
  109. if force:
  110. cmd.append("--force")
  111. if model:
  112. cmd += ["--model", model]
  113. flags = subprocess.CREATE_NEW_PROCESS_GROUP if sys.platform == "win32" else 0
  114. with open(log_path, "w", encoding="utf-8", buffering=1) as log_fh:
  115. proc = subprocess.Popen(cmd, stdout=log_fh, stderr=subprocess.STDOUT,
  116. cwd=str(HERE), creationflags=flags)
  117. TOOL_TASKS[q]["pid"] = proc.pid
  118. proc.wait()
  119. TOOL_TASKS[q]["status"] = "success" if proc.returncode == 0 else "failed"
  120. if proc.returncode != 0:
  121. TOOL_TASKS[q]["error"] = f"tool_extract exit code {proc.returncode}"
  122. except Exception as e:
  123. TOOL_TASKS[q]["status"] = "failed"
  124. TOOL_TASKS[q]["error"] = str(e)
  125. MODSET = {"文", "图", "视频", "音频"}
  126. TOOLQUAL = {"AI": "AI 模型", "软件": "桌面 APP", "电脑端": "桌面 APP", "在线": "云端 Web",
  127. "网页版": "云端 Web", "代码": "API·CLI", "命令行": "API·CLI", "插件": "插件扩展"}
  128. def parse_dims(oq):
  129. """把组合 query(如 '文 元素生成 提示词 教程')解析回 {动作, 类型, 动作L1, 约束}。"""
  130. toks = (oq or "").split()
  131. action = next((t for t in toks if t in ACTION_SET), None)
  132. type_ = next((t for t in toks if t in TYPE_SET), None)
  133. cons = None
  134. if toks:
  135. t0 = toks[0]
  136. if t0 in MODSET:
  137. cons = {"kind": "模态", "value": t0}
  138. elif t0 in TOOLQUAL:
  139. cons = {"kind": "工具类型", "value": TOOLQUAL[t0]}
  140. return {"action": action, "type": type_, "action_l1": ACT_L1.get(action, ""), "constraint": cons}
  141. def flat_scores(sc):
  142. f = {}
  143. for k, v in (sc or {}).items():
  144. if isinstance(v, dict):
  145. for kk, vv in v.items():
  146. try: f[kk] = int(vv)
  147. except Exception: pass
  148. else:
  149. try: f[k] = int(v)
  150. except Exception: pass
  151. return f
  152. def _recency_hard(date_str):
  153. """按 publish_timestamp 头 10 字符(YYYY-MM-DD)算硬时效:半年内=3 / 两年内=2 / 更早=1。
  154. 取代原 LLM 评的 recency 维度——脚本算更稳,发布时间在帖子抓取时就有,无需 LLM token。
  155. """
  156. try:
  157. d = datetime.strptime((date_str or "")[:10], "%Y-%m-%d")
  158. except (ValueError, TypeError):
  159. return None
  160. days = (datetime.now() - d).days
  161. if days <= 180: return 3
  162. if days <= 730: return 2
  163. return 1
  164. def adapt(r, run, form_name=None):
  165. p = r.get("post", {}); e = r.get("llm_evaluation", {})
  166. # 1. 解析 知识类型 (knowledge_type)
  167. kt = []
  168. kt_raw = e.get("知识类型") or e.get("knowledge_type") or []
  169. for k in kt_raw:
  170. if k in ("工序", "procedure"): kt.append("procedure")
  171. elif k in ("能力", "步骤", "step"): kt.append("step")
  172. elif k in ("工具", "tool"): kt.append("tool")
  173. fs = {}
  174. score_reasons = {}
  175. # 检测是否为 eval_prompt_sample-mod 里的新版 0-10 分数 schema
  176. is_mod_schema = "相关性" in e and isinstance(e["相关性"], dict) and ("和内容制作知识相关" in e["相关性"] or "和 query 相关" in e["相关性"])
  177. if is_mod_schema:
  178. # 新版 0-10 分数格式解析
  179. # 1. 相关性
  180. rel = e.get("相关性") or {}
  181. for subkey, item in rel.items():
  182. if isinstance(item, dict):
  183. score_val = item.get("得分")
  184. reason_val = item.get("理由")
  185. code_key = None
  186. if "内容制作" in subkey or "知识" in subkey:
  187. code_key = "relevance_production"
  188. elif "query" in subkey or "检索" in subkey:
  189. code_key = "relevance_query"
  190. if code_key and score_val is not None:
  191. try:
  192. fs[code_key] = float(score_val)
  193. if reason_val:
  194. score_reasons[code_key] = reason_val
  195. except Exception:
  196. pass
  197. # 2. 质量
  198. q_block = e.get("质量") or {}
  199. fixed = q_block.get("固定维度") or {}
  200. # 固定维度
  201. fixed_keys = {
  202. "时效性": "recency",
  203. "热度性": "popularity",
  204. "评论反馈": "feedback"
  205. }
  206. for cn, code in fixed_keys.items():
  207. item = fixed.get(cn)
  208. if isinstance(item, dict):
  209. score_val = item.get("得分")
  210. reason_val = item.get("理由")
  211. if score_val is not None:
  212. try:
  213. fs[code] = float(score_val)
  214. if reason_val:
  215. score_reasons[code] = reason_val
  216. except Exception:
  217. pass
  218. # 用例 (真实感, 表现力)
  219. usecase = fixed.get("用例") or {}
  220. usecase_keys = {
  221. "真实感": "realism",
  222. "表现力": "expressiveness"
  223. }
  224. for cn, code in usecase_keys.items():
  225. item = usecase.get(cn)
  226. if isinstance(item, dict):
  227. score_val = item.get("得分")
  228. reason_val = item.get("理由")
  229. if score_val is not None:
  230. try:
  231. fs[code] = float(score_val)
  232. if reason_val:
  233. score_reasons[code] = reason_val
  234. except Exception:
  235. pass
  236. # 动态维度
  237. dynamic = q_block.get("动态维度") or {}
  238. # 工序
  239. proc = dynamic.get("工序") or {}
  240. if proc:
  241. item = proc.get("流程完整性")
  242. if isinstance(item, dict):
  243. score_val = item.get("得分")
  244. reason_val = item.get("理由")
  245. if score_val is not None:
  246. try:
  247. fs["procedure_completeness"] = float(score_val)
  248. if reason_val:
  249. score_reasons["procedure_completeness"] = reason_val
  250. except Exception:
  251. pass
  252. field = proc.get("字段完整性") or {}
  253. field_keys = {
  254. "输入完整性": "procedure_input",
  255. "实现完整性": "procedure_implementation",
  256. "输出完整性": "procedure_output"
  257. }
  258. for cn, code in field_keys.items():
  259. item = field.get(cn)
  260. if isinstance(item, dict):
  261. score_val = item.get("得分")
  262. reason_val = item.get("理由")
  263. if score_val is not None:
  264. try:
  265. fs[code] = float(score_val)
  266. if reason_val:
  267. score_reasons[code] = reason_val
  268. except Exception:
  269. pass
  270. item = proc.get("泛化性")
  271. if isinstance(item, dict):
  272. score_val = item.get("得分")
  273. reason_val = item.get("理由")
  274. if score_val is not None:
  275. try:
  276. fs["procedure_generality"] = float(score_val)
  277. if reason_val:
  278. score_reasons["procedure_generality"] = reason_val
  279. except Exception:
  280. pass
  281. # 能力
  282. cap = dynamic.get("能力") or dynamic.get("步骤") or {}
  283. if cap:
  284. field = cap.get("字段完整性") or {}
  285. field_keys = {
  286. "输入完整性": "step_input",
  287. "实现完整性": "step_implementation",
  288. "输出完整性": "step_output"
  289. }
  290. for cn, code in field_keys.items():
  291. item = field.get(cn)
  292. if isinstance(item, dict):
  293. score_val = item.get("得分")
  294. reason_val = item.get("理由")
  295. if score_val is not None:
  296. try:
  297. fs[code] = float(score_val)
  298. if reason_val:
  299. score_reasons[code] = reason_val
  300. except Exception:
  301. pass
  302. item = cap.get("泛化性")
  303. if isinstance(item, dict):
  304. score_val = item.get("得分")
  305. reason_val = item.get("理由")
  306. if score_val is not None:
  307. try:
  308. fs["step_generality"] = float(score_val)
  309. if reason_val:
  310. score_reasons["step_generality"] = reason_val
  311. except Exception:
  312. pass
  313. # 工具
  314. tool = dynamic.get("工具") or {}
  315. if tool:
  316. tool_keys = {
  317. "能力边界覆盖": "tool_boundary",
  318. "有效比较": "tool_comparison",
  319. "参数/接口具体性": "tool_specificity",
  320. "实操示例": "tool_example",
  321. "版本&限制": "tool_limits"
  322. }
  323. for cn, code in tool_keys.items():
  324. item = tool.get(cn)
  325. if isinstance(item, dict):
  326. score_val = item.get("得分")
  327. reason_val = item.get("理由")
  328. if score_val is not None:
  329. try:
  330. fs[code] = float(score_val)
  331. if reason_val:
  332. score_reasons[code] = reason_val
  333. except Exception:
  334. pass
  335. else:
  336. # 兼容老版 1-5 分数 schema (带 "评分" 或 old-style flatness)
  337. is_new_schema = "评分" in e or "知识类型" in e or "制作相关性" in e
  338. CN_TO_EN = {
  339. "相关性": "relevance",
  340. "成品质量": "result_quality",
  341. "可信度": "credibility",
  342. "具体用例": "concrete_use_case",
  343. "完整性": "completeness",
  344. "步骤结构": "step_structure",
  345. "步骤可复现": "step_reproducibility",
  346. "步骤可复现性": "step_reproducibility",
  347. "能力定义": "capability_definition",
  348. "实现深度": "implementation_depth",
  349. "边界失败": "boundary_failure_eval",
  350. "通用性": "generality",
  351. "能力覆盖": "capability_coverage",
  352. "有效对比": "effective_comparison",
  353. "参数具体": "param_specificity",
  354. "实操示例": "worked_example",
  355. "实操用例": "worked_example",
  356. "示例完整": "worked_example",
  357. "版本限制": "version_limits",
  358. "版本说明": "version_limits",
  359. "限制说明": "version_limits",
  360. }
  361. if is_new_schema:
  362. pf = e.get("评分") or {}
  363. for cat, metrics in pf.items():
  364. if isinstance(metrics, dict):
  365. for metric, val in metrics.items():
  366. en_key = CN_TO_EN.get(metric, metric)
  367. if isinstance(val, dict) and "得分" in val:
  368. try: fs[en_key] = int(val["得分"])
  369. except Exception: pass
  370. elif isinstance(val, (int, float)):
  371. fs[en_key] = int(val)
  372. if isinstance(val, dict) and "理由" in val:
  373. score_reasons[en_key] = val["理由"]
  374. else:
  375. fs = flat_scores(e.get("scores", {}))
  376. # 计算均分 (overall)
  377. if is_mod_schema:
  378. rel_keys = {"relevance_production", "relevance_query"}
  379. rel_vals = [v for k, v in fs.items() if k in rel_keys]
  380. qual_vals = [v for k, v in fs.items() if k not in rel_keys]
  381. rel_avg = sum(rel_vals) / len(rel_vals) if rel_vals else None
  382. qual_avg = sum(qual_vals) / len(qual_vals) if qual_vals else None
  383. if rel_avg is not None and qual_avg is not None:
  384. overall = round((rel_avg + qual_avg) / 2, 1)
  385. elif rel_avg is not None:
  386. overall = round(rel_avg, 1)
  387. elif qual_avg is not None:
  388. overall = round(qual_avg, 1)
  389. else:
  390. overall = 0.0
  391. else:
  392. overall = round(sum(fs.values()) / len(fs), 1) if fs else 0
  393. anomaly = bool(e.get("error")) or not fs
  394. grade = p.get("_quality_grade", "")
  395. fb = r.get("found_by_queries", [])
  396. # 4. 解析 制作相关性 (production_relevance)
  397. if is_mod_schema:
  398. # 新版使用 "相关性" 中的 "和内容制作知识相关" 代表制作相关性
  399. production_relevance = fs.get("relevance_production")
  400. else:
  401. if is_new_schema:
  402. pr_block = e.get("制作相关性") or {}
  403. pr_raw = pr_block.get("得分") if isinstance(pr_block, dict) else pr_block
  404. if isinstance(pr_block, dict) and "理由" in pr_block:
  405. score_reasons["production_relevance"] = pr_block["理由"]
  406. else:
  407. pr_raw = e.get("production_relevance")
  408. try: production_relevance = int(float(pr_raw)) if pr_raw is not None else None
  409. except (TypeError, ValueError): production_relevance = None
  410. recency_hard = _recency_hard(p.get("publish_timestamp", ""))
  411. # 5. 解析 判定决策 (decision) 和 理由 (reason)
  412. reason = e.get("判定理由") or e.get("reason") or ""
  413. # 根据过滤指标决定是否保留 (过滤指标判定逻辑优先,不依赖文字匹配)
  414. is_discard = False
  415. # 制作相关性低于阈值则丢弃 (新版 0-10 满分,因此低于 4 丢弃;老版低于 2 丢弃)
  416. if production_relevance is not None:
  417. threshold = 4 if is_mod_schema else 2
  418. if production_relevance < threshold:
  419. is_discard = True
  420. # 时效性低于 2 被丢弃(发布时间超两年的老帖)
  421. if recency_hard is not None and recency_hard < 2:
  422. is_discard = True
  423. # 综合均分低于阈值被丢弃 (新版低于 6 丢弃;老版低于 3 丢弃)
  424. if overall is not None:
  425. threshold_ov = 6 if is_mod_schema else 3
  426. if overall < threshold_ov:
  427. is_discard = True
  428. decision = "discard" if is_discard else "report"
  429. # Find matching procedure html
  430. procedure_html = None
  431. case_id = r.get("case_id", "")
  432. title = p.get("title", "")
  433. run_dir = HERE / "runs_full" / run
  434. if run_dir.is_dir():
  435. # 1. 优先扫描该帖子对应的文件夹下的任何 HTML 文件 (不限名称)
  436. # 文件夹名格式: {form}_{platform}_{channel_content_id[:8]}
  437. content_id = r.get("channel_content_id") or ""
  438. if not content_id and case_id and "_" in case_id:
  439. content_id = case_id.split("_", 1)[1]
  440. plat_key = r.get("platform") or ""
  441. if form_name and plat_key and content_id:
  442. folder_name = f"{form_name}_{plat_key}_{content_id[:8]}"
  443. case_dir = run_dir / "procedures" / folder_name
  444. if case_dir.is_dir():
  445. html_files = list(case_dir.glob("*.html"))
  446. if html_files:
  447. procedure_html = f"runs_full/{run}/procedures/{folder_name}/{html_files[0].name}"
  448. # 2. 其次匹配标准文件名: case-{case_id}.html 或 {case_id}.html
  449. candidate_dirs = [run_dir, run_dir / "procedures"]
  450. if not procedure_html and case_id:
  451. named_files = [f"case-{case_id}.html", f"{case_id}.html"]
  452. for d_dir in candidate_dirs:
  453. if d_dir.is_dir():
  454. for name in named_files:
  455. if (d_dir / name).is_file():
  456. procedure_html = f"runs_full/{run}/procedures/{name}" if d_dir.name == "procedures" else f"runs_full/{run}/{name}"
  457. break
  458. if procedure_html:
  459. break
  460. # 3. 再次匹配 HTML 内部的标准声明 (meta 标签或 HTML 注释)
  461. if not procedure_html and case_id:
  462. for d_dir in candidate_dirs:
  463. if d_dir.is_dir():
  464. for html_path in d_dir.glob("*.html"):
  465. try:
  466. content = html_path.read_text(encoding="utf-8")
  467. if f'name="case-id" content="{case_id}"' in content or \
  468. f'name="case_id" content="{case_id}"' in content or \
  469. f'<!-- case_id: {case_id} -->' in content or \
  470. f'<!-- case-id: {case_id} -->' in content:
  471. procedure_html = f"runs_full/{run}/procedures/{html_path.name}" if d_dir.name == "procedures" else f"runs_full/{run}/{html_path.name}"
  472. break
  473. except Exception:
  474. continue
  475. if procedure_html:
  476. break
  477. # 4. 最后使用标题作为兜底模糊匹配
  478. if not procedure_html and title:
  479. for d_dir in candidate_dirs:
  480. if d_dir.is_dir():
  481. for html_path in d_dir.glob("*.html"):
  482. try:
  483. content = html_path.read_text(encoding="utf-8")
  484. if title in content:
  485. procedure_html = f"runs_full/{run}/procedures/{html_path.name}" if d_dir.name == "procedures" else f"runs_full/{run}/{html_path.name}"
  486. break
  487. except Exception:
  488. continue
  489. if procedure_html:
  490. break
  491. return {
  492. "case_id": r.get("case_id", ""),
  493. "platform": PLAT.get(r.get("platform"), r.get("platform")), "platformKey": r.get("platform"),
  494. "title": p.get("title", "") or "(无标题)", "date": (p.get("publish_timestamp", "") or "")[:10],
  495. "url": r.get("source_url", ""), "engagement": f'{p.get("like_count", 0)} 赞',
  496. "knowledge_type": kt, "decision": decision,
  497. "tools": [KT.get(k, k) for k in kt] + ([f"质量 {grade}"] if grade else []), "found_by": fb,
  498. "images": (p.get("images") or [])[:6], "text": p.get("body_text", "") or "",
  499. "scores": fs, "overall": overall, "reason": reason, "score_reasons": score_reasons,
  500. "grade": grade, "qscore": p.get("_quality_score", 0), "anomaly": anomaly,
  501. "production_relevance": production_relevance, "recency_hard": recency_hard,
  502. "run": run, "procedure_html": procedure_html,
  503. }
  504. def scan_runs():
  505. runs = {}
  506. for f in sorted(glob.glob(str(HERE / "runs_full" / "*" / "form_*.json"))):
  507. try:
  508. d = json.load(open(f, encoding="utf-8"))
  509. except Exception:
  510. continue
  511. run = pathlib.Path(f).parent.name
  512. form_name = d.get("form") or ""
  513. results = [adapt(r, run, form_name) for r in d.get("results", [])]
  514. report_val = sum(1 for r in results if r.get("decision") == "report" and not r.get("anomaly"))
  515. discard_val = sum(1 for r in results if r.get("decision") == "discard" and not r.get("anomaly"))
  516. runs.setdefault(run, []).append({
  517. "form": d.get("form"), "query": d.get("query"), "original_q": d.get("original_q", ""),
  518. "requirement": d.get("requirement", ""),
  519. "platforms": d.get("platforms", []), "total": d.get("total"),
  520. "report": report_val, "discard": discard_val,
  521. "results": results,
  522. })
  523. # 数据库回退:仅当本地 runs_full 完全为空时才读库(本地清空后界面仍有数据)。
  524. # 本地有任何数据就信本地,避免每次 /api/data 都查远程 DB 拖慢。
  525. try:
  526. import db
  527. for q, g in (db.fetch_posts_grouped().items() if not runs else []):
  528. if q in runs:
  529. continue
  530. results = [adapt(r, q, "A") for r in g["results"]]
  531. runs[q] = [{
  532. "form": "A", "query": g.get("query_text"), "original_q": g.get("query_text") or "",
  533. "requirement": "", "platforms": [], "total": len(results),
  534. "report": sum(1 for r in results if r.get("decision") == "report" and not r.get("anomaly")),
  535. "discard": sum(1 for r in results if r.get("decision") == "discard" and not r.get("anomaly")),
  536. "results": results, "_from_db": True,
  537. }]
  538. except Exception as e:
  539. print(f"⚠️ DB 回退读取失败(仅用本地数据):{e}")
  540. for v in runs.values():
  541. v.sort(key=lambda x: x.get("form") or "")
  542. def _qnum(name): # "q156" → 156,按数字排,避免 "q156" < "q99" 的字符串误排
  543. m = re.search(r"\d+", name)
  544. return (int(m.group()) if m else 0, name)
  545. out = []
  546. for k, v in sorted(runs.items(), key=lambda kv: _qnum(kv[0])):
  547. oq = v[0].get("original_q") or v[0].get("query") or ""
  548. seen, hits = set(), 0 # 知识命中数 = 各形式采纳(report)且非异常、按 url 去重后的帖子数
  549. for f in v:
  550. for r in f.get("results", []):
  551. if r.get("decision") == "report" and not r.get("anomaly") and r.get("url") not in seen:
  552. seen.add(r.get("url")); hits += 1
  553. out.append({"key": k, "forms": v, "dims": parse_dims(oq), "original_q": oq,
  554. "hits": hits, "tot": sum((f.get("total") or 0) for f in v)})
  555. active_reevals = {k: v["status"] for k, v in ACTIVE_REEVALS.items()}
  556. return {"queries": out, "actions": ACTIONS_TAX, "types": TYPES_TAX, "matrix": _MATRIX, "active_reevals": active_reevals}
  557. class H(BaseHTTPRequestHandler):
  558. def _send(self, code, body, ctype):
  559. b = body.encode("utf-8") if isinstance(body, str) else body
  560. self.send_response(code)
  561. if ctype.startswith("text/") or ctype == "application/json" or ctype == "application/javascript":
  562. self.send_header("Content-Type", ctype + "; charset=utf-8")
  563. else:
  564. self.send_header("Content-Type", ctype)
  565. self.send_header("Content-Length", str(len(b))); self.end_headers(); self.wfile.write(b)
  566. def do_GET(self):
  567. parsed = urlparse(self.path)
  568. path = parsed.path
  569. params = parse_qs(parsed.query)
  570. if path in ("/", "/index.html"):
  571. try:
  572. page = (HERE / "index.html").read_text(encoding="utf-8")
  573. self._send(200, page, "text/html")
  574. except Exception as e:
  575. self._send(500, f"Error reading index.html: {e}", "text/plain")
  576. elif path == "/api/data":
  577. self._send(200, json.dumps(scan_runs(), ensure_ascii=False), "application/json")
  578. elif path == "/api/tools_status":
  579. # 工具解构状态:done=结果文件已存在;running=该 q 解构任务仍在跑
  580. q = (params.get("q") or [""])[0].strip()
  581. case_id = (params.get("case_id") or [""])[0].strip()
  582. if not q or not case_id:
  583. self._send(400, "missing q or case_id", "text/plain"); return
  584. done = (HERE / "runs_full" / q / "tools" / f"{case_id}.json").is_file()
  585. if not done: # 本地无 → 看库里有没有(本地清空后仍算已解构)
  586. try:
  587. import db
  588. done = db.has_tools(q, case_id)
  589. except Exception:
  590. pass
  591. task = TOOL_TASKS.get(q) or {}
  592. running = task.get("status") == "running" and case_id in (task.get("case_ids") or [])
  593. self._send(200, json.dumps({
  594. "done": done, "running": running, "error": task.get("error"),
  595. }, ensure_ascii=False), "application/json")
  596. elif path == "/api/tools_data":
  597. # 取某帖的工具解构结果。可选 version:指定则取该版本(只从库),否则取最新(本地优先)。
  598. # 始终附带 versions(全部历史版本,供前端下拉切换)。
  599. q = (params.get("q") or [""])[0].strip()
  600. case_id = (params.get("case_id") or [""])[0].strip()
  601. version = (params.get("version") or [""])[0].strip() or None
  602. if not q or not case_id:
  603. self._send(400, "missing q or case_id", "text/plain"); return
  604. try:
  605. import db
  606. versions = db.fetch_tool_versions(q, case_id)
  607. except Exception:
  608. db, versions = None, []
  609. def _emit(data):
  610. if data:
  611. data["exists"] = True
  612. data["versions"] = versions
  613. self._send(200, json.dumps(data, ensure_ascii=False), "application/json")
  614. else:
  615. self._send(200, json.dumps({"exists": False, "versions": versions}, ensure_ascii=False), "application/json")
  616. if version: # 指定历史版本 → 只能从库取
  617. _emit(db.fetch_tools(q, case_id, version) if db else None); return
  618. f = HERE / "runs_full" / q / "tools" / f"{case_id}.json" # 默认最新:本地优先
  619. if f.is_file():
  620. try:
  621. _emit(json.loads(f.read_text(encoding="utf-8"))); return
  622. except Exception as e:
  623. self._send(500, json.dumps({"error": f"read failed: {e}"}, ensure_ascii=False), "application/json"); return
  624. _emit(db.fetch_tools(q, case_id) if db else None) # 本地无 → 库最新
  625. elif path == "/api/procedure_status":
  626. q = (params.get("q") or [""])[0].strip()
  627. form = (params.get("form") or [""])[0].strip()
  628. case_id = (params.get("case_id") or [""])[0].strip()
  629. if not q or not form or not case_id:
  630. self._send(400, "missing q, form, or case_id", "text/plain")
  631. return
  632. folder_name = f"{form}_{_short_case(case_id)}"
  633. task_key = f"{q}/{folder_name}"
  634. if task_key in ACTIVE_TASKS:
  635. task = ACTIVE_TASKS[task_key]
  636. res = {
  637. "status": task["status"],
  638. "error": task["error"]
  639. }
  640. if task["status"] == "success":
  641. out_dir = HERE / "runs_full" / q / "procedures" / folder_name
  642. html_files = list(out_dir.glob("*.html")) if out_dir.is_dir() else []
  643. if html_files:
  644. res["procedure_html"] = f"runs_full/{q}/procedures/{folder_name}/{html_files[0].name}"
  645. self._send(200, json.dumps(res, ensure_ascii=False), "application/json")
  646. return
  647. out_dir = HERE / "runs_full" / q / "procedures" / folder_name
  648. html_files = list(out_dir.glob("*.html")) if out_dir.is_dir() else []
  649. if html_files:
  650. self._send(200, json.dumps({
  651. "status": "success",
  652. "procedure_html": f"runs_full/{q}/procedures/{folder_name}/{html_files[0].name}"
  653. }, ensure_ascii=False), "application/json")
  654. return
  655. log_path = out_dir / "_extract.log"
  656. if log_path.is_file():
  657. self._send(200, json.dumps({"status": "failed", "error": "Not running, but no HTML output found (possibly crashed)."}, ensure_ascii=False), "application/json")
  658. return
  659. self._send(200, json.dumps({"status": "not_started"}, ensure_ascii=False), "application/json")
  660. elif path == "/api/procedure_log":
  661. q = (params.get("q") or [""])[0].strip()
  662. form = (params.get("form") or [""])[0].strip()
  663. case_id = (params.get("case_id") or [""])[0].strip()
  664. if not q or not form or not case_id:
  665. self._send(400, "missing q, form, or case_id", "text/plain")
  666. return
  667. folder_name = f"{form}_{_short_case(case_id)}"
  668. log_path = HERE / "runs_full" / q / "procedures" / folder_name / "_extract.log"
  669. if not log_path.is_file():
  670. self._send(200, json.dumps({"log": ""}, ensure_ascii=False), "application/json")
  671. return
  672. try:
  673. content = log_path.read_text(encoding="utf-8", errors="replace")
  674. self._send(200, json.dumps({"log": content}, ensure_ascii=False), "application/json")
  675. except Exception as e:
  676. self._send(500, json.dumps({"error": str(e)}, ensure_ascii=False), "application/json")
  677. elif path == "/api/spec_content":
  678. file_name = (params.get("file") or [""])[0].strip()
  679. allowed = [
  680. "README.md",
  681. "tools.md",
  682. "extraction/phase1-skeleton.md",
  683. "extraction/phase2-normalize.md",
  684. "extraction/phase3-finalize.md",
  685. "taxonomy/type_suggestions.md"
  686. ]
  687. if file_name not in allowed:
  688. self._send(400, "invalid file parameter", "text/plain")
  689. return
  690. target_path = HERE / "procedure-dsl" / "spec" / file_name
  691. if not target_path.is_file():
  692. self._send(404, "spec file not found", "text/plain")
  693. return
  694. try:
  695. content = target_path.read_text(encoding="utf-8", errors="replace")
  696. self._send(200, json.dumps({"content": content}, ensure_ascii=False), "application/json")
  697. except Exception as e:
  698. self._send(500, json.dumps({"error": str(e)}, ensure_ascii=False), "application/json")
  699. elif path == "/api/tool_prompt":
  700. # 工具解构系统 prompt(prompts/tool_extract_system.md)原文,供前端「重新解构」弹框编辑
  701. target_path = HERE / "prompts" / "tool_extract_system.md"
  702. if not target_path.is_file():
  703. self._send(404, json.dumps({"error": "tool prompt not found"}, ensure_ascii=False), "application/json")
  704. return
  705. try:
  706. content = target_path.read_text(encoding="utf-8", errors="replace")
  707. self._send(200, json.dumps({"content": content}, ensure_ascii=False), "application/json")
  708. except Exception as e:
  709. self._send(500, json.dumps({"error": str(e)}, ensure_ascii=False), "application/json")
  710. elif path == "/api/reeval_status":
  711. q = (params.get("q") or [""])[0].strip()
  712. if not q:
  713. self._send(400, "missing q", "text/plain")
  714. return
  715. if q in ACTIVE_REEVALS:
  716. self._send(200, json.dumps({
  717. "status": ACTIVE_REEVALS[q]["status"],
  718. "error": ACTIVE_REEVALS[q].get("error")
  719. }, ensure_ascii=False), "application/json")
  720. else:
  721. self._send(200, json.dumps({"status": "not_started"}, ensure_ascii=False), "application/json")
  722. elif self.path.startswith("/runs_full/"):
  723. try:
  724. clean_path = self.path.split("?")[0]
  725. parts = clean_path.strip("/").split("/")
  726. target_file = HERE
  727. for part in parts:
  728. target_file = target_file / part
  729. runs_dir = HERE / "runs_full"
  730. if runs_dir.resolve() in target_file.resolve().parents and target_file.is_file():
  731. content = target_file.read_bytes()
  732. ext = target_file.suffix.lower()
  733. ctype = "text/html"
  734. if ext in (".png", ".webp"):
  735. ctype = f"image/{ext[1:]}"
  736. elif ext in (".jpg", ".jpeg"):
  737. ctype = "image/jpeg"
  738. elif ext == ".json":
  739. ctype = "application/json"
  740. elif ext == ".js":
  741. ctype = "application/javascript"
  742. elif ext == ".css":
  743. ctype = "text/css"
  744. self._send(200, content, ctype)
  745. else:
  746. self._send(404, "not found", "text/plain")
  747. except Exception as e:
  748. self._send(500, f"Error: {e}", "text/plain")
  749. else:
  750. self._send(404, "not found", "text/plain")
  def do_POST(self):
      """Dispatch a JSON POST request to the handler for ``self.path``.

      Routes: ``/api/generate_procedure``, ``/api/extract_tools``,
      ``/api/reeval`` and ``/api/save_spec``. Any other path is answered
      with a 404 JSON error without reading the request body.

      For a known route the body is read and parsed exactly once here.
      A malformed ``Content-Length``, a body that is not valid UTF-8 JSON,
      or a JSON value that is not an object all yield a 400 response, so
      the route handlers can rely on ``payload`` being a ``dict``.
      """
      handler_names = {
          "/api/generate_procedure": "_post_generate_procedure",
          "/api/extract_tools": "_post_extract_tools",
          "/api/reeval": "_post_reeval",
          "/api/save_spec": "_post_save_spec",
      }
      handler_name = handler_names.get(self.path)
      if handler_name is None:
          self._send(404, json.dumps({"error": "not found"}), "application/json")
          return

      try:
          length = int(self.headers.get("Content-Length") or 0)
      except ValueError:
          self._send(400, json.dumps({"error": "bad Content-Length"}), "application/json")
          return

      try:
          # An absent or empty body is treated as an empty JSON object.
          raw = self.rfile.read(length).decode("utf-8") if length > 0 else "{}"
          payload = json.loads(raw)
      except (ValueError, RecursionError) as e:
          # ValueError covers both UnicodeDecodeError and json.JSONDecodeError.
          self._send(400, json.dumps({"error": f"bad json: {e}"}), "application/json")
          return

      if not isinstance(payload, dict):
          # Valid JSON such as a list or a number would otherwise crash on .get().
          self._send(400, json.dumps({"error": "bad json: expected a JSON object"}),
                     "application/json")
          return

      getattr(self, handler_name)(payload)

  def _post_reply(self, status, obj):
      """Send ``obj`` serialized as JSON with HTTP status ``status``."""
      self._send(status, json.dumps(obj, ensure_ascii=False), "application/json")

  def _post_str(self, payload, key, default=""):
      """Return ``payload[key]`` stripped of surrounding whitespace.

      ``default`` is returned when the key is missing, the value is not a
      string, or the value is blank after stripping.
      """
      value = payload.get(key)
      text = value.strip() if isinstance(value, str) else ""
      return text or default

  def _post_generate_procedure(self, payload):
      """Handle ``/api/generate_procedure``: start a procedure extraction.

      Validates ``q`` / ``form`` / ``case_id``, looks the case up in
      ``runs_full/<q>/form_<form>.json``, writes the extraction inputs into
      ``runs_full/<q>/procedures/<form>_<short case>/``, records the task in
      ``ACTIVE_TASKS`` and runs ``run_extraction_task`` on a daemon thread.
      """
      q = self._post_str(payload, "q")
      form = self._post_str(payload, "form")
      case_id = self._post_str(payload, "case_id")
      engine = self._post_str(payload, "engine", "cyber_runner")
      model = self._post_str(payload, "model", "google/gemini-3.1-flash-lite")

      if not re.fullmatch(r"q\d+", q):
          self._post_reply(400, {"error": f"bad q (expect 'qNN'): {q!r}"})
          return
      if form not in ("A", "B", "C"):
          self._post_reply(400, {"error": f"bad form: {form!r}"})
          return
      if not case_id:
          self._post_reply(400, {"error": "missing case_id"})
          return

      q_dir = HERE / "runs_full" / q
      form_file = q_dir / f"form_{form}.json"
      if not form_file.is_file():
          self._post_reply(404, {"error": f"form file not found: {form_file.name}"})
          return
      try:
          with open(form_file, encoding="utf-8") as f:
              form_data = json.load(f)
      except (OSError, ValueError) as e:
          self._post_reply(500, {"error": f"failed to read form: {e}"})
          return

      # Tolerate a form file whose top level or "results" entry has an
      # unexpected shape: it simply contains no matching case.
      results = form_data.get("results") if isinstance(form_data, dict) else None
      if not isinstance(results, list):
          results = []
      matching_result = next(
          (r for r in results if isinstance(r, dict) and r.get("case_id") == case_id),
          None,
      )
      if not matching_result:
          self._post_reply(404, {"error": f"case_id {case_id} not found in form {form}"})
          return

      folder_name = f"{form}_{_short_case(case_id)}"
      out_dir = q_dir / "procedures" / folder_name
      src_path = out_dir / "_source.json"
      try:
          out_dir.mkdir(parents=True, exist_ok=True)
          with open(src_path, "w", encoding="utf-8") as f:
              json.dump(_source_to_dsl_input(matching_result), f, ensure_ascii=False, indent=2)
          score = _composite_score(matching_result.get("llm_evaluation") or {})
          _write_meta(out_dir, case_id=case_id, from_q=q, form=form, score=score)
      except Exception as e:
          # Request boundary: the project helpers above are opaque here, so
          # any failure is reported to the client instead of killing the thread.
          self._post_reply(500, {"error": f"failed to write inputs: {e}"})
          return

      task_key = f"{q}/{folder_name}"
      ACTIVE_TASKS[task_key] = {
          "status": "running",
          "start_time": datetime.now().isoformat(),
          "pid": None,
          "error": None,
      }
      worker = threading.Thread(
          target=run_extraction_task,
          args=(q, folder_name, src_path, out_dir, engine, model),
          daemon=True,
      )
      worker.start()
      self._post_reply(200, {
          "status": "started",
          "task_key": task_key,
          "log": f"runs_full/{q}/procedures/{folder_name}/_extract.log",
      })

  def _post_extract_tools(self, payload):
      """Handle ``/api/extract_tools``: start a tool-extraction run.

      Body: ``{q, case_ids: [...], force?, prompt?, model?}``. A non-blank
      ``prompt`` is saved to ``prompts/tool_extract_system.md`` before the
      task starts. The run is recorded in ``TOOL_TASKS[q]`` and executed by
      ``run_tool_extraction_task`` on a daemon thread.
      """
      q = self._post_str(payload, "q")
      case_ids = payload.get("case_ids") or []
      force = bool(payload.get("force"))
      prompt = payload.get("prompt")

      # Model selection: only whitelisted choice keys are accepted; the value
      # is handed on to the extraction task (None means "no explicit choice").
      TOOL_MODEL_CHOICES = {"gemini-flash-lite", "gemini-3.5-flash", "sonnet"}
      raw_model = payload.get("model") or ""
      if not isinstance(raw_model, str):
          self._post_reply(400, {"error": f"bad model: {raw_model!r}"})
          return
      model = raw_model.strip() or None
      if model and model not in TOOL_MODEL_CHOICES:
          self._post_reply(400, {"error": f"bad model: {model!r}"})
          return

      if not re.fullmatch(r"q\d+", q):
          self._post_reply(400, {"error": f"bad q (expect 'qNN'): {q!r}"})
          return
      if not isinstance(case_ids, list) or not case_ids:
          self._post_reply(400, {"error": "case_ids must be a non-empty list"})
          return
      if not (HERE / "runs_full" / q / "form_A.json").is_file():
          self._post_reply(404, {"error": f"runs_full/{q}/form_A.json not found"})
          return

      # The front-end "re-extract" dialog may send an edited prompt. Persist
      # it to prompts/tool_extract_system.md so the extraction that is about
      # to start picks up the latest text.
      if isinstance(prompt, str) and prompt.strip():
          try:
              (HERE / "prompts" / "tool_extract_system.md").write_text(prompt, encoding="utf-8")
          except (OSError, ValueError) as e:
              self._post_reply(500, {"error": f"save prompt failed: {e}"})
              return

      TOOL_TASKS[q] = {
          "status": "running", "case_ids": case_ids,
          "start_time": datetime.now().isoformat(), "pid": None, "error": None,
      }
      worker = threading.Thread(
          target=run_tool_extraction_task,
          args=(q, case_ids, force, model),
          daemon=True,
      )
      worker.start()
      self._post_reply(200, {
          "status": "started", "q": q, "count": len(case_ids),
          "log": f"runs_full/{q}/tools/_extract.log",
      })

  def _post_reeval(self, payload):
      """Handle ``/api/reeval``: re-run evaluation for one query.

      Spawns ``batch_3forms.py --reeval --reeval-q <q>`` with its output
      redirected to ``runs_full/<q>/_reeval.log``, records the run in
      ``ACTIVE_REEVALS[q]`` and waits for the subprocess on a daemon thread
      that updates the recorded status when it exits.
      """
      q = self._post_str(payload, "q")
      if not re.fullmatch(r"q\d+", q):
          self._post_reply(400, {"error": f"bad q (expect 'qNN'): {q!r}"})
          return
      q_dir = HERE / "runs_full" / q
      if not q_dir.is_dir():
          self._post_reply(404, {"error": f"runs_full/{q} not found"})
          return

      log_path = q_dir / "_reeval.log"
      cmd = [sys.executable, "-u", str(HERE / "batch_3forms.py"),
             "--reeval", "--reeval-q", q, "--output-dir", str(HERE / "runs_full")]
      flags = subprocess.CREATE_NEW_PROCESS_GROUP if sys.platform == "win32" else 0

      try:
          log_fh = open(log_path, "w", encoding="utf-8", buffering=1)
      except OSError as e:
          self._post_reply(500, {"error": f"failed to start: {e}"})
          return
      try:
          proc = subprocess.Popen(cmd, stdout=log_fh, stderr=subprocess.STDOUT,
                                  cwd=str(HERE), creationflags=flags)
      except Exception as e:
          # The subprocess never started, so nothing else will close the log.
          log_fh.close()
          self._post_reply(500, {"error": f"failed to start: {e}"})
          return

      # The waiter mutates this dict object directly rather than looking
      # ACTIVE_REEVALS[q] up again, so a stale run that finishes late cannot
      # overwrite the state of a newer run registered under the same q.
      state = {"status": "running", "pid": proc.pid, "error": None}
      ACTIVE_REEVALS[q] = state

      def wait_reeval(run_state, p_obj, fh):
          try:
              p_obj.wait()
              if p_obj.returncode == 0:
                  run_state["status"] = "success"
              else:
                  # Set the error first so a poller never sees "failed" without it.
                  run_state["error"] = f"Subprocess exited with code {p_obj.returncode}"
                  run_state["status"] = "failed"
          except Exception as ex:
              run_state["error"] = str(ex)
              run_state["status"] = "failed"
          finally:
              try:
                  fh.close()
              except Exception:
                  # Best effort: a failed flush/close must not mask the run status.
                  pass

      waiter = threading.Thread(target=wait_reeval, args=(state, proc, log_fh), daemon=True)
      waiter.start()
      self._post_reply(200, {
          "status": "started", "pid": proc.pid, "q": q,
          "log": str(log_path.relative_to(HERE)),
      })

  def _post_save_spec(self, payload):
      """Handle ``/api/save_spec``: overwrite one whitelisted spec file.

      ``file`` must be one of the fixed relative names below (which also
      rules out path traversal); ``content`` is written as UTF-8 text under
      ``procedure-dsl/spec/``.
      """
      file_name = self._post_str(payload, "file")
      content = payload.get("content") or ""
      allowed = (
          "README.md",
          "tools.md",
          "extraction/phase1-skeleton.md",
          "extraction/phase2-normalize.md",
          "extraction/phase3-finalize.md",
          "taxonomy/type_suggestions.md",
      )
      if file_name not in allowed:
          self._post_reply(400, {"error": "invalid file parameter"})
          return
      if not isinstance(content, str):
          self._post_reply(400, {"error": "content must be a string"})
          return

      target_path = HERE / "procedure-dsl" / "spec" / file_name
      try:
          target_path.parent.mkdir(parents=True, exist_ok=True)
          target_path.write_text(content, encoding="utf-8")
      except (OSError, ValueError) as e:
          self._post_reply(500, {"error": str(e)})
          return
      self._post_reply(200, {"status": "ok"})
  def log_message(self, *a):
      """Discard per-request log output; every argument is ignored."""
      return None
  if __name__ == "__main__":
      # Script entry point: report how many queries scan_runs() currently
      # finds, then serve HTTP requests on all interfaces until interrupted.
      queries = scan_runs()["queries"]
      n = len(queries)
      print(f"搜索评估查看 server:http://0.0.0.0:{PORT} (runs_full/ 下 {n} 个 query,实时扫描)")
      bind_address = ("0.0.0.0", PORT)
      server = ThreadingHTTPServer(bind_address, H)
      server.serve_forever()