registry.py 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503
  """
  Tool Registry - 工具注册表和装饰器

  职责:
  1. @tool 装饰器:自动注册工具并生成 Schema
  2. 管理所有工具的 Schema 和实现
  3. 路由工具调用到具体实现
  4. 支持域名过滤、敏感数据处理、工具统计

  从 Resonote/llm/tools/registry.py 抽取并扩展
  """
  10. import json
  11. import inspect
  12. import logging
  13. import time
  14. from typing import Any, Callable, Dict, List, Optional
  15. from agent.tools.url_matcher import filter_by_url
  16. logger = logging.getLogger(__name__)
  class ToolStats:
      """Usage counters for a single tool.

      The object only stores numbers; whoever owns it is responsible for
      updating the counters. Derived ratios are exposed as read-only properties.
      """

      def __init__(self):
          # Every counter starts at zero; ``last_called`` stays ``None`` until
          # the owner assigns a timestamp.
          self.call_count: int = 0
          self.success_count: int = 0
          self.failure_count: int = 0
          self.total_duration: float = 0.0
          self.last_called: Optional[float] = None

      def _per_call(self, total: float) -> float:
          """Return ``total / call_count``, or ``0.0`` when ``call_count`` is not positive."""
          if self.call_count > 0:
              return total / self.call_count
          return 0.0

      @property
      def average_duration(self) -> float:
          """Mean duration per call: ``total_duration`` divided by ``call_count``."""
          return self._per_call(self.total_duration)

      @property
      def success_rate(self) -> float:
          """Fraction of successful calls: ``success_count`` divided by ``call_count``."""
          return self._per_call(self.success_count)

      def to_dict(self) -> Dict[str, Any]:
          """Return a plain-dict snapshot of the counters and derived ratios.

          ``total_duration`` itself is not part of the snapshot; only the
          derived ``average_duration`` is.
          """
          return dict(
              call_count=self.call_count,
              success_count=self.success_count,
              failure_count=self.failure_count,
              average_duration=self.average_duration,
              success_rate=self.success_rate,
              last_called=self.last_called,
          )
  class ToolRegistry:
      """Registry of tools, their schemas, UI metadata and usage statistics.

      Tools are keyed by the ``__name__`` of the registered function. Besides
      lookup helpers, the registry routes calls to the implementation through
      :meth:`execute`, which injects hidden/default parameters and updates the
      per-tool :class:`ToolStats`.
      """

      def __init__(self):
          # name -> {"func", "schema", "url_patterns", "hidden_params",
          #          "inject_params", "ui_metadata"}
          self._tools: Dict[str, Dict[str, Any]] = {}
          # name -> usage counters, created when the tool is registered
          self._stats: Dict[str, ToolStats] = {}

      def register(
          self,
          func: Callable,
          schema: Optional[Dict] = None,
          requires_confirmation: bool = False,
          editable_params: Optional[List[str]] = None,
          display: Optional[Dict[str, Dict[str, Any]]] = None,
          url_patterns: Optional[List[str]] = None,
          hidden_params: Optional[List[str]] = None,
          inject_params: Optional[Dict[str, Any]] = None
      ):
          """Register a tool under ``func.__name__``.

          Registering a name that already exists replaces the previous entry
          and resets its statistics.

          Args:
              func: The tool implementation (sync or async).
              schema: Tool schema. When ``None`` it is generated with
                  ``SchemaGenerator.generate(func, hidden_params=...)``.
              requires_confirmation: Whether the tool needs user confirmation.
              editable_params: Parameter names the user may edit.
              display: i18n display info, e.g.
                  ``{"zh": {"name": "xx", "params": {...}}, "en": {...}}``.
              url_patterns: URL patterns (e.g. ``["*.google.com"]``) used by
                  :meth:`get_tool_names`; stored as given.
              hidden_params: Parameter names excluded from the generated schema.
              inject_params: ``{param_name: injector}`` where ``injector`` is a
                  plain value or a callable; see :meth:`execute`.

          Raises:
              Exception: Whatever schema generation raised (logged, then re-raised).
          """
          func_name = func.__name__

          # Generate the schema automatically when none was supplied.
          if schema is None:
              try:
                  from agent.tools.schema import SchemaGenerator
                  schema = SchemaGenerator.generate(func, hidden_params=hidden_params or [])
              except Exception as e:
                  logger.error(f"Failed to generate schema for {func_name}: {e}")
                  raise

          self._tools[func_name] = {
              "func": func,
              "schema": schema,
              "url_patterns": url_patterns,
              "hidden_params": hidden_params or [],
              "inject_params": inject_params or {},
              "ui_metadata": {
                  "requires_confirmation": requires_confirmation,
                  "editable_params": editable_params or [],
                  "display": display or {}
              }
          }

          # Fresh counters for this tool.
          self._stats[func_name] = ToolStats()

          logger.debug(
              f"[ToolRegistry] Registered: {func_name} "
              f"(requires_confirmation={requires_confirmation}, "
              f"editable_params={editable_params or []}, "
              f"url_patterns={url_patterns or 'none'})"
          )

      def is_registered(self, tool_name: str) -> bool:
          """Return ``True`` when ``tool_name`` has been registered."""
          return tool_name in self._tools

      def get_schemas(self, tool_names: Optional[List[str]] = None) -> List[Dict]:
          """Return the schemas of the given tools.

          Args:
              tool_names: Names to look up; ``None`` means every registered tool.

          Returns:
              The stored schema objects, in the order of ``tool_names``.
              Unknown names are skipped with a warning.
          """
          if tool_names is None:
              tool_names = list(self._tools.keys())

          schemas = []
          for name in tool_names:
              if name in self._tools:
                  schemas.append(self._tools[name]["schema"])
              else:
                  logger.warning(f"[ToolRegistry] Tool not found: {name}")
          return schemas

      def get_tool_names(self, current_url: Optional[str] = None) -> List[str]:
          """Return tool names, optionally filtered by URL.

          Args:
              current_url: Current URL. ``None`` returns every registered tool
                  without any filtering.

          Returns:
              Tool names; when ``current_url`` is given, only those kept by
              ``filter_by_url`` based on each tool's ``url_patterns``.
          """
          if current_url is None:
              return list(self._tools.keys())

          tool_items = [
              {"name": name, "url_patterns": tool["url_patterns"]}
              for name, tool in self._tools.items()
          ]
          filtered = filter_by_url(tool_items, current_url, url_field="url_patterns")
          return [item["name"] for item in filtered]

      def get_schemas_for_url(self, current_url: Optional[str] = None) -> List[Dict]:
          """Return the schemas of the tools selected by :meth:`get_tool_names`.

          Args:
              current_url: Current URL. ``None`` returns the schemas of ALL
                  registered tools, because :meth:`get_tool_names` applies no
                  filter in that case.

          Returns:
              List of tool schemas.
          """
          return self.get_schemas(self.get_tool_names(current_url))

      def _build_call_kwargs(
          self,
          tool_info: Dict[str, Any],
          arguments: Dict[str, Any],
          uid: str,
          context: Optional[Dict[str, Any]]
      ) -> Dict[str, Any]:
          """Merge caller arguments with hidden and injected parameters."""
          kwargs = {**arguments}
          accepted = inspect.signature(tool_info["func"]).parameters

          # Hidden parameters: only "uid" and "context" are filled in here, and
          # only when the function actually declares them.
          hidden_params = tool_info.get("hidden_params", [])
          if "uid" in hidden_params and "uid" in accepted:
              kwargs["uid"] = uid
          if "context" in hidden_params and "context" in accepted:
              kwargs["context"] = context

          # Injected defaults: never override a non-None value that was supplied.
          for param_name, injector in tool_info.get("inject_params", {}).items():
              if param_name not in accepted:
                  continue
              if kwargs.get(param_name) is not None:
                  continue
              kwargs[param_name] = self._resolve_injected_value(injector, context, kwargs)
          return kwargs

      @staticmethod
      def _resolve_injected_value(injector: Any, context: Any, kwargs: Dict[str, Any]) -> Any:
          """Produce the value for one ``inject_params`` entry."""
          if not callable(injector):
              # A plain value is used directly.
              return injector
          # Callables are dispatched on their parameter count:
          #   1 -> injector(context), 2 -> injector(context, kwargs), else injector()
          arity = len(inspect.signature(injector).parameters)
          if arity == 1:
              return injector(context)
          if arity == 2:
              return injector(context, kwargs)
          return injector()

      @staticmethod
      def _format_result(result: Any) -> Any:
          """Convert a tool's return value into what :meth:`execute` returns."""
          if isinstance(result, str):
              return result

          from agent.tools.models import ToolResult
          if isinstance(result, ToolResult):
              ret = {"text": result.to_llm_message()}
              if result.images:
                  ret["images"] = result.images
              if result.tool_usage:
                  ret["tool_usage"] = result.tool_usage
              # Backward compatibility: a text-only result is returned as a string.
              if len(ret) == 1:
                  return ret["text"]
              return ret

          return json.dumps(result, ensure_ascii=False, indent=2)

      async def execute(
          self,
          name: str,
          arguments: Dict[str, Any],
          uid: str = "",
          context: Optional[Dict[str, Any]] = None,
          sensitive_data: Optional[Dict[str, Any]] = None
      ) -> str:
          """Run a registered tool and return its result.

          Every call to a known tool increments ``call_count``; the call is then
          recorded as exactly one of success or failure. A failure anywhere
          (argument preparation, the tool itself, or result conversion) is
          reported as a JSON ``{"error": ...}`` string rather than raised.

          Args:
              name: Tool name.
              arguments: Tool arguments; ``None`` is treated as no arguments.
              uid: User id, passed as ``uid`` when the tool lists it in
                  ``hidden_params`` and its function accepts it.
              context: Extra context, passed as ``context`` under the same
                  conditions and handed to callable injectors.
              sensitive_data: When truthy, ``arguments`` are first passed through
                  ``replace_sensitive_data`` together with ``context["page_url"]``.
                  NOTE(review): this path calls ``context.get(...)``, so it
                  assumes a dict-like context - confirm against callers.

          Returns:
              The tool's string result, or a JSON string for other values, or a
              JSON ``{"error": ...}`` string for unknown tools and failures.
              NOTE: for a ``ToolResult`` carrying ``images`` or ``tool_usage`` a
              ``dict`` with ``text`` plus those keys is returned instead of a
              string, despite the ``str`` annotation.
          """
          if name not in self._tools:
              error_msg = f"Unknown tool: {name}"
              logger.error(f"[ToolRegistry] {error_msg}")
              return json.dumps({"error": error_msg}, ensure_ascii=False)

          tool_info = self._tools[name]
          stats = self._stats[name]
          start_time = time.time()
          stats.call_count += 1
          stats.last_called = start_time

          try:
              func = tool_info["func"]
              call_args = {} if arguments is None else arguments

              # Resolve sensitive-data placeholders before building kwargs.
              if sensitive_data:
                  from agent.tools.sensitive import replace_sensitive_data
                  current_url = context.get("page_url") if context else None
                  call_args = replace_sensitive_data(call_args, sensitive_data, current_url)

              kwargs = self._build_call_kwargs(tool_info, call_args, uid, context)

              if inspect.iscoroutinefunction(func):
                  result = await func(**kwargs)
              else:
                  result = func(**kwargs)

              # Convert inside the try block so a conversion error is counted
              # as a failure and never as a success.
              payload = self._format_result(result)
          except Exception as e:
              stats.failure_count += 1
              stats.total_duration += time.time() - start_time
              error_msg = f"Error executing tool '{name}': {str(e)}"
              # logger.exception logs at ERROR level and appends the traceback.
              logger.exception(f"[ToolRegistry] {error_msg}")
              return json.dumps({"error": error_msg}, ensure_ascii=False)

          stats.success_count += 1
          stats.total_duration += time.time() - start_time
          return payload

      def get_stats(self, tool_name: Optional[str] = None) -> Dict[str, Dict[str, Any]]:
          """Return usage statistics as plain dicts.

          Args:
              tool_name: A tool name; any falsy value means all tools.

          Returns:
              ``{name: stats_dict}``; empty when ``tool_name`` is unknown.
          """
          if tool_name:
              if tool_name in self._stats:
                  return {tool_name: self._stats[tool_name].to_dict()}
              return {}
          return {name: stats.to_dict() for name, stats in self._stats.items()}

      def get_top_tools(self, limit: int = 10, by: str = "call_count") -> List[str]:
          """Return tool names ranked by one statistic.

          Args:
              limit: Maximum number of names (applied as a slice ``[:limit]``).
              by: ``"call_count"`` or ``"success_rate"`` (highest first), or
                  ``"average_duration"`` (lowest first, i.e. fastest first).

          Returns:
              Ranked tool names.

          Raises:
              ValueError: If ``by`` is not one of the supported keys.
          """
          if by in ("call_count", "success_rate"):
              descending = True
          elif by == "average_duration":
              descending = False  # faster is better
          else:
              raise ValueError(f"Invalid sort by: {by}")

          ranked = sorted(
              self._stats.items(),
              key=lambda item: getattr(item[1], by),
              reverse=descending
          )
          return [name for name, _ in ranked[:limit]]

      def _ui_metadata_for_call(self, tool_call: Dict) -> Optional[Dict[str, Any]]:
          """Return the UI metadata of the tool named in ``tool_call``, or ``None``.

          The name is read from ``tool_call["function"]["name"]``; a missing
          name or an unregistered tool yields ``None``.
          """
          tool_name = tool_call.get("function", {}).get("name")
          if tool_name and tool_name in self._tools:
              return self._tools[tool_name]["ui_metadata"]
          return None

      def check_confirmation_required(self, tool_calls: List[Dict]) -> bool:
          """Return ``True`` when at least one called tool requires confirmation."""
          for tc in tool_calls:
              ui_meta = self._ui_metadata_for_call(tc)
              if ui_meta is not None and ui_meta.get("requires_confirmation", False):
                  return True
          return False

      def get_confirmation_flags(self, tool_calls: List[Dict]) -> List[bool]:
          """Return, per tool call, whether it requires confirmation.

          Calls naming an unknown tool get ``False``.
          """
          flags = []
          for tc in tool_calls:
              ui_meta = self._ui_metadata_for_call(tc)
              if ui_meta is None:
                  flags.append(False)
              else:
                  flags.append(ui_meta.get("requires_confirmation", False))
          return flags

      def check_any_param_editable(self, tool_calls: List[Dict]) -> bool:
          """Return ``True`` when at least one called tool has editable parameters."""
          for tc in tool_calls:
              ui_meta = self._ui_metadata_for_call(tc)
              if ui_meta is not None and ui_meta.get("editable_params", []):
                  return True
          return False

      def get_editable_params_map(self, tool_calls: List[Dict]) -> Dict[str, List[str]]:
          """Map each tool call's ``id`` to the editable parameters of its tool.

          Calls naming an unknown tool map to an empty list.
          """
          params_map = {}
          for tc in tool_calls:
              ui_meta = self._ui_metadata_for_call(tc)
              if ui_meta is None:
                  params_map[tc.get("id")] = []
              else:
                  params_map[tc.get("id")] = ui_meta.get("editable_params", [])
          return params_map

      def get_ui_metadata(
          self,
          locale: str = "zh",
          tool_names: Optional[List[str]] = None
      ) -> Dict[str, Dict[str, Any]]:
          """Return UI metadata for front-end display.

          Args:
              locale: Key into each tool's ``display`` mapping.
              tool_names: Names to include; ``None`` means all registered tools.
                  Unknown names are silently skipped.

          Returns:
              A mapping such as::

                  {
                      "tool_name": {
                          "display_name": "Search Notes",
                          "param_display_names": {"query": "Query"},
                          "requires_confirmation": false,
                          "editable_params": ["query"]
                      }
                  }

              ``display_name`` falls back to the tool name when the locale has
              no ``name`` entry.
          """
          if tool_names is None:
              tool_names = list(self._tools.keys())

          metadata = {}
          for name in tool_names:
              if name not in self._tools:
                  continue
              ui_meta = self._tools[name]["ui_metadata"]
              display = ui_meta.get("display", {}).get(locale, {})
              metadata[name] = {
                  "display_name": display.get("name", name),
                  "param_display_names": display.get("params", {}),
                  "requires_confirmation": ui_meta.get("requires_confirmation", False),
                  "editable_params": ui_meta.get("editable_params", [])
              }
          return metadata
  # Global singleton: the module-level registry instance, created at import time.
  _global_registry = ToolRegistry()
  def tool(
      description: Optional[str] = None,
      param_descriptions: Optional[Dict[str, str]] = None,
      requires_confirmation: bool = False,
      editable_params: Optional[List[str]] = None,
      display: Optional[Dict[str, Dict[str, Any]]] = None,
      url_patterns: Optional[List[str]] = None,
      hidden_params: Optional[List[str]] = None,
      inject_params: Optional[Dict[str, Any]] = None
  ):
      """Decorator factory that registers a function in the global registry.

      The decorated function is returned unchanged; registration happens when
      the decorator is applied. No schema is passed to ``register``.

      Args:
          description: Function description.
              NOTE(review): accepted but not referenced anywhere in this
              function, so it is not forwarded to the registry.
          param_descriptions: Parameter descriptions.
              NOTE(review): likewise accepted but not referenced here.
          requires_confirmation: Whether user confirmation is needed
              (default ``False``).
          editable_params: Parameter names the user may edit.
          display: i18n display info.
          url_patterns: URL patterns (e.g. ``["*.google.com"]``).
          hidden_params: Parameter names hidden from the schema.
          inject_params: Injection rules ``{param_name: injector}``.

      Returns:
          A decorator that registers its argument and returns it as is.

      Example:
          @tool(
              hidden_params=["context", "uid"],
              inject_params={
                  "owner": lambda ctx: ctx.config.knowledge.get_owner(),
              },
              editable_params=["query"],
              url_patterns=["*.google.com"],
              display={
                  "en": {"name": "Search Notes", "params": {"query": "Query"}}
              }
          )
          async def search_blocks(
              query: str,
              limit: int = 10,
              owner: Optional[str] = None,
              context: Optional[ToolContext] = None,
              uid: str = ""
          ) -> str:
              '''Search the user's note blocks'''
              ...
      """
      # Collect the options once; every decorated function is registered with
      # the same set.
      registration_options = {
          "requires_confirmation": requires_confirmation,
          "editable_params": editable_params,
          "display": display,
          "url_patterns": url_patterns,
          "hidden_params": hidden_params,
          "inject_params": inject_params,
      }

      def _register_and_return(target: Callable) -> Callable:
          # Register in the global registry, then return the function untouched.
          _global_registry.register(target, **registration_options)
          return target

      return _register_and_return
  def get_tool_registry() -> ToolRegistry:
      """Return the module-level ``ToolRegistry`` singleton."""
      return _global_registry