agent_service.py 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317
  1. #! /usr/bin/env python
  2. # -*- coding: utf-8 -*-
  3. # vim:fenc=utf-8
  4. import re
  5. import sys
  6. import time
  7. import random
  8. from typing import Dict, List, Tuple, Any, Optional
  9. import logging
  10. from datetime import datetime, timedelta
  11. import traceback
  12. import apscheduler.triggers.cron
  13. from apscheduler.schedulers.background import BackgroundScheduler
  14. import chat_service
  15. import configs
  16. import logging_service
  17. from logging_service import logger
  18. from chat_service import CozeChat, ChatServiceType
  19. from dialogue_manager import DialogueManager, DialogueState, DialogueStateCache
  20. from user_manager import UserManager, LocalUserManager, MySQLUserManager, MySQLUserRelationManager, UserRelationManager
  21. from openai import OpenAI
  22. from message_queue_backend import MessageQueueBackend, MemoryQueueBackend, AliyunRocketMQQueueBackend
  23. from user_profile_extractor import UserProfileExtractor
  24. import threading
  25. from message import MessageType, Message, MessageChannel
  26. class AgentService:
  27. def __init__(
  28. self,
  29. receive_backend: MessageQueueBackend,
  30. send_backend: MessageQueueBackend,
  31. human_backend: MessageQueueBackend,
  32. user_manager: UserManager,
  33. user_relation_manager: UserRelationManager,
  34. chat_service_type: ChatServiceType = ChatServiceType.OPENAI_COMPATIBLE
  35. ):
  36. self.receive_queue = receive_backend
  37. self.send_queue = send_backend
  38. self.human_queue = human_backend
  39. # 核心服务模块
  40. self.agent_state_cache = DialogueStateCache()
  41. self.user_manager = user_manager
  42. self.user_relation_manager = user_relation_manager
  43. self.user_profile_extractor = UserProfileExtractor()
  44. self.agent_registry: Dict[str, DialogueManager] = {}
  45. self.llm_client = OpenAI(
  46. api_key=chat_service.VOLCENGINE_API_TOKEN,
  47. base_url=chat_service.VOLCENGINE_BASE_URL
  48. )
  49. # DeepSeek on Volces
  50. self.model_name = chat_service.VOLCENGINE_MODEL_DEEPSEEK_V3
  51. coze_config = configs.get()['chat_api']['coze']
  52. coze_oauth_app = CozeChat.get_oauth_app(
  53. coze_config['oauth_client_id'], coze_config['private_key_path'], str(coze_config['public_key_id']),
  54. account_id=coze_config.get('account_id', None)
  55. )
  56. self.coze_client = CozeChat(
  57. base_url=chat_service.COZE_CN_BASE_URL,
  58. auth_app=coze_oauth_app
  59. )
  60. self.chat_service_type = chat_service_type
  61. # 定时任务调度器
  62. self.scheduler = BackgroundScheduler()
  63. self.scheduler.start()
  64. def setup_initiative_conversations(self, schedule_params: Optional[Dict] = None):
  65. if not schedule_params:
  66. schedule_params = {'hour': '8,16,20'}
  67. self.scheduler.add_job(
  68. self._check_initiative_conversations,
  69. apscheduler.triggers.cron.CronTrigger(**schedule_params)
  70. )
  71. def _get_agent_instance(self, staff_id: str, user_id: str) -> DialogueManager:
  72. """获取Agent实例"""
  73. agent_key = 'agent_{}_{}'.format(staff_id, user_id)
  74. if agent_key not in self.agent_registry:
  75. self.agent_registry[agent_key] = DialogueManager(
  76. staff_id, user_id, self.user_manager, self.agent_state_cache)
  77. return self.agent_registry[agent_key]
  78. def process_messages(self):
  79. """持续处理接收队列消息"""
  80. while True:
  81. message = self.receive_queue.consume()
  82. if message:
  83. try:
  84. self.process_single_message(message)
  85. self.receive_queue.ack(message)
  86. except Exception as e:
  87. logger.error("Error processing message: {}".format(e))
  88. traceback.print_exc()
  89. time.sleep(1)
  90. def _update_user_profile(self, user_id, user_profile, message: str):
  91. profile_to_update = self.user_profile_extractor.extract_profile_info(user_profile, message)
  92. if not profile_to_update:
  93. logger.debug("user_id: {}, no profile info extracted".format(user_id))
  94. return
  95. logger.warning("update user profile: {}".format(profile_to_update))
  96. merged_profile = self.user_profile_extractor.merge_profile_info(user_profile, profile_to_update)
  97. self.user_manager.save_user_profile(user_id, merged_profile)
  98. return merged_profile
  99. def _schedule_aggregation_trigger(self, staff_id: str, user_id: str, delay_sec: int):
  100. logger.debug("user: {}, schedule trigger message after {} seconds".format(user_id, delay_sec))
  101. message_ts = int((time.time() + delay_sec) * 1000)
  102. message = Message.build(MessageType.AGGREGATION_TRIGGER, MessageChannel.SYSTEM, user_id, staff_id, None, message_ts)
  103. # 系统消息使用特定的msgId,无实际意义
  104. message.msgId = -MessageType.AGGREGATION_TRIGGER.value
  105. self.scheduler.add_job(lambda: self.receive_queue.produce(message),
  106. 'date',
  107. run_date=datetime.now() + timedelta(seconds=delay_sec))
  108. def process_single_message(self, message: Message):
  109. user_id = message.sender
  110. staff_id = message.receiver
  111. # 获取用户信息和Agent实例
  112. user_profile = self.user_manager.get_user_profile(user_id)
  113. agent = self._get_agent_instance(staff_id, user_id)
  114. # 更新对话状态
  115. logger.debug("process message: {}".format(message))
  116. need_response, message_text = agent.update_state(message)
  117. logger.debug("user: {}, next state: {}".format(user_id, agent.current_state))
  118. # 根据状态路由消息
  119. if agent.is_in_human_intervention():
  120. self._route_to_human_intervention(user_id, message)
  121. elif agent.current_state == DialogueState.MESSAGE_AGGREGATING:
  122. if message.type != MessageType.AGGREGATION_TRIGGER:
  123. # 产生一个触发器,但是不能由触发器递归产生
  124. logger.debug("user: {}, waiting next message for aggregation".format(user_id))
  125. self._schedule_aggregation_trigger(staff_id, user_id, agent.message_aggregation_sec)
  126. return
  127. elif need_response:
  128. # 先更新用户画像再处理回复
  129. self._update_user_profile(user_id, user_profile, message_text)
  130. self._get_chat_response(user_id, agent, message_text)
  131. else:
  132. logger.debug(f"staff[{staff_id}], user[{user_id}]: do not need response")
  133. def _route_to_human_intervention(self, user_id: str, origin_message: Message):
  134. """路由到人工干预"""
  135. self.human_queue.produce(Message.build(
  136. MessageType.TEXT,
  137. origin_message.channel,
  138. origin_message.sender,
  139. origin_message.receiver,
  140. "用户对话需人工介入,用户名:{}".format(user_id),
  141. int(time.time() * 1000)
  142. ))
  143. def _check_initiative_conversations(self):
  144. """定时检查主动发起对话"""
  145. for staff_user in self.user_relation_manager.list_staff_users():
  146. staff_id = staff_user['staff_id']
  147. user_id = staff_user['user_id']
  148. agent = self._get_agent_instance(staff_id, user_id)
  149. should_initiate = agent.should_initiate_conversation()
  150. if should_initiate:
  151. logger.warning("user: {}, initiate conversation".format(user_id))
  152. resp = self._get_chat_response(user_id, agent, None)
  153. if resp:
  154. time.sleep(random.randint(10,20))
  155. else:
  156. logger.debug("user: {}, do not initiate conversation".format(user_id))
  157. def _get_chat_response(self, user_id: str, agent: DialogueManager,
  158. user_message: Optional[str]):
  159. """处理LLM响应"""
  160. chat_config = agent.build_chat_configuration(user_message, self.chat_service_type)
  161. logger.debug(chat_config)
  162. chat_response = self._call_chat_api(chat_config)
  163. chat_response = self.sanitize_response(chat_response)
  164. if response := agent.generate_response(chat_response):
  165. logger.warning(f"staff[{agent.staff_id}] user[{user_id}]: response: {response}")
  166. current_ts = int(time.time() * 1000)
  167. user_tags = self.user_relation_manager.get_user_tags(user_id)
  168. # FIXME(zhoutian)
  169. # 测试期间临时逻辑,只发送特定的账号或特定用户
  170. if not (agent.staff_id in set(['1688854492669990'])
  171. or 'AgentTest1' in user_tags):
  172. logger.warning(f"staff[{agent.staff_id}] user[{user_id}]: skip reply")
  173. return None
  174. self.send_queue.produce(
  175. Message.build(MessageType.TEXT, MessageChannel.CORP_WECHAT,
  176. agent.staff_id, user_id, response, current_ts)
  177. )
  178. return response
  179. else:
  180. logger.warning(f"staff[{agent.staff_id}] user[{user_id}]: no response generated")
  181. return None
  182. def _call_chat_api(self, chat_config: Dict) -> str:
  183. if configs.get().get('debug_flags', {}).get('disable_llm_api_call', False):
  184. return 'LLM模拟回复 {}'.format(datetime.now().strftime("%Y-%m-%d %H:%M:%S"))
  185. if self.chat_service_type == ChatServiceType.OPENAI_COMPATIBLE:
  186. chat_completion = self.llm_client.chat.completions.create(
  187. messages=chat_config['messages'],
  188. model=self.model_name,
  189. )
  190. response = chat_completion.choices[0].message.content
  191. elif self.chat_service_type == ChatServiceType.COZE_CHAT:
  192. bot_user_id = 'dev_user'
  193. response = self.coze_client.create(
  194. chat_config['bot_id'], bot_user_id, chat_config['messages'],
  195. chat_config['custom_variables']
  196. )
  197. else:
  198. raise Exception('Unsupported chat service type: {}'.format(self.chat_service_type))
  199. return response
  200. @staticmethod
  201. def sanitize_response(response: str):
  202. pattern = r'\[?\d{4}-\d{2}-\d{2} \d{2}:\d{2}:\d{2}\]?'
  203. response = re.sub(pattern, '', response)
  204. response = response.strip()
  205. return response
  206. if __name__ == "__main__":
  207. config = configs.get()
  208. logging_service.setup_root_logger()
  209. logger.warning("current env: {}".format(configs.get_env()))
  210. scheduler_logger = logging.getLogger('apscheduler')
  211. scheduler_logger.setLevel(logging.WARNING)
  212. use_aliyun_mq = config['debug_flags']['use_aliyun_mq']
  213. # 初始化不同队列的后端
  214. if use_aliyun_mq:
  215. receive_queue = AliyunRocketMQQueueBackend(
  216. config['mq']['endpoints'],
  217. config['mq']['instance_id'],
  218. config['mq']['receive_topic'],
  219. has_consumer=True, has_producer=True,
  220. group_id=config['mq']['receive_group']
  221. )
  222. send_queue = AliyunRocketMQQueueBackend(
  223. config['mq']['endpoints'],
  224. config['mq']['instance_id'],
  225. config['mq']['send_topic'],
  226. has_consumer=False, has_producer=True
  227. )
  228. else:
  229. receive_queue = MemoryQueueBackend()
  230. send_queue = MemoryQueueBackend()
  231. human_queue = MemoryQueueBackend()
  232. # 初始化用户管理服务
  233. # FIXME(zhoutian): 如果不使用MySQL,此数据库配置非必须
  234. user_db_config = config['storage']['user']
  235. staff_db_config = config['storage']['staff']
  236. if config['debug_flags'].get('use_local_user_storage', False):
  237. user_manager = LocalUserManager()
  238. else:
  239. user_manager = MySQLUserManager(user_db_config['mysql'], user_db_config['table'], staff_db_config['table'])
  240. wecom_db_config = config['storage']['user_relation']
  241. user_relation_manager = MySQLUserRelationManager(
  242. user_db_config['mysql'], wecom_db_config['mysql'],
  243. config['storage']['staff']['table'],
  244. user_db_config['table'],
  245. wecom_db_config['table']['staff'],
  246. wecom_db_config['table']['relation'],
  247. wecom_db_config['table']['user']
  248. )
  249. # 创建Agent服务
  250. service = AgentService(
  251. receive_backend=receive_queue,
  252. send_backend=send_queue,
  253. human_backend=human_queue,
  254. user_manager=user_manager,
  255. user_relation_manager=user_relation_manager,
  256. chat_service_type=ChatServiceType.COZE_CHAT
  257. )
  258. # 只有企微场景需要主动发起
  259. if not config['debug_flags'].get('disable_active_conversation', False):
  260. service.setup_initiative_conversations({'second': '5,35'})
  261. process_thread = threading.Thread(target=service.process_messages)
  262. process_thread.start()
  263. if not config['debug_flags'].get('console_input', False):
  264. process_thread.join()
  265. sys.exit(0)
  266. message_id = 0
  267. while True:
  268. print("Input next message: ")
  269. text = sys.stdin.readline().strip()
  270. if not text:
  271. continue
  272. message_id += 1
  273. sender = '7881299670930896'
  274. receiver = '1688854492669990'
  275. if text == MessageType.AGGREGATION_TRIGGER.name:
  276. message = Message.build(MessageType.AGGREGATION_TRIGGER, MessageChannel.CORP_WECHAT,
  277. sender, receiver, None, int(time.time() * 1000))
  278. else:
  279. message = Message.build(MessageType.TEXT, MessageChannel.CORP_WECHAT,
  280. sender,receiver, text, int(time.time() * 1000)
  281. )
  282. message.msgId = message_id
  283. receive_queue.produce(message)
  284. time.sleep(0.1)
  285. process_thread.join()