agent_service.py 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286
  1. #! /usr/bin/env python
  2. # -*- coding: utf-8 -*-
  3. # vim:fenc=utf-8
  4. import sys
  5. import time
  6. from typing import Dict, List, Tuple, Any, Optional
  7. import logging
  8. from datetime import datetime, timedelta
  9. import traceback
  10. import apscheduler.triggers.cron
  11. from apscheduler.schedulers.background import BackgroundScheduler
  12. import chat_service
  13. import configs
  14. import logging_service
  15. from chat_service import CozeChat, ChatServiceType
  16. from dialogue_manager import DialogueManager, DialogueState, DialogueStateCache
  17. from user_manager import UserManager, LocalUserManager, MySQLUserManager, MySQLUserRelationManager, UserRelationManager
  18. from openai import OpenAI
  19. from message_queue_backend import MessageQueueBackend, MemoryQueueBackend, AliyunRocketMQQueueBackend
  20. from user_profile_extractor import UserProfileExtractor
  21. import threading
  22. from message import MessageType, Message, MessageChannel
  23. from logging_service import ColoredFormatter
  24. class AgentService:
  25. def __init__(
  26. self,
  27. receive_backend: MessageQueueBackend,
  28. send_backend: MessageQueueBackend,
  29. human_backend: MessageQueueBackend,
  30. user_manager: UserManager,
  31. user_relation_manager: UserRelationManager,
  32. chat_service_type: ChatServiceType = ChatServiceType.OPENAI_COMPATIBLE
  33. ):
  34. self.receive_queue = receive_backend
  35. self.send_queue = send_backend
  36. self.human_queue = human_backend
  37. # 核心服务模块
  38. self.agent_state_cache = DialogueStateCache()
  39. self.user_manager = user_manager
  40. self.user_relation_manager = user_relation_manager
  41. self.user_profile_extractor = UserProfileExtractor()
  42. self.agent_registry: Dict[str, DialogueManager] = {}
  43. self.llm_client = OpenAI(
  44. api_key=chat_service.VOLCENGINE_API_TOKEN,
  45. base_url=chat_service.VOLCENGINE_BASE_URL
  46. )
  47. # DeepSeek on Volces
  48. self.model_name = chat_service.VOLCENGINE_MODEL_DEEPSEEK_V3
  49. coze_config = configs.get()['chat_api']['coze']
  50. coze_oauth_app = CozeChat.get_oauth_app(
  51. coze_config['oauth_client_id'], coze_config['private_key_path'], str(coze_config['public_key_id']))
  52. self.coze_client = CozeChat(
  53. base_url=chat_service.COZE_CN_BASE_URL,
  54. auth_app=coze_oauth_app
  55. )
  56. self.chat_service_type = chat_service_type
  57. # 定时任务调度器
  58. self.scheduler = BackgroundScheduler()
  59. self.scheduler.start()
  60. def setup_initiative_conversations(self, schedule_params: Optional[Dict] = None):
  61. if not schedule_params:
  62. schedule_params = {'hour': '8,16,20'}
  63. self.scheduler.add_job(
  64. self._check_initiative_conversations,
  65. apscheduler.triggers.cron.CronTrigger(**schedule_params)
  66. )
  67. def _get_agent_instance(self, staff_id: str, user_id: str) -> DialogueManager:
  68. """获取Agent实例"""
  69. agent_key = 'agent_{}_{}'.format(staff_id, user_id)
  70. if agent_key not in self.agent_registry:
  71. self.agent_registry[agent_key] = DialogueManager(
  72. staff_id, user_id, self.user_manager, self.agent_state_cache)
  73. return self.agent_registry[agent_key]
  74. def process_messages(self):
  75. """持续处理接收队列消息"""
  76. while True:
  77. message = self.receive_queue.consume()
  78. if message:
  79. try:
  80. self.process_single_message(message)
  81. self.receive_queue.ack(message)
  82. except Exception as e:
  83. logging.error("Error processing message: {}".format(e))
  84. traceback.print_exc()
  85. time.sleep(1)
  86. def _update_user_profile(self, user_id, user_profile, message: str):
  87. profile_to_update = self.user_profile_extractor.extract_profile_info(user_profile, message)
  88. if not profile_to_update:
  89. logging.debug("user_id: {}, no profile info extracted".format(user_id))
  90. return
  91. logging.warning("update user profile: {}".format(profile_to_update))
  92. merged_profile = self.user_profile_extractor.merge_profile_info(user_profile, profile_to_update)
  93. self.user_manager.save_user_profile(user_id, merged_profile)
  94. return merged_profile
  95. def _schedule_aggregation_trigger(self, staff_id: str, user_id: str, delay_sec: int):
  96. logging.debug("user: {}, schedule trigger message after {} seconds".format(user_id, delay_sec))
  97. message_ts = int((time.time() + delay_sec) * 1000)
  98. message = Message.build(MessageType.AGGREGATION_TRIGGER, MessageChannel.SYSTEM, user_id, staff_id, None, message_ts)
  99. # 系统消息使用特定的msgId,无实际意义
  100. message.msgId = -MessageType.AGGREGATION_TRIGGER.value
  101. self.scheduler.add_job(lambda: self.receive_queue.produce(message),
  102. 'date',
  103. run_date=datetime.now() + timedelta(seconds=delay_sec))
  104. def process_single_message(self, message: Message):
  105. user_id = message.sender
  106. staff_id = message.receiver
  107. # 获取用户信息和Agent实例
  108. user_profile = self.user_manager.get_user_profile(user_id)
  109. agent = self._get_agent_instance(staff_id, user_id)
  110. # 更新对话状态
  111. logging.debug("process message: {}".format(message))
  112. need_response, message_text = agent.update_state(message)
  113. logging.debug("user: {}, next state: {}".format(user_id, agent.current_state))
  114. # 根据状态路由消息
  115. if agent.is_in_human_intervention():
  116. self._route_to_human_intervention(user_id, message)
  117. elif agent.current_state == DialogueState.MESSAGE_AGGREGATING:
  118. if message.type != MessageType.AGGREGATION_TRIGGER:
  119. # 产生一个触发器,但是不能由触发器递归产生
  120. logging.debug("user: {}, waiting next message for aggregation".format(user_id))
  121. self._schedule_aggregation_trigger(staff_id, user_id, agent.message_aggregation_sec)
  122. return
  123. elif need_response:
  124. # 先更新用户画像再处理回复
  125. self._update_user_profile(user_id, user_profile, message_text)
  126. self._get_chat_response(user_id, agent, message_text)
  127. else:
  128. logging.debug(f"staff[{staff_id}], user[{user_id}]: do not need response")
  129. def _route_to_human_intervention(self, user_id: str, origin_message: Message):
  130. """路由到人工干预"""
  131. self.human_queue.produce(Message.build(
  132. MessageType.TEXT,
  133. origin_message.channel,
  134. origin_message.sender,
  135. origin_message.receiver,
  136. "用户对话需人工介入,用户名:{}".format(user_id),
  137. int(time.time() * 1000)
  138. ))
  139. def _check_initiative_conversations(self):
  140. """定时检查主动发起对话"""
  141. for staff_user in self.user_relation_manager.list_staff_users():
  142. staff_id = staff_user['staff_id']
  143. user_id = staff_user['user_id']
  144. agent = self._get_agent_instance(staff_id, user_id)
  145. should_initiate = agent.should_initiate_conversation()
  146. if should_initiate:
  147. logging.warning("user: {}, initiate conversation".format(user_id))
  148. self._get_chat_response(user_id, agent, None)
  149. else:
  150. logging.debug("user: {}, do not initiate conversation".format(user_id))
  151. def _get_chat_response(self, user_id: str, agent: DialogueManager,
  152. user_message: Optional[str]):
  153. """处理LLM响应"""
  154. chat_config = agent.build_chat_configuration(user_message, self.chat_service_type)
  155. logging.debug(chat_config)
  156. chat_response = self._call_chat_api(chat_config)
  157. if response := agent.generate_response(chat_response):
  158. logging.warning("user: {}, response: {}".format(user_id, response))
  159. current_ts = int(time.time() * 1000)
  160. self.send_queue.produce(
  161. Message.build(MessageType.TEXT, MessageChannel.CORP_WECHAT,
  162. agent.staff_id, user_id, response, current_ts)
  163. )
  164. def _call_chat_api(self, chat_config: Dict) -> str:
  165. if configs.get().get('debug_flags', {}).get('disable_llm_api_call', False):
  166. return 'LLM模拟回复 {}'.format(datetime.now().strftime("%Y-%m-%d %H:%M:%S"))
  167. if self.chat_service_type == ChatServiceType.OPENAI_COMPATIBLE:
  168. chat_completion = self.llm_client.chat.completions.create(
  169. messages=chat_config['messages'],
  170. model=self.model_name,
  171. )
  172. response = chat_completion.choices[0].message.content
  173. elif self.chat_service_type == ChatServiceType.COZE_CHAT:
  174. bot_user_id = 'dev_user'
  175. response = self.coze_client.create(
  176. chat_config['bot_id'], bot_user_id, chat_config['messages'],
  177. chat_config['custom_variables']
  178. )
  179. else:
  180. raise Exception('Unsupported chat service type: {}'.format(self.chat_service_type))
  181. return response
  182. if __name__ == "__main__":
  183. config = configs.get()
  184. logging_service.setup_root_logger()
  185. scheduler_logger = logging.getLogger('apscheduler')
  186. scheduler_logger.setLevel(logging.WARNING)
  187. use_aliyun_mq = config['debug_flags']['use_aliyun_mq']
  188. # 初始化不同队列的后端
  189. if use_aliyun_mq:
  190. receive_queue = AliyunRocketMQQueueBackend(
  191. config['mq']['endpoints'],
  192. config['mq']['instance_id'],
  193. config['mq']['receive_topic'],
  194. has_consumer=True, has_producer=True,
  195. group_id=config['mq']['receive_group']
  196. )
  197. send_queue = AliyunRocketMQQueueBackend(
  198. config['mq']['endpoints'],
  199. config['mq']['instance_id'],
  200. config['mq']['send_topic'],
  201. has_consumer=False, has_producer=True
  202. )
  203. else:
  204. receive_queue = MemoryQueueBackend()
  205. send_queue = MemoryQueueBackend()
  206. human_queue = MemoryQueueBackend()
  207. # 初始化用户管理服务
  208. # FIXME(zhoutian): 如果不使用MySQL,此数据库配置非必须
  209. user_db_config = config['storage']['user']
  210. staff_db_config = config['storage']['staff']
  211. if config['debug_flags'].get('use_local_user_storage', False):
  212. user_manager = LocalUserManager()
  213. else:
  214. user_manager = MySQLUserManager(user_db_config['mysql'], user_db_config['table'], staff_db_config['table'])
  215. wecom_db_config = config['storage']['user_relation']
  216. user_relation_manager = MySQLUserRelationManager(
  217. user_db_config['mysql'], wecom_db_config['mysql'],
  218. config['storage']['staff']['table'],
  219. user_db_config['table'],
  220. wecom_db_config['table']['staff'],
  221. wecom_db_config['table']['relation'],
  222. wecom_db_config['table']['user']
  223. )
  224. # 创建Agent服务
  225. service = AgentService(
  226. receive_backend=receive_queue,
  227. send_backend=send_queue,
  228. human_backend=human_queue,
  229. user_manager=user_manager,
  230. user_relation_manager=user_relation_manager,
  231. chat_service_type=ChatServiceType.COZE_CHAT
  232. )
  233. # 只有企微场景需要主动发起
  234. if not config['debug_flags'].get('disable_active_conversation', False):
  235. service.setup_initiative_conversations({'second': '5,35'})
  236. process_thread = threading.Thread(target=service.process_messages)
  237. process_thread.start()
  238. if not config['debug_flags'].get('console_input', False):
  239. process_thread.join()
  240. sys.exit(0)
  241. message_id = 0
  242. while True:
  243. print("Input next message: ")
  244. text = sys.stdin.readline().strip()
  245. if not text:
  246. continue
  247. message_id += 1
  248. message = Message.build(MessageType.TEXT, MessageChannel.CORP_WECHAT,
  249. '7881301263964433','1688854492669990', text, int(time.time() * 1000)
  250. )
  251. message.msgId = message_id
  252. receive_queue.produce(message)
  253. time.sleep(0.1)
  254. process_thread.join()