user_manager.py 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460
  1. #! /usr/bin/env python
  2. # -*- coding: utf-8 -*-
  3. # vim:fenc=utf-8
  4. from pqai_agent.logging_service import logger
  5. from typing import Dict, Optional, List
  6. import json
  7. import time
  8. import os
  9. import abc
  10. import pymysql.cursors
  11. from pqai_agent import configs
  12. from pqai_agent.database import MySQLManager
  13. class UserManager(abc.ABC):
  14. @abc.abstractmethod
  15. def get_user_profile(self, user_id) -> Dict:
  16. pass
  17. @abc.abstractmethod
  18. def save_user_profile(self, user_id, profile: Dict) -> None:
  19. pass
  20. @abc.abstractmethod
  21. def list_all_users(self):
  22. pass
  23. @abc.abstractmethod
  24. def get_staff_profile(self, staff_id) -> Dict:
  25. #FIXME(zhoutian): 重新设计用户和员工数据管理模型
  26. pass
  27. @staticmethod
  28. def get_default_profile(**kwargs) -> Dict:
  29. default_profile = {
  30. "name": "",
  31. "nickname": "",
  32. "avatar": "",
  33. "preferred_nickname": "",
  34. "gender": "未知",
  35. "age": 0,
  36. "region": '',
  37. "interests": [],
  38. "family_members": {},
  39. "health_conditions": [],
  40. "medications": [],
  41. "reminder_preferences": {
  42. "medication": True,
  43. "health": True,
  44. "weather": True,
  45. "news": False
  46. },
  47. "interaction_style": "standard", # standard, verbose, concise
  48. "interaction_frequency": "medium", # low, medium, high
  49. "last_topics": [],
  50. "created_at": int(time.time() * 1000),
  51. "human_intervention_history": []
  52. }
  53. for key, value in kwargs.items():
  54. if key in default_profile:
  55. default_profile[key] = value
  56. return default_profile
  57. def list_users(self, **kwargs) -> List[Dict]:
  58. pass
  59. class UserRelationManager(abc.ABC):
  60. @abc.abstractmethod
  61. def list_staffs(self):
  62. pass
  63. @abc.abstractmethod
  64. def list_users(self, staff_id: str, page: int = 1, page_size: int = 100):
  65. pass
  66. @abc.abstractmethod
  67. def list_staff_users(self, staff_id: str = None, tag_id: int = None) -> List[Dict]:
  68. pass
  69. @abc.abstractmethod
  70. def get_user_tags(self, user_id: str) -> List[str]:
  71. pass
  72. @abc.abstractmethod
  73. def stop_user_daily_push(self, user_id: str) -> bool:
  74. pass
  75. class LocalUserManager(UserManager):
  76. def get_user_profile(self, user_id) -> Dict:
  77. """加载用户个人资料,如不存在则创建默认资料。主要用于本地调试"""
  78. default_profile = self.get_default_profile()
  79. try:
  80. with open(f"user_profiles/{user_id}.json", "r", encoding="utf-8") as f:
  81. profile = json.load(f)
  82. entry_added = False
  83. for key, value in default_profile.items():
  84. if key not in profile:
  85. logger.debug(f"user[{user_id}] add profile key[{key}] value[{value}]")
  86. profile[key] = value
  87. entry_added = True
  88. if entry_added:
  89. self.save_user_profile(user_id, profile)
  90. return profile
  91. except FileNotFoundError:
  92. # 创建默认用户资料
  93. self.save_user_profile(user_id, default_profile)
  94. return default_profile
  95. def save_user_profile(self, user_id, profile: Dict) -> None:
  96. if not user_id:
  97. raise Exception("Invalid user_id: {}".format(user_id))
  98. with open(f"user_profiles/{user_id}.json", "w", encoding="utf-8") as f:
  99. json.dump(profile, f, ensure_ascii=False, indent=2)
  100. def list_all_users(self):
  101. user_ids = []
  102. for root, dirs, files in os.walk('../user_profiles/'):
  103. for file in files:
  104. if file.endswith('.json'):
  105. user_ids.append(os.path.splitext(file)[0])
  106. return user_ids
  107. def get_staff_profile(self, staff_id) -> Dict:
  108. try:
  109. with open(f"user_profiles/{staff_id}.json", "r", encoding="utf-8") as f:
  110. profile = json.load(f)
  111. entry_added = False
  112. if entry_added:
  113. self.save_user_profile(staff_id, profile)
  114. return profile
  115. except Exception as e:
  116. logger.error("staff profile not found: {}".format(e))
  117. return {}
  118. def list_users(self, **kwargs) -> List[Dict]:
  119. pass
  120. class MySQLUserManager(UserManager):
  121. PROFILE_EXCLUDE_ITEMS = ['avatar', ]
  122. def __init__(self, db_config, table_name, staff_table):
  123. self.db = MySQLManager(db_config)
  124. self.table_name = table_name
  125. self.staff_table = staff_table
  126. def get_user_profile(self, user_id) -> Dict:
  127. sql = f"SELECT name, wxid, profile_data_v1, gender, iconurl as avatar" \
  128. f" FROM {self.table_name} WHERE third_party_user_id = {user_id}"
  129. data = self.db.select(sql, pymysql.cursors.DictCursor)
  130. if not data:
  131. logger.error(f"user[{user_id}] not found")
  132. return {}
  133. data = data[0]
  134. gender_map = {0: '未知', 1: '男', 2: '女', None: '未知'}
  135. gender = gender_map[data['gender']]
  136. default_profile = self.get_default_profile(nickname=data['name'], gender=gender, avatar=data['avatar'])
  137. if not data['profile_data_v1']:
  138. logger.warning(f"user[{user_id}] profile not found, create a default one")
  139. self.save_user_profile(user_id, default_profile)
  140. return default_profile
  141. else:
  142. profile = json.loads(data['profile_data_v1'])
  143. # 资料条目有增加时,需合并更新
  144. entry_added = False
  145. for key, value in default_profile.items():
  146. if key not in profile:
  147. # logger.debug(f"user[{user_id}] add profile key[{key}] value[{value}]")
  148. profile[key] = value
  149. entry_added = True
  150. if entry_added:
  151. self.save_user_profile(user_id, profile)
  152. return profile
  153. def save_user_profile(self, user_id, profile: Dict) -> None:
  154. if not user_id:
  155. raise Exception("Invalid user_id: {}".format(user_id))
  156. if configs.get().get('debug_flags', {}).get('disable_database_write', False):
  157. return
  158. profile = profile.copy()
  159. for name in self.PROFILE_EXCLUDE_ITEMS:
  160. profile.pop(name, None)
  161. sql = f"UPDATE {self.table_name} SET profile_data_v1 = %s WHERE third_party_user_id = {user_id}"
  162. self.db.execute(sql, (json.dumps(profile),))
  163. def list_all_users(self):
  164. sql = f"SELECT third_party_user_id FROM {self.table_name}"
  165. data = self.db.select(sql, pymysql.cursors.DictCursor)
  166. return [user['third_party_user_id'] for user in data]
  167. def get_staff_profile(self, staff_id) -> Dict:
  168. if not self.staff_table:
  169. raise Exception("staff_table is not set")
  170. return self.get_staff_profile_v3(staff_id)
  171. def get_staff_profile_v1(self, staff_id) -> Dict:
  172. sql = f"SELECT agent_name, agent_gender, agent_age, agent_region, agent_profile " \
  173. f"FROM {self.staff_table} WHERE third_party_user_id = '{staff_id}'"
  174. data = self.db.select(sql, pymysql.cursors.DictCursor)
  175. if not data:
  176. logger.error(f"staff[{staff_id}] not found")
  177. return {}
  178. profile = data[0]
  179. # 转换性别格式
  180. gender_map = {0: '未知', 1: '男', 2: '女', None: '未知'}
  181. profile['agent_gender'] = gender_map[profile['agent_gender']]
  182. return profile
  183. def get_staff_profile_v2(self, staff_id) -> Dict:
  184. sql = f"SELECT agent_name as name, agent_gender as gender, agent_age as age, agent_region as region, agent_profile " \
  185. f"FROM {self.staff_table} WHERE third_party_user_id = '{staff_id}'"
  186. data = self.db.select(sql, pymysql.cursors.DictCursor)
  187. if not data:
  188. logger.error(f"staff[{staff_id}] not found")
  189. return {}
  190. profile = data[0]
  191. # 转换性别格式
  192. gender_map = {0: '未知', 1: '男', 2: '女', None: '未知'}
  193. profile['gender'] = gender_map[profile['gender']]
  194. # 合并JSON字段(新版本)数据
  195. if profile['agent_profile']:
  196. detail_profile = json.loads(profile['agent_profile'])
  197. profile.update(detail_profile)
  198. # 去除原始字段
  199. profile.pop('agent_profile', None)
  200. return profile
  201. def get_staff_profile_v3(self, staff_id) -> Dict:
  202. sql = f"SELECT agent_profile " \
  203. f"FROM {self.staff_table} WHERE third_party_user_id = '{staff_id}'"
  204. data = self.db.select(sql)
  205. if not data:
  206. logger.error(f"staff[{staff_id}] not found")
  207. return {}
  208. profile_str = data[0][0]
  209. if not profile_str:
  210. return {}
  211. profile = json.loads(profile_str)
  212. return profile
  213. def save_staff_profile(self, staff_id: str, profile: Dict):
  214. # 正常情况下不应该有此操作
  215. if not self.staff_table:
  216. raise Exception("staff_table is not set")
  217. if not staff_id:
  218. raise Exception("Invalid staff_id: {}".format(staff_id))
  219. sql = f"UPDATE {self.staff_table} SET agent_profile = %s WHERE third_party_user_id = '{staff_id}'"
  220. self.db.execute(sql, (json.dumps(profile),))
  221. def list_users(self, **kwargs) -> List[Dict]:
  222. user_union_id = kwargs.get('user_union_id', None)
  223. user_name = kwargs.get('user_name', None)
  224. if not user_union_id and not user_name:
  225. raise Exception("user_union_id or user_name is required")
  226. sql = f"SELECT third_party_user_id, wxid, name, iconurl, gender FROM {self.table_name} WHERE 1=1 "
  227. if user_name:
  228. sql += f"AND name = '{user_name}' COLLATE utf8mb4_bin "
  229. if user_union_id:
  230. sql += f"AND wxid = '{user_union_id}' "
  231. data = self.db.select(sql, pymysql.cursors.DictCursor)
  232. return data
  233. def get_staff_list(self, page_id: int, page_size: int) -> Dict:
  234. """
  235. :param page_size:
  236. :param page_id:
  237. :return:
  238. """
  239. sql = f"""
  240. select t1.third_party_user_id as staff_id, t1.name as staff_name, t2.iconurl as avatar
  241. from qywx_employee t1 left join third_party_user t2
  242. on t1.third_party_user_id = t2.third_party_user_id
  243. limit %s offset %s;
  244. """
  245. staff_list = self.db.select(
  246. sql=sql,
  247. cursor_type=pymysql.cursors.DictCursor,
  248. args=(page_size + 1, page_size * (page_id - 1))
  249. )
  250. if len(staff_list) > page_size:
  251. has_next_page = True
  252. next_page_id = page_id + 1
  253. staff_list = staff_list[:page_size]
  254. else:
  255. has_next_page = False
  256. next_page_id = None
  257. return {
  258. "has_next_page": has_next_page,
  259. "next_page": next_page_id,
  260. "data": staff_list
  261. }
  262. class LocalUserRelationManager(UserRelationManager):
  263. def __init__(self):
  264. pass
  265. def list_staffs(self):
  266. return [
  267. {"third_party_user_id": '1688855931724582', "name": "", "wxid": "ShengHuoLeQu", "agent_name": "小芳"}
  268. ]
  269. def list_users(self, staff_id: str, page: int = 1, page_size: int = 100):
  270. return []
  271. def list_staff_users(self, staff_id: str = None, tag_id: int = None):
  272. user_ids = ['7881299453089278', '7881299453132630', '7881299454186909', '7881299455103430', '7881299455173476',
  273. '7881299456216398', '7881299457990953', '7881299461167644', '7881299463002136', '7881299464081604',
  274. '7881299465121735', '7881299465998082', '7881299466221881', '7881299467152300', '7881299470051791',
  275. '7881299470112816', '7881299471149567', '7881299471168030', '7881299471277650', '7881299473321703']
  276. user_ids = user_ids[:5]
  277. return [
  278. {"staff_id": "1688855931724582", "user_id": "7881299670930896"},
  279. *[{"staff_id": "1688855931724582", "user_id": user_id} for user_id in user_ids]
  280. ]
  281. def get_user_tags(self, user_id: str):
  282. return []
  283. def stop_user_daily_push(self, user_id: str) -> bool:
  284. return True
  285. class MySQLUserRelationManager(UserRelationManager):
  286. def __init__(self, agent_db_config, wecom_db_config,
  287. agent_staff_table, agent_user_table,
  288. staff_table, relation_table, user_table):
  289. # FIXME(zhoutian): 因为现在数据库表不统一,需要从两个库读取
  290. self.agent_db = MySQLManager(agent_db_config)
  291. self.wecom_db = MySQLManager(wecom_db_config)
  292. self.agent_staff_table = agent_staff_table
  293. self.staff_table = staff_table
  294. self.relation_table = relation_table
  295. self.agent_user_table = agent_user_table
  296. self.user_table = user_table
  297. def list_staffs(self):
  298. sql = f"SELECT third_party_user_id, name, wxid, agent_name FROM {self.agent_staff_table} WHERE status = 1"
  299. data = self.agent_db.select(sql, pymysql.cursors.DictCursor)
  300. return data
  301. def list_users(self, staff_id: str, page: int = 1, page_size: int = 100):
  302. return []
  303. def list_staff_users(self, staff_id: str = None, tag_id: int = None):
  304. sql = f"SELECT third_party_user_id, wxid FROM {self.agent_staff_table} WHERE status = 1"
  305. if staff_id:
  306. sql += f" AND third_party_user_id = '{staff_id}'"
  307. agent_staff_data = self.agent_db.select(sql, pymysql.cursors.DictCursor)
  308. if not agent_staff_data:
  309. return []
  310. ret = []
  311. for agent_staff in agent_staff_data:
  312. wxid = agent_staff['wxid']
  313. sql = f"SELECT id FROM {self.staff_table} WHERE carrier_id = '{wxid}'"
  314. staff_data = self.wecom_db.select(sql, pymysql.cursors.DictCursor)
  315. if not staff_data:
  316. logger.error(f"staff[{wxid}] not found in wecom database")
  317. continue
  318. staff_id = staff_data[0]['id']
  319. sql = f"SELECT user_id FROM {self.relation_table} WHERE staff_id = '{staff_id}' AND is_delete = 0"
  320. user_data = self.wecom_db.select(sql, pymysql.cursors.DictCursor)
  321. if not user_data:
  322. logger.warning(f"staff[{wxid}] has no user")
  323. continue
  324. user_ids = tuple(user['user_id'] for user in user_data)
  325. sql = f"SELECT union_id FROM {self.user_table} WHERE id IN {str(user_ids)} AND union_id is not null"
  326. if tag_id:
  327. sql += f" AND id in (SELECT distinct user_id FROM we_com_user_with_tag WHERE tag_id = {tag_id} and is_delete = 0)"
  328. user_data = self.wecom_db.select(sql, pymysql.cursors.DictCursor)
  329. if not user_data:
  330. logger.warning(f"staff[{wxid}] users not found in wecom database")
  331. continue
  332. user_union_ids = tuple(user['union_id'] for user in user_data)
  333. batch_size = 500
  334. n_batches = (len(user_union_ids) + batch_size - 1) // batch_size
  335. agent_user_data = []
  336. for i in range(n_batches):
  337. idx_begin = i * batch_size
  338. idx_end = min((i + 1) * batch_size, len(user_union_ids))
  339. batch_union_ids = user_union_ids[idx_begin:idx_end]
  340. sql = f"SELECT third_party_user_id, wxid FROM {self.agent_user_table} WHERE wxid IN {str(batch_union_ids)}"
  341. batch_agent_user_data = self.agent_db.select(sql, pymysql.cursors.DictCursor)
  342. if len(agent_user_data) != len(batch_union_ids):
  343. # logger.debug(f"staff[{wxid}] some users not found in agent database")
  344. pass
  345. agent_user_data.extend(batch_agent_user_data)
  346. staff_user_pairs = [
  347. {
  348. 'staff_id': agent_staff['third_party_user_id'],
  349. 'user_id': agent_user['third_party_user_id']
  350. }
  351. for agent_user in agent_user_data
  352. ]
  353. ret.extend(staff_user_pairs)
  354. return ret
  355. def get_user_union_id(self, user_id: str) -> Optional[str]:
  356. sql = f"SELECT wxid FROM {self.agent_user_table} WHERE third_party_user_id = '{user_id}' AND wxid is not null"
  357. user_data = self.agent_db.select(sql, pymysql.cursors.DictCursor)
  358. if not user_data:
  359. logger.error(f"user[{user_id}] has no union id")
  360. return None
  361. union_id = user_data[0]['wxid']
  362. return union_id
  363. def get_user_tags(self, user_id: str) -> List[str]:
  364. union_id = self.get_user_union_id(user_id)
  365. if not union_id:
  366. return []
  367. sql = f"""
  368. select b.tag_id, c.`tag_name` from `we_com_user` as a
  369. join `we_com_user_with_tag` as b
  370. join `we_com_tag` as c
  371. on a.`id` = b.`user_id`
  372. and b.`tag_id` = c.id
  373. where a.union_id = '{union_id}' """
  374. tag_data = self.wecom_db.select(sql, pymysql.cursors.DictCursor)
  375. tag_names = [tag['tag_name'] for tag in tag_data]
  376. return tag_names
  377. def stop_user_daily_push(self, user_id: str) -> bool:
  378. try:
  379. union_id = self.get_user_union_id(user_id)
  380. if not union_id:
  381. return False
  382. sql = f"UPDATE {self.user_table} SET group_msg_disabled = 1 WHERE union_id = %s"
  383. rows = self.wecom_db.execute(sql, (union_id, ))
  384. if rows > 0:
  385. return True
  386. else:
  387. return False
  388. except Exception as e:
  389. logger.error(f"stop_user_daily_push failed: {e}")
  390. return False
  391. if __name__ == '__main__':
  392. config = configs.get()
  393. user_db_config = config['storage']['user']
  394. staff_db_config = config['storage']['staff']
  395. user_manager = MySQLUserManager(user_db_config['mysql'], user_db_config['table'], staff_db_config['table'])
  396. user_profile = user_manager.get_user_profile('7881301263964433')
  397. print(user_profile)
  398. wecom_db_config = config['storage']['user_relation']
  399. user_relation_manager = MySQLUserRelationManager(
  400. user_db_config['mysql'], wecom_db_config['mysql'],
  401. config['storage']['staff']['table'],
  402. user_db_config['table'],
  403. wecom_db_config['table']['staff'],
  404. wecom_db_config['table']['relation'],
  405. wecom_db_config['table']['user']
  406. )
  407. # all_staff_users = user_relation_manager.list_staff_users()
  408. user_tags = user_relation_manager.get_user_tags('7881302078008656')
  409. print(user_tags)