# recommend.py
  1. import time
  2. import multiprocessing
  3. import traceback
  4. from datetime import datetime
  5. from log import Log
  6. from config import set_config
  7. from video_recall import PoolRecall
  8. from video_rank import video_rank, bottom_strategy
  9. from db_helper import RedisHelper
  10. import gevent
# Module-level logger used by every function in this file.
log_ = Log()
# Configuration object returned by set_config(); this file reads AB_CODE, K,
# PREVIEW_KEY_PREFIX, UPDATE_ROV_KEY_NAME and LOCAL_DISTRIBUTE_COUNT_PREFIX from it.
config_ = set_config()
  13. def video_recommend(mid, uid, size, app_type, algo_type, client_info):
  14. """
  15. 首页线上推荐逻辑
  16. :param mid: mid type-string
  17. :param uid: uid type-string
  18. :param size: 请求视频数量 type-int
  19. :param app_type: 产品标识 type-int
  20. :param algo_type: 算法类型 type-string
  21. :param client_info: 用户位置信息 {"country": "国家", "province": "省份", "city": "城市"}
  22. :return:
  23. """
  24. ab_code = config_.AB_CODE
  25. # ####### 多进程召回
  26. start_recall = time.time()
  27. # log_.info('====== recall')
  28. '''
  29. cores = multiprocessing.cpu_count()
  30. pool = multiprocessing.Pool(processes=cores)
  31. pool_recall = PoolRecall(app_type=app_type, mid=mid, uid=uid, ab_code=ab_code)
  32. _, last_rov_recall_key, _ = pool_recall.get_video_last_idx()
  33. pool_list = [
  34. # rov召回池
  35. pool.apply_async(pool_recall.rov_pool_recall, (size,)),
  36. # 流量池
  37. pool.apply_async(pool_recall.flow_pool_recall, (size,))
  38. ]
  39. recall_result_list = [p.get() for p in pool_list]
  40. pool.close()
  41. pool.join()
  42. '''
  43. recall_result_list = []
  44. pool_recall = PoolRecall(app_type=app_type, mid=mid, uid=uid, ab_code=ab_code, client_info=client_info)
  45. _, last_rov_recall_key, _ = pool_recall.get_video_last_idx()
  46. t = [gevent.spawn(pool_recall.rov_pool_recall, size), gevent.spawn(pool_recall.flow_pool_recall, size) ]
  47. gevent.joinall(t)
  48. recall_result_list = [i.get() for i in t]
  49. end_recall = time.time()
  50. log_.info('mid: {}, uid: {}, recall: {}, execute time = {}ms'.format(
  51. mid, uid, recall_result_list, (end_recall - start_recall) * 1000))
  52. # ####### 排序
  53. start_rank = time.time()
  54. # log_.info('====== rank')
  55. data = {
  56. 'rov_pool_recall': recall_result_list[0],
  57. 'flow_pool_recall': recall_result_list[1]
  58. }
  59. rank_result = video_rank(data=data, size=size)
  60. end_rank = time.time()
  61. log_.info('mid: {}, uid: {}, rank_result: {}, execute time = {}ms'.format(
  62. mid, uid, rank_result, (end_rank - start_rank) * 1000))
  63. if not rank_result:
  64. # 兜底策略
  65. # log_.info('====== bottom strategy')
  66. start_bottom = time.time()
  67. rank_result = bottom_strategy(size=size, app_type=app_type, ab_code=ab_code)
  68. end_bottom = time.time()
  69. log_.info('mid: {}, uid: {}, bottom strategy result: {}, execute time = {}ms'.format(
  70. mid, uid, rank_result, (end_bottom - start_bottom) * 1000))
  71. # ####### redis数据刷新
  72. # log_.info('====== update redis')
  73. # 预曝光数据同步刷新到Redis, 过期时间为0.5h
  74. redis_helper = RedisHelper()
  75. preview_key_name = config_.PREVIEW_KEY_PREFIX + '{}.{}'.format(app_type, mid)
  76. preview_video_ids = [int(item['videoId']) for item in rank_result]
  77. if preview_video_ids:
  78. # log_.error('key_name = {} \n values = {}'.format(preview_key_name, tuple(preview_video_ids)))
  79. redis_helper.add_data_with_set(key_name=preview_key_name, values=tuple(preview_video_ids), expire_time=30*60)
  80. log_.info('preview redis update success!')
  81. # 将此次获取的ROV召回池config_.K末位视频id同步刷新到Redis中,方便下次快速定位到召回位置,过期时间为1天
  82. rov_recall_video = [item['videoId'] for item in rank_result[:3] if item['pushFrom'] == 'recall_pool']
  83. if 0 < len(rov_recall_video) <= config_.K:
  84. if not redis_helper.get_score_with_value(key_name=config_.UPDATE_ROV_KEY_NAME, value=rov_recall_video[-1]):
  85. redis_helper.set_data_to_redis(key_name=last_rov_recall_key, value=rov_recall_video[-1])
  86. elif len(rov_recall_video) > config_.K:
  87. if not redis_helper.get_score_with_value(key_name=config_.UPDATE_ROV_KEY_NAME, value=rov_recall_video[config_.K - 1]):
  88. redis_helper.set_data_to_redis(key_name=last_rov_recall_key, value=rov_recall_video[config_.K - 1])
  89. log_.info('last video redis update success!')
  90. # 将此次分发的流量池视频,对 本地分发数-1 进行记录
  91. flow_recall_video = [item for item in rank_result if item['pushFrom'] == 'flow_pool']
  92. if flow_recall_video:
  93. update_local_distribute_count(flow_recall_video)
  94. log_.info('update local distribute count success!')
  95. return rank_result
  96. def update_local_distribute_count(videos):
  97. """
  98. 更新本地分发数
  99. :param videos: 视频列表 type-list [{'videoId':'', 'flowPool':'', 'distributeCount': '',
  100. 'rovScore': '', 'pushFrom': 'flow_pool', 'abCode': self.ab_code}, ....]
  101. :return:
  102. """
  103. try:
  104. redis_helper = RedisHelper()
  105. for item in videos:
  106. key_name = '{}{}.{}'.format(config_.LOCAL_DISTRIBUTE_COUNT_PREFIX, item['videoId'], item['flowPool'])
  107. # 本地记录的分发数 - 1
  108. redis_helper.decr_key(key_name=key_name, amount=1, expire_time=5 * 60)
  109. # if redis_helper.key_exists(key_name=key_name):
  110. # # 该视频本地有记录,本地记录的分发数 - 1
  111. # redis_helper.decr_key(key_name=key_name, amount=1, expire_time=5 * 60)
  112. # else:
  113. # # 该视频本地无记录,接口获取的分发数 - 1
  114. # redis_helper.incr_key(key_name=key_name, amount=int(item['distributeCount']) - 1, expire_time=5 * 60)
  115. except Exception as e:
  116. log_.error('update_local_distribute_count error...')
  117. log_.error(traceback.format_exc())
  118. def video_relevant_recommend(mid, uid, size, app_type):
  119. """
  120. 相关推荐逻辑
  121. :param mid: mid type-string
  122. :param uid: uid type-string
  123. :param size: 请求视频数量 type-int
  124. :param app_type: 产品标识 type-int
  125. :return: videos type-list
  126. """
  127. videos = video_recommend(mid=mid, uid=uid, size=size, app_type=app_type, algo_type='', client_info=None)
  128. return videos
  129. if __name__ == '__main__':
  130. videos = [{'videoId': '12345', 'flowPool': '133#442#2', 'distributeCount': 10}]
  131. update_local_distribute_count(videos)