utils.py 6.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184
  1. import requests
  2. import json
  3. import time
  4. from db_helper import HologresHelper, RedisHelper
  5. from config import set_config
  6. from log import Log
# Module-wide configuration object; the code below reads its endpoint URLs
# (GET_REMAIN_VIEW_COUNT_URL, VIDEO_FILTER_URL), PREVIEW_KEY_PREFIX and VIDEO_STATUS.
config_ = set_config()
# Module-wide logger instance shared by every function and method in this file.
log_ = Log()
  9. def request_post(request_url, request_data, timeout=1.0):
  10. """
  11. post 请求 HTTP接口
  12. :param request_url: 接口URL
  13. :param request_data: 请求参数
  14. :param timeout: 超时时间,默认为1秒,type-float
  15. :return: res_data json格式
  16. """
  17. try:
  18. response = requests.post(url=request_url, json=request_data, timeout=timeout)
  19. if response.status_code == 200:
  20. res_data = json.loads(response.text)
  21. return res_data
  22. else:
  23. return None
  24. except requests.exceptions.Timeout as e:
  25. log_.error('url: {} timeout, exception: {}'.format(request_url, e))
  26. return None
  27. def get_videos_remain_view_count(app_type, videos):
  28. """
  29. 获取视频在流量池中的剩余可分发数
  30. :param app_type: 产品标识 type-int
  31. :param videos: 视频信息 (视频id, 流量池标记) type-list,[{'videoId': video_id, 'flowPool': flow_pool}, ...]
  32. :return: data type-list,[(video_id, flow_pool, view_count), ...]
  33. """
  34. if not videos:
  35. return []
  36. request_data = {'appType': app_type, 'videos': videos}
  37. result = request_post(request_url=config_.GET_REMAIN_VIEW_COUNT_URL, request_data=request_data, timeout=1)
  38. if result is None:
  39. return []
  40. if result['code'] != 0:
  41. log_.info('获取视频在流量池中的剩余可分发数失败')
  42. return []
  43. data = [(item['videoId'], item['flowPool'], item['distributeCount']) for item in result['data']]
  44. return data
  45. class FilterVideos(object):
  46. """视频过滤"""
  47. def __init__(self, app_type, video_ids, mid='', uid=''):
  48. """
  49. 初始化
  50. :param app_type: 产品标识 type-int
  51. :param video_ids: 需过滤的视频列表 type-list
  52. :param mid: mid type-string
  53. :param uid: uid type-string
  54. """
  55. self.app_type = app_type
  56. self.mid = mid
  57. self.uid = uid
  58. self.video_ids = video_ids
  59. def filter_videos(self):
  60. """视频过滤"""
  61. # 预曝光过滤
  62. st_pre = time.time()
  63. filtered_pre_result = self.filter_video_previewed(self.video_ids)
  64. et_pre = time.time()
  65. log_.info('filter by previewed: app_type = {}, result = {}, execute time = {}ms'.format(
  66. self.app_type, filtered_pre_result, (et_pre - st_pre) * 1000))
  67. if not filtered_pre_result:
  68. return None
  69. # 视频状态过滤
  70. st_status = time.time()
  71. filtered_status_result = self.filter_video_status(video_ids=filtered_pre_result)
  72. et_status = time.time()
  73. log_.info('filter by video status: result = {}, execute time = {}ms'.format(
  74. filtered_status_result, (et_status - st_status) * 1000))
  75. if not filtered_status_result:
  76. return None
  77. # 视频已曝光过滤
  78. st_viewed = time.time()
  79. filtered_viewed_result = self.filter_video_viewed(video_ids=filtered_status_result)
  80. et_viewed = time.time()
  81. log_.info('filter by viewed: app_type = {}, mid = {}, uid = {}, result = {}, execute time = {}ms'.format(
  82. self.app_type, self.mid, self.uid, filtered_viewed_result, (et_viewed - st_viewed) * 1000))
  83. if not filtered_viewed_result:
  84. return None
  85. else:
  86. return filtered_viewed_result
  87. def filter_video_previewed(self, video_ids):
  88. """
  89. 预曝光过滤
  90. :param video_ids: 需过滤的视频列表 type-list
  91. :return: filtered_videos 过滤后的列表 type-list
  92. """
  93. # 根据Redis缓存中的数据过滤
  94. redis_helper = RedisHelper()
  95. # key拼接
  96. key_name = config_.PREVIEW_KEY_PREFIX + '{}.{}'.format(self.app_type, self.mid)
  97. pe_videos_list = redis_helper.get_data_from_set(key_name)
  98. if not pe_videos_list:
  99. return video_ids
  100. pe_videos = [eval(video) for video in pe_videos_list]
  101. filtered_videos = [video_id for video_id in video_ids if video_id not in pe_videos]
  102. return filtered_videos
  103. def filter_video_status(self, video_ids):
  104. """
  105. 对视频状态进行过滤
  106. :param video_ids: 视频id列表 type-list
  107. :return: filtered_videos
  108. """
  109. if len(video_ids) == 1:
  110. sql = "set hg_experimental_enable_shard_pruning=off; " \
  111. "SELECT video_id " \
  112. "FROM {} " \
  113. "WHERE audit_status = 5 " \
  114. "AND applet_rec_status IN (1, -6) " \
  115. "AND open_status = 1 " \
  116. "AND payment_status = 0 " \
  117. "AND encryption_status IS NULL " \
  118. "AND transcoding_status = 3 " \
  119. "AND video_id IN ({});".format(config_.VIDEO_STATUS, video_ids[0])
  120. else:
  121. sql = "set hg_experimental_enable_shard_pruning=off; " \
  122. "SELECT video_id " \
  123. "FROM {} " \
  124. "WHERE audit_status = 5 " \
  125. "AND applet_rec_status IN (1, -6) " \
  126. "AND open_status = 1 " \
  127. "AND payment_status = 0 " \
  128. "AND encryption_status IS NULL " \
  129. "AND transcoding_status = 3 " \
  130. "AND video_id IN {};".format(config_.VIDEO_STATUS, tuple(video_ids))
  131. hologres_helper = HologresHelper()
  132. data = hologres_helper.get_data(sql=sql)
  133. filtered_videos = [temp[0] for temp in data]
  134. return filtered_videos
  135. def filter_video_viewed(self, video_ids, types=(1,)):
  136. """
  137. 调用后端接口过滤用户已观看视频
  138. :param video_ids: 视频id列表 type-list
  139. :param types: 过滤参数 type-tuple, 默认(1, ) 1-已观看 2-视频状态 3-是否进入老年人社区 4-话题状态 5-推荐状态
  140. :return: filtered_videos
  141. """
  142. # 调用http接口
  143. request_data = {"appType": self.app_type,
  144. "mid": self.mid,
  145. "uid": self.uid,
  146. "types": list(types),
  147. "videoIds": video_ids}
  148. result = request_post(request_url=config_.VIDEO_FILTER_URL, request_data=request_data, timeout=2.5)
  149. if result is None:
  150. log_.info('过滤失败,types: {}'.format(types))
  151. return video_ids
  152. if result['code'] != 0:
  153. log_.info('过滤失败,types: {}'.format(types))
  154. return video_ids
  155. filtered_videos = result['data']
  156. return filtered_videos
  157. if __name__ == '__main__':
  158. filter_ = FilterVideos(app_type=1, mid='22', uid='www', video_ids=[1, 2, 3, 55])
  159. filter_.filter_videos()
  160. filter_.filter_video_status(video_ids=[1, 3, 5])