download_sendtime.py 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196
  1. # -*- coding: utf-8 -*-
  2. # @Author: wangkun
  3. # @Time: 2022/4/18
  4. """
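Download and upload: publish-time ("send time") ranking.
Rules:
1. Basic rule: send_time_rule()
2. The video was published within the last 7 days (current time - publish time <= 604800 s) and has at least 10,000 plays.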
  9. """
  10. import json
  11. import os
  12. import random
  13. import sys
  14. import time
  15. import requests
  16. import urllib3
  17. sys.path.append(os.getcwd())
  18. from main.common import Common
  19. from main.get_feeds import get_feeds
  20. from main.publish import Publish
  21. from main.feishu_lib import Feishu
# Proxy mapping handed to requests.get() as ``proxies=`` by DownloadSendtime.
# NOTE(review): None for both schemes is presumably meant to bypass any
# system/environment proxy - confirm against the requests documentation.
proxies = {"http": None, "https": None}
  23. class DownloadSendtime:
  24. @staticmethod
  25. def send_time_rule(send_time_width, send_time_height, send_time_duration, send_time_share_cnt):
  26. """
  27. 1.分辨率,宽或者高 >= 720 or == 0
  28. 2.600s >= 时长 >= 60s
  29. 3.视频播放量 >= 0
  30. """
  31. if int(send_time_width) >= 720 or int(send_time_height) >= 720 \
  32. or send_time_width == "0" or send_time_height == "0":
  33. if 600 >= int(send_time_duration) >= 60:
  34. if int(send_time_share_cnt) > 0:
  35. return True
  36. else:
  37. return False
  38. else:
  39. return False
  40. else:
  41. return False
  42. @classmethod
  43. def download_sendtime_video(cls, env):
  44. """
  45. 视频发布3日内,播放量大于2万(当前时间 - 发布时间 <= 3 天)
  46. :param env: 测试环境:dev;正式环境:prod
  47. :return: 下载并上传视频
  48. """
  49. if len(Feishu.get_values_batch("Y8N3Vl")) == 1:
  50. pass
  51. else:
  52. for i in range(len(Feishu.get_values_batch("Y8N3Vl"))):
  53. try:
  54. sendtime_session = Common.get_session()
  55. Common.crawler_log().info("获取视频info时,session:{}".format(sendtime_session))
  56. download_video_id = Feishu.get_values_batch("Y8N3Vl")[i+1][1]
  57. download_video_title = Feishu.get_values_batch("Y8N3Vl")[i+1][3]
  58. url = "https://search.weixin.qq.com/cgi-bin/recwxa/recwxagetonevideoinfo?"
  59. param = {
  60. "session": sendtime_session,
  61. "vid": download_video_id,
  62. "wxaVersion": "3.9.2",
  63. "channelid": "208201",
  64. "scene": "32",
  65. "subscene": "1089",
  66. "model": "iPhone 11<iPhone12,1>14.7.1",
  67. "clientVersion": "8.0.18",
  68. "sharesearchid": "447665862521758270",
  69. "sharesource": "-1"
  70. }
  71. urllib3.disable_warnings()
  72. r = requests.get(url=url, params=param, proxies=proxies, verify=False)
  73. response = json.loads(r.content.decode("utf8"))
  74. if "data" not in response:
  75. Common.crawler_log().error("获取视频info时错误,删除该视频:{}".format(download_video_title))
  76. # 删除行或列,可选 ROWS、COLUMNS
  77. Feishu.dimension_range("Y8N3Vl", "ROWS", i + 2, i + 2)
  78. else:
  79. data = response["data"]
  80. v_duration = data["duration"]
  81. v_play_cnt_sendtime = data["played_cnt"]
  82. v_comment_cnt = data["comment_cnt"]
  83. v_liked_cnt = data["liked_cnt"]
  84. v_shared_cnt = data["shared_cnt"]
  85. v_width = data["width"]
  86. v_height = data["height"]
  87. v_resolution = str(v_width) + "*" + str(v_height)
  88. v_send_date = data["upload_time"]
  89. v_username = data["user_info"]["nickname"].strip().replace("\n", "")
  90. v_user_cover = data["user_info"]["headimg_url"]
  91. v_video_cover = data["cover_url"]
  92. if "items" not in data["play_info"]:
  93. if len(data["play_info"]) > 2:
  94. download_url_up = data["play_info"][2]["play_url"]
  95. # Common.crawler_log().info('视频下载地址:{}'.format(download_url_up))
  96. else:
  97. download_url_up = data["play_info"][0]["play_url"]
  98. # Common.crawler_log().info('视频下载地址:{}'.format(download_url_up))
  99. else:
  100. if len(data["play_info"]["items"]) > 2:
  101. download_url_up = data["play_info"]["items"][2]["play_url"]
  102. # Common.crawler_log().info('视频下载地址:{}'.format(download_url_up))
  103. else:
  104. download_url_up = data["play_info"]["items"][0]["play_url"]
  105. # Common.crawler_log().info('视频下载地址:{}'.format(download_url_up))
  106. # 判断基本规则
  107. if cls.send_time_rule(v_width, v_height, v_duration, v_play_cnt_sendtime) is True \
  108. and download_video_id != "" and download_video_title != "" and v_duration != "" \
  109. and v_play_cnt_sendtime != "" and v_comment_cnt != "" and v_liked_cnt != "" \
  110. and v_shared_cnt != "" and v_width != "" and v_height != "" \
  111. and v_send_date != "" and v_username != "" and v_user_cover != "" \
  112. and v_video_cover != "" and download_url_up != "":
  113. # 满足下载条件:当前时间 - 发布时间 <= 3天,播放量大于1万
  114. if int(time.time()) - int(v_send_date) <= 604800:
  115. if int(v_play_cnt_sendtime) >= 10000:
  116. Common.crawler_log().info("该视频:{}".format(
  117. download_video_title) + " " + "在7天内的播放量{}>=10000".format(v_play_cnt_sendtime))
  118. # 下载封面
  119. Common.download_method("cover", download_video_title, v_video_cover)
  120. # 下载视频
  121. Common.download_method("video", download_video_title, download_url_up)
  122. # 保存视频信息到 "./files/{视频标题}/videoinfo.txt"
  123. with open(r"./videos/" + download_video_title +
  124. "/" + "info.txt", "a", encoding="utf8") as f_a2:
  125. f_a2.write(str(download_video_id) + "\n" +
  126. str(download_video_title) + "\n" +
  127. str(v_duration) + "\n" +
  128. str(v_play_cnt_sendtime) + "\n" +
  129. str(v_comment_cnt) + "\n" +
  130. str(v_liked_cnt) + "\n" +
  131. str(v_shared_cnt) + "\n" +
  132. str(v_resolution) + "\n" +
  133. str(v_send_date) + "\n" +
  134. str(v_username) + "\n" +
  135. str(v_user_cover) + "\n" +
  136. str(download_url_up) + "\n" +
  137. str(v_video_cover) + "\n" +
  138. str(sendtime_session))
  139. # 上传该视频
  140. Common.crawler_log().info("开始上传视频:{}".format(download_video_title))
  141. Publish.upload_and_publish(env, "send_time")
  142. # 保存视频 ID 到云文档:
  143. # https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih?sheet=20ce0c
  144. Common.crawler_log().info("保存视频ID至云文档:{}".format(download_video_title))
  145. # 看一看+ ,视频ID工作表,插入首行
  146. Feishu.insert_columns("20ce0c")
  147. # 看一看+ ,视频ID工作表,首行写入数据
  148. Feishu.update_values("20ce0c", download_video_id, "", "", "",
  149. "", "", "", "", "", "", "", "", "", "", "")
  150. # 从云文档删除该视频信息:https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih?sheet=Y8N3Vl
  151. Common.crawler_log().info("从云文档删除该视频信息:{}".format(download_video_title))
  152. # 删除行或列,可选 ROWS、COLUMNS
  153. Feishu.dimension_range("Y8N3Vl", "ROWS", i + 2, i + 2)
  154. else:
  155. # 从云文档删除该视频信息:https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih?sheet=Y8N3Vl
  156. Common.crawler_log().info("该视频7天播放量:{}<10000".format(
  157. int(v_play_cnt_sendtime)) + ";" + "不满足下载规则:{}".format(download_video_title))
  158. # 删除行或列,可选 ROWS、COLUMNS
  159. Feishu.dimension_range("Y8N3Vl", "ROWS", i + 2, i + 2)
  160. else:
  161. # 从云文档删除该视频信息:https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih?sheet=Y8N3Vl
  162. Common.crawler_log().info("视频发布时间大于7天:{}天".format(
  163. int((int(time.time()) - int(v_send_date)) / 86400))
  164. + ";" + "标题:{}".format(download_video_title))
  165. # 删除行或列,可选 ROWS、COLUMNS
  166. Feishu.dimension_range("Y8N3Vl", "ROWS", i + 2, i + 2)
  167. else:
  168. # 从云文档删除该视频信息:https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih?sheet=Y8N3Vl
  169. Common.crawler_log().info("不满足下载规则:{}".format(download_video_title))
  170. # 删除行或列,可选 ROWS、COLUMNS
  171. Feishu.dimension_range("Y8N3Vl", "ROWS", i + 2, i + 2)
  172. except Exception as e:
  173. Common.crawler_log().error("获取视频info异常:{},删除该视频".format(e))
  174. # 删除行或列,可选 ROWS、COLUMNS
  175. Feishu.dimension_range("Y8N3Vl", "ROWS", i + 2, i + 2)
  176. cls.download_sendtime_video("prod")
  177. if __name__ == "__main__":
  178. download_sendtime = DownloadSendtime()
  179. get_feeds()
  180. download_sendtime.download_sendtime_video("dev")