xiaoniangao_person_list.py 35 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727
  1. # -*- coding: utf-8 -*-
  2. # @Author: wangkun
  3. # @Time: 2022/7/5
  4. import random
  5. import time
  6. import requests
  7. import urllib3
  8. from main.common import Common
  9. from main.feishu_lib import Feishu
  10. from main.xiaoniangao_publish import Publish
  11. proxies = {"http": None, "https": None}
  12. class Person:
  13. # 小程序关注列表翻页参数
  14. wechat_follow_start_t = None
  15. # 小程序个人主页视频列表翻页参数
  16. wechat_person_start_t = None
  17. # 视频发布时间
  18. send_time = 0
  19. # 配置微信
  20. wechat_sheet = Feishu.get_values_batch("follow", "xiaoniangao", "dzcWHw")
  21. follow_x_mid = wechat_sheet[2][3]
  22. follow_x_token_id = wechat_sheet[3][3]
  23. follow_referer = wechat_sheet[4][3]
  24. follow_uid = wechat_sheet[5][3]
  25. follow_token = wechat_sheet[6][3]
  26. # 过滤敏感词
  27. @classmethod
  28. def sensitive_words(cls, log_type):
  29. # 敏感词库列表
  30. word_list = []
  31. # 从云文档读取所有敏感词,添加到词库列表
  32. lists = Feishu.get_values_batch(log_type, "xiaoniangao", "DRAnZh")
  33. for i in lists:
  34. for j in i:
  35. # 过滤空的单元格内容
  36. if j is None:
  37. pass
  38. else:
  39. word_list.append(j)
  40. return word_list
  41. # 基础门槛规则
  42. @staticmethod
  43. def download_rule(d_duration, d_width, d_height, d_play_cnt, d_share_cnt):
  44. """
  45. 下载视频的基本规则
  46. :param d_duration: 时长
  47. :param d_width: 宽
  48. :param d_height: 高
  49. :param d_play_cnt: 播放量
  50. :param d_share_cnt: 分享量
  51. :return: 满足规则,返回 True;反之,返回 False
  52. """
  53. # 视频时长
  54. if int(float(d_duration)) >= 40:
  55. # 宽或高
  56. if int(d_width) >= 0 or int(d_height) >= 0:
  57. # 播放量
  58. if int(d_play_cnt) >= 500:
  59. # 分享量
  60. if int(d_share_cnt) >= 0:
  61. return True
  62. else:
  63. return False
  64. else:
  65. return False
  66. else:
  67. return False
  68. else:
  69. return False
  70. # # 从小程序中,关注用户列表同步至云文档
  71. # @classmethod
  72. # def get_sub_or_fans_list(cls, log_type):
  73. # try:
  74. # follow_list = []
  75. # follow_sheet = Feishu.get_values_batch(log_type, "xiaoniangao", "oNpThi")
  76. # url = "https://api.xiaoniangao.cn/account/get_sub_or_fans_list"
  77. # headers = {
  78. # "X-Mid": str(cls.follow_x_mid),
  79. # "X-Token-Id": str(cls.follow_x_token_id),
  80. # "content-type": "application/json",
  81. # "uuid": str(cls.follow_uid),
  82. # "Accept-Encoding": "gzip,compress,br,deflate",
  83. # "User-Agent": "Mozilla/5.0 (iPhone; CPU iPhone OS 14_7_1 like Mac OS X)"
  84. # " AppleWebKit/605.1.15 (KHTML, like Gecko) Mobile/15E148 "
  85. # "MicroMessenger/8.0.20(0x18001435) NetType/WIFI Language/zh_CN",
  86. # "Referer": str(cls.follow_referer)
  87. # }
  88. # json_text = {
  89. # "visited_mid": str(cls.follow_x_mid),
  90. # "start_t": cls.wechat_follow_start_t,
  91. # "limit": 20,
  92. # "h_qs": "imageMogr2/gravity/center/rotate/$/thumbnail/!84x84r/crop/84x84/interlace/1/format/jpg",
  93. # "type": 1,
  94. # "token": str(cls.follow_token),
  95. # "uid": str(cls.follow_uid),
  96. # "proj": "ma",
  97. # "wx_ver": "8.0.23",
  98. # "code_ver": "3.68.0",
  99. # "log_common_params": {
  100. # "e": [{
  101. # "data": {
  102. # "page": "followFansPage"
  103. # }
  104. # }],
  105. # "ext": {
  106. # "brand": "iPhone",
  107. # "device": "iPhone 11",
  108. # "os": "iOS 14.7.1",
  109. # "weixinver": "8.0.23",
  110. # "srcver": "2.24.7",
  111. # "net": "wifi",
  112. # "scene": "1089"
  113. # },
  114. # "pj": "1",
  115. # "pf": "2",
  116. # "session_id": "7468cf52-00ea-432e-8505-6ea3ad7ec164"
  117. # }
  118. # }
  119. # r = requests.post(url=url, headers=headers, json=json_text, proxies=proxies, verify=False)
  120. # if "data" not in r.json():
  121. # Common.logger(log_type).warning("从小程序中获取关注用户列表:{}", r.text)
  122. # else:
  123. # users = r.json()["data"]["list"]
  124. # for i in range(len(users)):
  125. # profile_mid = users[i]["mid"]
  126. # nick = users[i]["nick"]
  127. # follow_list.append(profile_mid)
  128. # # 同步已关注的用户至云文档
  129. # if profile_mid not in [j for i in follow_sheet for j in i]:
  130. # Feishu.insert_columns(log_type, "xiaoniangao", "oNpThi", "ROWS", 1, 2)
  131. # time.sleep(1)
  132. # values = [[profile_mid, nick]]
  133. # Feishu.update_values(log_type, "xiaoniangao", "oNpThi", "B2:C2", values)
  134. # else:
  135. # Common.logger(log_type).info("用户:{},在云文档中已存在", nick)
  136. # cls.wechat_follow_start_t = r.json()["data"]["next_t"]
  137. # # 翻页,直至到底了
  138. # if cls.wechat_follow_start_t != 0:
  139. # cls.get_sub_or_fans_list(log_type)
  140. # else:
  141. # Common.logger(log_type).info("从小程序中同步关注用户至云文档完成\n")
  142. # return follow_list
  143. # except Exception as e:
  144. # Common.logger(log_type).error("从小程序中,关注用户列表同步至云文档异常:{}", e)
  145. # 从云文档获取关注用户列表
  146. @classmethod
  147. def get_follow_users(cls, log_type):
  148. try:
  149. follow_sheet = Feishu.get_values_batch(log_type, "xiaoniangao", "oNpThi")
  150. if len(follow_sheet) == 1:
  151. Common.logger(log_type).info("暂无定向爬取账号")
  152. else:
  153. follow_list = []
  154. nick_list = []
  155. for i in range(1, len(follow_sheet)):
  156. profile_mid = follow_sheet[i][1]
  157. nick = follow_sheet[i][2]
  158. nick_list.append(nick)
  159. follow_list.append(profile_mid)
  160. Common.logger(log_type).info("关注用户列表:{}", nick_list)
  161. return follow_list
  162. except Exception as e:
  163. Common.logger(log_type).error("从云文档获取关注用户列表异常:{}", e)
  164. # 从云文档获取取消关注用户列表
  165. @classmethod
  166. def get_unfollow_users(cls, log_type):
  167. try:
  168. unfollow_sheet = Feishu.get_values_batch(log_type, "xiaoniangao", "tuMNhn")
  169. if len(unfollow_sheet) == 1:
  170. Common.logger(log_type).info("暂无定向账号")
  171. return None
  172. else:
  173. unfollow_list = []
  174. nick_list = []
  175. for i in range(1, len(unfollow_sheet)):
  176. profile_mid = unfollow_sheet[i][1]
  177. nick = unfollow_sheet[i][2]
  178. nick_list.append(nick)
  179. unfollow_list.append(profile_mid)
  180. Common.logger(log_type).info("取消关注用户列表:{}", nick_list)
  181. return unfollow_list
  182. except Exception as e:
  183. Common.logger(log_type).error("从云文档获取取消关注用户列表异常:{}", e)
  184. # 关注云文档中的用户
  185. @classmethod
  186. def sub_users(cls, log_type):
  187. try:
  188. profile_mids = cls.get_follow_users(log_type)
  189. for profile_mid in profile_mids:
  190. url = "https://api.xiaoniangao.cn/V1/account/sub_user"
  191. headers = {
  192. "x-b3-traceid": str(cls.follow_x_mid),
  193. "X-Token-Id": str(cls.follow_x_token_id),
  194. "content-type": "application/json",
  195. "uuid": str(cls.follow_uid),
  196. "Accept-Encoding": "gzip,compress,br,deflate",
  197. "User-Agent": "Mozilla/5.0 (iPhone; CPU iPhone OS 14_7_1 like Mac OS X)"
  198. " AppleWebKit/605.1.15 (KHTML, like Gecko) Mobile/15E148 "
  199. "MicroMessenger/8.0.20(0x18001435) NetType/WIFI Language/zh_CN",
  200. "Referer": str(cls.follow_referer)
  201. }
  202. data = {
  203. "visited_mid": int(profile_mid),
  204. "log_common_params": {
  205. "e": [{
  206. "data": {
  207. "page": "profilePage",
  208. "topic": "public",
  209. "type": "follow",
  210. "name": "user",
  211. "smid": str(profile_mid)
  212. },
  213. "ab": {}
  214. }],
  215. "ext": {
  216. "brand": "iPhone",
  217. "device": "iPhone 11",
  218. "os": "iOS 14.7.1",
  219. "weixinver": "8.0.20",
  220. "srcver": "2.24.2",
  221. "net": "wifi",
  222. "scene": "1089"
  223. },
  224. "pj": "1",
  225. "pf": "2",
  226. "session_id": "d53b6125-942b-4ec1-8d22-f9451a35e9f9"
  227. },
  228. "token": str(cls.follow_token),
  229. "uid": str(cls.follow_uid),
  230. "proj": "ma",
  231. "wx_ver": "8.0.20",
  232. "code_ver": "3.62.0"
  233. }
  234. urllib3.disable_warnings()
  235. r = requests.post(headers=headers, url=url, json=data, proxies=proxies, verify=False)
  236. Common.logger(log_type).info("关注用户:{},{}", profile_mid, r)
  237. except Exception as e:
  238. Common.logger(log_type).error("关注云文档中的用户异常:{}", e)
  239. # 取消关注云文档中的用户
  240. @classmethod
  241. def unsub_users(cls, log_type):
  242. try:
  243. unsub_profile_mids = cls.get_unfollow_users(log_type)
  244. if unsub_profile_mids is None:
  245. pass
  246. else:
  247. for profile_mid in unsub_profile_mids:
  248. url = "https://api.xiaoniangao.cn/V1/account/unsub_user"
  249. headers = {
  250. "x-b3-traceid": str(cls.follow_x_mid),
  251. "X-Token-Id": str(cls.follow_x_token_id),
  252. "content-type": "application/json",
  253. "uuid": str(cls.follow_uid),
  254. "Accept-Encoding": "gzip,compress,br,deflate",
  255. "User-Agent": "Mozilla/5.0 (iPhone; CPU iPhone OS 14_7_1 like Mac OS X)"
  256. " AppleWebKit/605.1.15 (KHTML, like Gecko) Mobile/15E148 "
  257. "MicroMessenger/8.0.20(0x18001435) NetType/WIFI Language/zh_CN",
  258. "Referer": str(cls.follow_referer)
  259. }
  260. data = {
  261. "visited_mid": int(profile_mid),
  262. "log_common_params": {
  263. "e": [{
  264. "data": {
  265. "page": "profilePage",
  266. "topic": "public",
  267. "type": "unfollow",
  268. "name": "user",
  269. "smid": str(profile_mid)
  270. },
  271. "ab": {}
  272. }],
  273. "ext": {
  274. "brand": "iPhone",
  275. "device": "iPhone 11",
  276. "os": "iOS 14.7.1",
  277. "weixinver": "8.0.20",
  278. "srcver": "2.24.4",
  279. "net": "wifi",
  280. "scene": "1089"
  281. },
  282. "pj": "1",
  283. "pf": "2",
  284. "session_id": "6a2959c7-3f98-411f-8bc9-8d2a8a5c6f16"
  285. },
  286. "token": str(cls.follow_token),
  287. "uid": str(cls.follow_uid),
  288. "proj": "ma",
  289. "wx_ver": "8.0.20",
  290. "code_ver": "3.64.1"}
  291. urllib3.disable_warnings()
  292. r = requests.post(headers=headers, url=url, json=data, proxies=proxies, verify=False)
  293. Common.logger(log_type).info("取消关注:{},{}", profile_mid, r)
  294. except Exception as e:
  295. Common.logger(log_type).error("取消关注云文档中的用户异常:{}", e)
  296. # 获取个人主页视频
  297. @classmethod
  298. def get_videos_from_person(cls, log_type, p_mid):
  299. try:
  300. url = "https://api.xiaoniangao.cn/profile/list_album"
  301. headers = {
  302. "X-Mid": str(cls.follow_x_mid),
  303. "X-Token-Id": str(cls.follow_x_token_id),
  304. "content-type": "application/json",
  305. "uuid": str(cls.follow_uid),
  306. "Accept-Encoding": "gzip,compress,br,deflate",
  307. "User-Agent": "Mozilla/5.0 (iPhone; CPU iPhone OS 14_7_1 like Mac OS X)"
  308. " AppleWebKit/605.1.15 (KHTML, like Gecko) Mobile/15E148 "
  309. "MicroMessenger/8.0.20(0x18001435) NetType/WIFI Language/zh_CN",
  310. "Referer": str(cls.follow_referer)
  311. }
  312. json_text = {
  313. "visited_mid": p_mid,
  314. "start_t": cls.wechat_person_start_t,
  315. "qs": "imageMogr2/gravity/center/rotate/$/thumbnail/!690x385r/crop/690x385/interlace/1/format/jpg",
  316. "h_qs": "imageMogr2/gravity/center/rotate/$/thumbnail/!120x120r/crop/120x120/interlace/1/format/jpg",
  317. "limit": 20,
  318. "token": str(cls.follow_token),
  319. "uid": str(cls.follow_uid),
  320. "proj": "ma",
  321. "wx_ver": "8.0.23",
  322. "code_ver": "3.68.0",
  323. "log_common_params": {
  324. "e": [{
  325. "data": {
  326. "page": "profilePage",
  327. "topic": "public"
  328. }
  329. }],
  330. "ext": {
  331. "brand": "iPhone",
  332. "device": "iPhone 11",
  333. "os": "iOS 14.7.1",
  334. "weixinver": "8.0.23",
  335. "srcver": "2.24.7",
  336. "net": "wifi",
  337. "scene": "1089"
  338. },
  339. "pj": "1",
  340. "pf": "2",
  341. "session_id": "7468cf52-00ea-432e-8505-6ea3ad7ec164"
  342. }
  343. }
  344. r = requests.post(url=url, headers=headers, json=json_text, proxies=proxies, verify=False)
  345. cls.wechat_person_start_t = r.json()["data"]["next_t"]
  346. feeds = r.json()["data"]["list"]
  347. for i in range(len(feeds)):
  348. # 标题,表情随机加在片头、片尾,或替代句子中间的标点符号
  349. char_sheet = Feishu.get_values_batch("hour", "xiaoniangao", "BhlbST")
  350. expression_list = []
  351. char_list = []
  352. for q in range(len(char_sheet)):
  353. if char_sheet[q][0] is not None:
  354. expression_list.append(char_sheet[q][0])
  355. if char_sheet[q][1] is not None:
  356. char_list.append(char_sheet[q][1])
  357. befor_video_title = feeds[i]["title"].strip().replace("\n", "") \
  358. .replace("/", "").replace("\r", "").replace("#", "") \
  359. .replace(".", "。").replace("\\", "").replace("&NBSP", "") \
  360. .replace(":", "").replace("*", "").replace("?", "") \
  361. .replace("?", "").replace('"', "").replace("<", "") \
  362. .replace(">", "").replace("|", "").replace(" ", "")
  363. expression = random.choice(expression_list)
  364. expression_title_list = [expression + befor_video_title, befor_video_title + expression]
  365. # 标题,表情随机加在片头
  366. title_list1 = random.choice(expression_title_list)
  367. # 标题,表情随机加在片尾
  368. title_list2 = befor_video_title + random.choice(char_list)
  369. # 替代句子中间的标点符号
  370. title_list3 = befor_video_title.replace(
  371. ",", random.choice(expression_list)).replace(",", random.choice(expression_list))
  372. title_list4 = [title_list1, title_list2]
  373. video_title = random.choice(title_list4)
  374. # 用户名
  375. user_name = feeds[i]["album_user"]["nick"].strip().replace("\n", "") \
  376. .replace("/", "").replace("快手", "").replace(" ", "") \
  377. .replace(" ", "").replace("&NBSP", "").replace("\r", "")
  378. # 视频 ID
  379. if "vid" in feeds[i]:
  380. video_id = feeds[i]["vid"]
  381. else:
  382. video_id = 0
  383. # 播放量
  384. if "play_pv" in feeds[i]:
  385. video_play_cnt = feeds[i]["play_pv"]
  386. else:
  387. video_play_cnt = 0
  388. # 点赞
  389. if "total" in feeds[i]["favor"]:
  390. video_like_cnt = feeds[i]["favor"]["total"]
  391. else:
  392. video_like_cnt = 0
  393. # 评论数
  394. if "comment_count" in feeds[i]:
  395. video_comment_cnt = feeds[i]["comment_count"]
  396. else:
  397. video_comment_cnt = 0
  398. # 分享
  399. if "share" in feeds[i]:
  400. video_share_cnt = feeds[i]["share"]
  401. else:
  402. video_share_cnt = 0
  403. # 时长
  404. if "du" in feeds[i]:
  405. video_duration = int(feeds[i]["du"] / 1000)
  406. else:
  407. video_duration = 0
  408. # 发布时间
  409. if "t" in feeds[i]:
  410. video_send_time = feeds[i]["t"]
  411. else:
  412. video_send_time = 0
  413. cls.send_time = video_send_time / 1000
  414. # 宽和高
  415. if "w" in feeds[i] or "h" in feeds[i]:
  416. video_width = feeds[i]["w"]
  417. video_height = feeds[i]["h"]
  418. else:
  419. video_width = 0
  420. video_height = 0
  421. # 头像
  422. if "hurl" in feeds[i]["album_user"]:
  423. head_url = feeds[i]["album_user"]["hurl"]
  424. else:
  425. head_url = 0
  426. # 用户 ID
  427. if "id" in feeds[i]:
  428. profile_id = feeds[i]["id"]
  429. else:
  430. profile_id = 0
  431. # 用户 mid
  432. if "mid" in feeds[i]:
  433. profile_mid = feeds[i]["mid"]
  434. else:
  435. profile_mid = 0
  436. # 封面
  437. if "url" in feeds[i]:
  438. cover_url = feeds[i]["url"]
  439. else:
  440. cover_url = 0
  441. # 视频播放地址
  442. if "v_url" in feeds[i]:
  443. video_url = feeds[i]["v_url"]
  444. else:
  445. video_url = 0
  446. Common.logger(log_type).info("标题:{}", video_title)
  447. Common.logger(log_type).info("视频ID:{}", video_id)
  448. Common.logger(log_type).info("用户名:{}", user_name)
  449. Common.logger(log_type).info("播放量:{}", video_play_cnt)
  450. Common.logger(log_type).info(
  451. "发布时间:{}", time.strftime("%Y/%m/%d %H:%M:%S", time.localtime(int(video_send_time) / 1000)))
  452. Common.logger(log_type).info("播放地址:{}", video_url)
  453. # 过滤无效视频
  454. if video_id == 0 \
  455. or video_title == 0 \
  456. or video_send_time == 0 \
  457. or video_duration == 0 \
  458. or video_url == 0:
  459. Common.logger(log_type).info("无效视频\n")
  460. elif int(time.time()) - int(video_send_time / 1000) >= 259200:
  461. Common.logger(log_type).info("发布时间:{},超过72小时\n", time.strftime(
  462. "%Y/%m/%d %H:%M:%S", time.localtime(int(video_send_time) / 1000)))
  463. cls.wechat_person_start_t = None
  464. break
  465. elif cls.download_rule(video_duration, video_width, video_height, video_play_cnt,
  466. video_share_cnt) is False:
  467. Common.logger(log_type).info("不满足基础门槛\n")
  468. elif any(str(word) if str(word) in video_title else False for word in cls.sensitive_words(log_type)) is True:
  469. Common.logger(log_type).info("视频已中敏感词:{}\n".format(video_title))
  470. # 从云文档去重: 小时级_已下载表
  471. elif video_id in [m for n in Feishu.get_values_batch(log_type, "xiaoniangao", "yatRv2") for m in n]:
  472. Common.logger(log_type).info("该视频已下载:{}\n", video_title)
  473. elif video_id in [m for n in Feishu.get_values_batch(log_type, "xiaoniangao", "InCA1I") for m in n]:
  474. Common.logger(log_type).info("该视频已下载:{}\n", video_title)
  475. elif video_id in [m for n in Feishu.get_values_batch(log_type, "xiaoniangao", "66n2um") for m in n]:
  476. Common.logger(log_type).info("该视频已下载:{}\n", video_title)
  477. # 从云文档去重: 用户主页_已下载表
  478. elif video_id in [m for n in Feishu.get_values_batch(log_type, "xiaoniangao", "Wu0CeL") for m in n]:
  479. Common.logger(log_type).info("该视频已下载:{}\n", video_title)
  480. elif video_id in [m for n in Feishu.get_values_batch(log_type, "xiaoniangao", "bkIrcr") for m in n]:
  481. Common.logger(log_type).info("该视频已下载:{}\n", video_title)
  482. elif video_id in [m for n in Feishu.get_values_batch(log_type, "xiaoniangao", "FcQ4MN") for m in n]:
  483. Common.logger(log_type).info("该视频已下载:{}\n", video_title)
  484. elif video_id in [m for n in Feishu.get_values_batch(log_type, "xiaoniangao", "zI9QJz") for m in n]:
  485. Common.logger(log_type).info("该视频已下载:{}\n", video_title)
  486. # 从云文档去重: 播放量_已下载表
  487. elif video_id in [m for n in Feishu.get_values_batch(log_type, "xiaoniangao", "c85k1C") for m in n]:
  488. Common.logger(log_type).info("该视频已下载:{}\n", video_title)
  489. # 从云文档去重: 用户主页_feeds
  490. elif video_id in [m for n in Feishu.get_values_batch(log_type, "xiaoniangao", "k6ldje") for m in n]:
  491. Common.logger(log_type).info("该视频已在个人主页feeds:{}\n", video_title)
  492. else:
  493. Feishu.insert_columns(log_type, "xiaoniangao", "k6ldje", "ROWS", 1, 2)
  494. # 获取当前时间
  495. get_feeds_time = int(time.time())
  496. # 看一看云文档,工作表中写入数据
  497. values = [[time.strftime("%Y/%m/%d %H:%M:%S", time.localtime(int(get_feeds_time))),
  498. "用户主页",
  499. video_id,
  500. video_title,
  501. video_play_cnt,
  502. video_comment_cnt,
  503. video_like_cnt,
  504. video_share_cnt,
  505. video_duration,
  506. str(video_width) + "*" + str(video_height),
  507. time.strftime(
  508. "%Y/%m/%d %H:%M:%S", time.localtime(int(video_send_time) / 1000)),
  509. user_name,
  510. profile_id,
  511. profile_mid,
  512. head_url,
  513. cover_url,
  514. video_url]]
  515. # 等待 1s,防止操作云文档太频繁,导致报错
  516. time.sleep(1)
  517. Feishu.update_values(log_type, "xiaoniangao", "k6ldje", "F2:V2", values)
  518. Common.logger(log_type).info("添加视频至个人主页_feeds成功:{}\n", video_title)
  519. if int(time.time()) - int(cls.send_time) <= 259200:
  520. cls.get_videos_from_person(log_type, p_mid)
  521. else:
  522. cls.wechat_person_start_t = None
  523. return
  524. except Exception as e:
  525. Common.logger(log_type).error("获取个人主页视频异常:{}", e)
  526. # 获取所有关注列表的用户视频
  527. @classmethod
  528. def get_videos_from_follow(cls, log_type):
  529. try:
  530. # 已关注的用户列表 mids
  531. profile_mids = cls.get_follow_users(log_type)
  532. # Common.logger(log_type).info('profile_mids:{}', profile_mids)
  533. for profile_mid in profile_mids:
  534. Common.logger(log_type).info("获取用户:{}主页视频\n", profile_mid)
  535. cls.get_videos_from_person(log_type, profile_mid)
  536. except Exception as e:
  537. Common.logger(log_type).error("获取个人主页视频异常:{}", e)
  538. # 下载/上传
  539. @classmethod
  540. def download_publish(cls, log_type, env):
  541. try:
  542. person_sheet = Feishu.get_values_batch(log_type, "xiaoniangao", "k6ldje")
  543. for i in range(1, len(person_sheet) + 1):
  544. time.sleep(1)
  545. download_video_id = person_sheet[i][7]
  546. download_video_title = person_sheet[i][8]
  547. download_video_play_cnt = person_sheet[i][9]
  548. download_video_comment_cnt = person_sheet[i][10]
  549. download_video_like_cnt = person_sheet[i][11]
  550. download_video_share_cnt = person_sheet[i][12]
  551. download_video_duration = person_sheet[i][13]
  552. download_video_resolution = person_sheet[i][14]
  553. download_video_send_time = person_sheet[i][15]
  554. download_user_name = person_sheet[i][16]
  555. download_user_id = person_sheet[i][17]
  556. download_user_mid = person_sheet[i][18]
  557. download_head_url = person_sheet[i][19]
  558. download_cover_url = person_sheet[i][20]
  559. download_video_url = person_sheet[i][21]
  560. Common.logger("person").info("正在判断第{}行,视频:{}", i + 1, download_video_title)
  561. # 过滤空行及空标题视频
  562. if download_video_id is None \
  563. or download_video_id == "" \
  564. or download_video_title is None \
  565. or download_video_title == "":
  566. # 删除行或列,可选 ROWS、COLUMNS
  567. Feishu.dimension_range("person", "xiaoniangao", "k6ldje", "ROWS", i + 1, i + 1)
  568. Common.logger("person").warning("标题为空或空行,删除成功\n")
  569. return
  570. # 播放量不小于 2000
  571. elif download_video_play_cnt < 100:
  572. # 删除行或列,可选 ROWS、COLUMNS
  573. Feishu.dimension_range("person", "xiaoniangao", "k6ldje", "ROWS", i + 1, i + 1)
  574. Common.logger("person").info("播放量:{}<2000,删除成功\n", download_video_play_cnt)
  575. return
  576. # 从云文档去重: 小时级_已下载表
  577. elif download_video_id in [j for m in Feishu.get_values_batch("person", "xiaoniangao", "yatRv2") for j in m] \
  578. or download_video_id in [j for m in Feishu.get_values_batch("person", "xiaoniangao", "InCA1I") for j in m]:
  579. # 删除行或列,可选 ROWS、COLUMNS
  580. Feishu.dimension_range("person", "xiaoniangao", "k6ldje", "ROWS", i + 1, i + 1)
  581. Common.logger("person").info("视频已下载:{},删除成功\n", download_video_title)
  582. return
  583. # 从云文档去重: 用户主页_已下载表
  584. elif download_video_id in [j for m in Feishu.get_values_batch("person", "xiaoniangao", "Wu0CeL") for j in m] \
  585. or download_video_id in [j for m in Feishu.get_values_batch("person", "xiaoniangao", "bkIrcr") for j in m]:
  586. # 删除行或列,可选 ROWS、COLUMNS
  587. Feishu.dimension_range("person", "xiaoniangao", "k6ldje", "ROWS", i + 1, i + 1)
  588. Common.logger("person").info("视频已下载:{},删除成功\n", download_video_title)
  589. return
  590. # 从云文档去重: 播放量_已下载表
  591. elif download_video_id in [j for m in Feishu.get_values_batch(
  592. "person", "xiaoniangao", "c85k1C") for j in m]:
  593. # 删除行或列,可选 ROWS、COLUMNS
  594. Feishu.dimension_range("person", "xiaoniangao", "k6ldje", "ROWS", i + 1, i + 1)
  595. Common.logger("person").info("视频已下载:{},删除成功\n", download_video_title)
  596. return
  597. else:
  598. # 下载封面
  599. Common.download_method(log_type="person", text="cover",
  600. d_name=str(download_video_title), d_url=str(download_cover_url))
  601. # 下载视频
  602. Common.download_method(log_type="person", text="video",
  603. d_name=str(download_video_title), d_url=str(download_video_url))
  604. # 保存视频信息至 "./videos/{download_video_title}/info.txt"
  605. with open("./videos/" + download_video_title + "/" + "info.txt",
  606. "a", encoding="UTF-8") as f_a:
  607. f_a.write(str(download_video_id) + "\n" +
  608. str(download_video_title) + "\n" +
  609. str(download_video_duration) + "\n" +
  610. str(download_video_play_cnt) + "\n" +
  611. str(download_video_comment_cnt) + "\n" +
  612. str(download_video_like_cnt) + "\n" +
  613. str(download_video_share_cnt) + "\n" +
  614. str(download_video_resolution) + "\n" +
  615. str(int(time.mktime(
  616. time.strptime(download_video_send_time, "%Y/%m/%d %H:%M:%S")))) + "\n" +
  617. str(download_user_name) + "\n" +
  618. str(download_head_url) + "\n" +
  619. str(download_video_url) + "\n" +
  620. str(download_cover_url) + "\n" +
  621. "xiaoniangao_person")
  622. Common.logger("person").info("==========视频信息已保存至info.txt==========")
  623. # 上传视频
  624. Common.logger("person").info("开始上传视频:{}".format(download_video_title))
  625. our_video_id = Publish.upload_and_publish("person", env, "follow")
  626. our_video_link = "https://admin.piaoquantv.com/cms/post-detail/" + str(our_video_id) + "/info"
  627. Common.logger("person").info("视频上传完成:{}", download_video_title)
  628. # 保存视频: 用户主页_已下载表
  629. Common.logger("person").info("保存视频至用户主页_已下载表:{}", download_video_title)
  630. # 视频ID工作表,插入首行
  631. Feishu.insert_columns("person", "xiaoniangao", "Wu0CeL", "ROWS", 1, 2)
  632. # 视频ID工作表,首行写入数据
  633. upload_time = int(time.time())
  634. values = [[time.strftime("%Y/%m/%d %H:%M:%S", time.localtime(upload_time)),
  635. "用户主页",
  636. str(download_video_id),
  637. str(download_video_title),
  638. our_video_link,
  639. download_video_play_cnt,
  640. download_video_comment_cnt,
  641. download_video_like_cnt,
  642. download_video_share_cnt,
  643. download_video_duration,
  644. str(download_video_resolution),
  645. str(download_video_send_time),
  646. str(download_user_name),
  647. str(download_user_id),
  648. str(download_user_mid),
  649. str(download_head_url),
  650. str(download_cover_url),
  651. str(download_video_url)]]
  652. time.sleep(1)
  653. Feishu.update_values("person", "xiaoniangao", "Wu0CeL", "F2:W2", values)
  654. # 删除行或列,可选 ROWS、COLUMNS
  655. Feishu.dimension_range("person", "xiaoniangao", "k6ldje", "ROWS", i + 1, i + 1)
  656. Common.logger("person").info("视频:{},下载/上传成功\n", download_video_title)
  657. return
  658. except Exception as e:
  659. Common.logger(log_type).error("下载/上传异常:{}", e)
  660. Feishu.dimension_range("person", "xiaoniangao", "k6ldje", "ROWS", 2, 2)
  661. # 执行下载/上传
  662. @classmethod
  663. def run_download_publish(cls, log_type, env):
  664. try:
  665. while True:
  666. person_sheet = Feishu.get_values_batch(log_type, "xiaoniangao", "k6ldje")
  667. if len(person_sheet) == 1:
  668. Common.logger(log_type).info("下载/上传完成")
  669. break
  670. else:
  671. cls.download_publish(log_type, env)
  672. except Exception as e:
  673. Common.logger(log_type).error("执行下载/上传异常:{}", e)
  674. if __name__ == "__main__":
  675. person = Person()
  676. # person.get_videos_from_follow('person')
  677. # word_list = person.sensitive_words('person')
  678. # for word in word_list:
  679. # print(f"{str(word)} ,{type(str(word))}")
  680. pass