# -*- coding: utf-8 -*-
# @Author: wangkun
# @Time: 2023/1/31
"""
Feishu sheet helpers: token auth / CRUD / bot alerts
"""
import json
import os
import sys
import requests
import urllib3
sys.path.append(os.getcwd())
from common.common import Common
# from common import Common

proxies = {"http": None, "https": None}


class Feishu:
    """
    Edit Feishu cloud spreadsheets
    """
    # Kanyikan crawler data sheet
    kanyikan_url = "https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih?"
    # Kuaishou crawler data sheet
    kuaishou_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnICEfaw9llDNQkKgdymM1xf?"
    # Weishi crawler data sheet
    weishi_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn5YSWg91JfVGzj0SFZIRRPh?"
    # Xiaoniangao crawler data sheet
    xiaoniangao_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?"
    # Music album
    music_album = "https://w42nne6hzg.feishu.cn/sheets/shtcnT6zvmfsYe1g0iv4pt7855g?"
    # Benshan Zhufu data sheet
    crawler_benshanzhufu = "https://w42nne6hzg.feishu.cn/sheets/shtcnGh2rrsPYM4iVNEBO7OqWrb?"
    # Official-accounts (gzh) crawler sheet
    gzh_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnexNXnpDLHhARw0QdiwbYuA?"
    # Data monitoring sheet
    crawler_monitor = "https://w42nne6hzg.feishu.cn/sheets/shtcnlZWYazInhf7Z60jkbLRJyd?"
    # Weiqun video crawler sheet
    crawler_weiqun_video = "https://w42nne6hzg.feishu.cn/sheets/shtcnoKThNquYRweaylMFVyo9Hc?"
    # Shipinhao (WeChat Channels) crawler sheet
    crawler_shipinhao = 'https://w42nne6hzg.feishu.cn/sheets/shtcn9rOdZRAGFbRkWpn7hqEHGc?'
    # Xigua Video
    crawler_xigua = 'https://w42nne6hzg.feishu.cn/sheets/shtcnvOpx2P8vBXiV91Ot1MKIw8?'
    # Zhihu (PC)
    crawler_zhihu = 'https://w42nne6hzg.feishu.cn/sheets/shtcnkGPBmGsjaqapgzouuj8MXe?'
    # Jixiang Xingfu
    crawler_jixiangxingfu = 'https://w42nne6hzg.feishu.cn/sheets/shtcnSx4nafMbLTq7xl7RHBwHBf?'
    # Zhongmiao Yinxin
    crawler_zmyx = 'https://w42nne6hzg.feishu.cn/sheets/shtcnbZIxstPeM0xshW07b26sve?'
    # Suisui Niannian Ying Fuqi
    crawler_ssnnyfq = 'https://w42nne6hzg.feishu.cn/sheets/shtcnyJmJSJynHDLLbLTkySfvZe?'
    # Zhufumao video
    crawler_zhufumao = 'https://w42nne6hzg.feishu.cn/sheets/shtcnXfIJthvkjhI5zlEJq84i6g?'
    # Religious official accounts
    crawler_zongjiao = 'https://w42nne6hzg.feishu.cn/sheets/shtcn73NW0CyoOeF21HWO15KBsb?'
    # Haokan Video
    crawler_haokan = 'https://w42nne6hzg.feishu.cn/sheets/shtcnaYz8Nhv8q6DbWtlL6rMEBd'
    # Kandao Jiushi Fuqi
    crawler_kandaojiushifuqi = 'https://w42nne6hzg.feishu.cn/sheets/shtcnEokBkIjOUPAk8vbbPKnXgb'
    # Shengsheng Yingyin
    crawler_shengshengyingyin = 'https://w42nne6hzg.feishu.cn/sheets/shtcnz1ymxHL1u8WHblfqfys7qe'
    # Ganggang Douchuan
    crawler_ganggangdouchuan = 'https://w42nne6hzg.feishu.cn/sheets/shtcnTuJgeZU2bc7VaesAqk3QJx'
    # Official account _ Xinxin
    crawler_gongzhonghao = 'https://w42nne6hzg.feishu.cn/sheets/shtcna98M2mX7TbivTj9Sb7WKBN?'
    # YouTube
    crawler_youtube = 'https://w42nne6hzg.feishu.cn/sheets/shtcnrLyr1zbYbhhZyqpN7Xrd5f?'
    # WeChat Index
    weixinzhishu = 'https://w42nne6hzg.feishu.cn/sheets/shtcnqhMRUGunIfGnGXMOBYiy4K?'
    # WeChat Index _ search terms
    weixinzhishu_search_word = 'https://w42nne6hzg.feishu.cn/sheets/shtcnHxCj6dZBYMuK1Q3tIJVlqg?'

    # Feishu spreadsheet tokens
    @classmethod
    def spreadsheettoken(cls, crawler):
        """
        :param crawler: which crawler
        """
        if crawler == "kanyikan":
            return "shtcngRPoDYAi24x52j2nDuHMih"
        elif crawler == "kuaishou":
            return "shtcnICEfaw9llDNQkKgdymM1xf"
        elif crawler == "weishi":
            return "shtcn5YSWg91JfVGzj0SFZIRRPh"
        elif crawler == "xiaoniangao":
            return "shtcnYxiyQ1wLklo1W5Kdqc9cGh"
        elif crawler == "monitor":
            return "shtcnlZWYazInhf7Z60jkbLRJyd"
        elif crawler == "music_album":
            return "shtcnT6zvmfsYe1g0iv4pt7855g"
        elif crawler == "bszf":
            return "shtcnGh2rrsPYM4iVNEBO7OqWrb"
        elif crawler == "gzh":
            return "shtcnexNXnpDLHhARw0QdiwbYuA"
        elif crawler == "weiqun":
            return "shtcnoKThNquYRweaylMFVyo9Hc"
        elif crawler == 'shipinhao':
            return 'shtcn9rOdZRAGFbRkWpn7hqEHGc'
        elif crawler == 'xigua':
            return 'shtcnvOpx2P8vBXiV91Ot1MKIw8'
        elif crawler == 'zhihu':
            return 'shtcnkGPBmGsjaqapgzouuj8MXe'
        elif crawler == 'jxxf':
            return 'shtcnSx4nafMbLTq7xl7RHBwHBf'
        elif crawler == 'zmyx':
            return 'shtcnbZIxstPeM0xshW07b26sve'
        elif crawler == 'ssnnyfq':
            return 'shtcnyJmJSJynHDLLbLTkySfvZe'
        elif crawler == 'zhufumao':
            return 'shtcnXfIJthvkjhI5zlEJq84i6g'
        elif crawler == 'zongjiao':
            return 'shtcn73NW0CyoOeF21HWO15KBsb'
        elif crawler == 'haokan':
            return 'shtcnaYz8Nhv8q6DbWtlL6rMEBd'
        elif crawler == 'kdjsfq':
            return 'shtcnEokBkIjOUPAk8vbbPKnXgb'
        elif crawler == 'ssyy':
            return 'shtcnz1ymxHL1u8WHblfqfys7qe'
        elif crawler == 'ggdc':
            return 'shtcnTuJgeZU2bc7VaesAqk3QJx'
        elif crawler == 'gongzhonghao_xinxin':
            return 'shtcna98M2mX7TbivTj9Sb7WKBN'
        elif crawler == 'youtube':
            return 'shtcnrLyr1zbYbhhZyqpN7Xrd5f'
        elif crawler == 'weixinzhishu':
            return 'shtcnqhMRUGunIfGnGXMOBYiy4K'
        elif crawler == 'weixinzhishu_search_word':
            return 'shtcnHxCj6dZBYMuK1Q3tIJVlqg'

    # Get a Feishu API token
    @classmethod
    def get_token(cls, log_type, crawler):
        """
        Get a Feishu API tenant_access_token
        :return:
        """
        url = "https://open.feishu.cn/open-apis/auth/v3/tenant_access_token/internal/"
        post_data = {"app_id": "cli_a13ad2afa438d00b",  # credentials of the backend account that published the app
                     "app_secret": "4tK9LY9VbiQlY5umhE42dclBFo6t4p5O"}
        try:
            urllib3.disable_warnings()
            response = requests.post(url=url, data=post_data, proxies=proxies, verify=False)
            tenant_access_token = response.json()["tenant_access_token"]
            return tenant_access_token
        except Exception as e:
            Common.logger(log_type, crawler).error("Failed to get Feishu API token: {}", e)
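
    # NOTE (sketch, based on Feishu's open-platform docs, not this repo): a
    # successful token response looks roughly like
    #   {"code": 0, "msg": "ok", "tenant_access_token": "t-...", "expire": 7200}
    # The token expires (~2 hours), so every helper below fetches a fresh one
    # per request instead of caching it.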

    # Get spreadsheet metadata
    @classmethod
    def get_metainfo(cls, log_type, crawler):
        """
        Get spreadsheet metadata
        :return:
        """
        try:
            get_metainfo_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                               + cls.spreadsheettoken(crawler) + "/metainfo"
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type, crawler),
                "Content-Type": "application/json; charset=utf-8"
            }
            params = {
                "extFields": "protectedRange",  # extra fields; extFields=protectedRange returns protected row/column info
                "user_id_type": "open_id"  # type of user id to return: open_id or union_id
            }
            urllib3.disable_warnings()
            r = requests.get(url=get_metainfo_url, headers=headers, params=params, proxies=proxies, verify=False)
            response = json.loads(r.content.decode("utf8"))
            return response
        except Exception as e:
            Common.logger(log_type, crawler).error("Failed to get spreadsheet metadata: {}", e)

    # Read all data from a worksheet
    @classmethod
    def get_values_batch(cls, log_type, crawler, sheetid):
        """
        Read all data from a worksheet
        :param log_type: which log to use
        :param crawler: which crawler
        :param sheetid: which worksheet
        :return: all values
        """
        try:
            get_values_batch_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                                   + cls.spreadsheettoken(crawler) + "/values_batch_get"
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type, crawler),
                "Content-Type": "application/json; charset=utf-8"
            }
            params = {
                # Multiple query ranges, e.g. url?ranges=range1,range2; each range combines a sheetId and a cell range
                "ranges": sheetid,
                # valueRenderOption=ToString returns plain-text values (except numeric types);
                # valueRenderOption=FormattedValue computes and formats the cell;
                # valueRenderOption=Formula returns the formula itself when the cell contains one;
                # valueRenderOption=UnformattedValue computes but does not format the cell
                "valueRenderOption": "ToString",
                # dateTimeRenderOption=FormattedString computes and formats date/time values per their
                # format (numbers are left unformatted) and returns the formatted string.
                "dateTimeRenderOption": "",
                # type of user id to return: open_id or union_id
                "user_id_type": "open_id"
            }
            urllib3.disable_warnings()
            r = requests.get(url=get_values_batch_url, headers=headers, params=params, proxies=proxies, verify=False)
            # print(r.text)
            response = json.loads(r.content.decode("utf8"))
            values = response["data"]["valueRanges"][0]["values"]
            return values
        except Exception as e:
            Common.logger(log_type, crawler).error("Failed to read worksheet values: {}", e)
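
    # NOTE (sketch): the returned "values" is a list of rows, each row itself a
    # list of cell values, e.g. [["title", "link"], ["foo", "https://..."]];
    # empty cells come back as None (get_sheet_content below filters them out).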

    # Insert rows or columns into a worksheet
    @classmethod
    def insert_columns(cls, log_type, crawler, sheetid, majordimension, startindex, endindex):
        """
        Insert rows or columns into a worksheet
        :param log_type: log path
        :param crawler: which crawler's cloud doc
        :param sheetid: which worksheet
        :param majordimension: rows or columns, ROWS / COLUMNS
        :param startindex: start position
        :param endindex: end position
        """
        try:
            insert_columns_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                                 + cls.spreadsheettoken(crawler) + "/insert_dimension_range"
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type, crawler),
                "Content-Type": "application/json; charset=utf-8"
            }
            body = {
                "dimension": {
                    "sheetId": sheetid,
                    "majorDimension": majordimension,  # default ROWS; ROWS or COLUMNS
                    "startIndex": startindex,  # start position
                    "endIndex": endindex  # end position
                },
                "inheritStyle": "AFTER"  # BEFORE or AFTER; omit to not inherit style
            }
            urllib3.disable_warnings()
            r = requests.post(url=insert_columns_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type, crawler).info("Insert rows/columns: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type, crawler).error("Failed to insert rows/columns: {}", e)

    # Write data
    @classmethod
    def update_values(cls, log_type, crawler, sheetid, ranges, values):
        """
        Write data
        :param log_type: log path
        :param crawler: which crawler's cloud doc
        :param sheetid: which worksheet
        :param ranges: cell range
        :param values: the data to write, a list
        """
        try:
            update_values_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                                + cls.spreadsheettoken(crawler) + "/values_batch_update"
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type, crawler),
                "Content-Type": "application/json; charset=utf-8"
            }
            body = {
                "valueRanges": [
                    {
                        "range": sheetid + "!" + ranges,
                        "values": values
                    },
                ],
            }
            urllib3.disable_warnings()
            r = requests.post(url=update_values_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type, crawler).info("Write values: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type, crawler).error("Failed to write values: {}", e)
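
    # Usage sketch (the worksheet id and row content here are hypothetical):
    #   Feishu.update_values("follow", "kanyikan", "SHEETID1", "A2:Z2",
    #                        [["2023/01/31", "video_title", "video_url"]])
    # The request body's "range" then becomes "SHEETID1!A2:Z2", matching the
    # values_batch_update API above.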

    # Merge cells
    @classmethod
    def merge_cells(cls, log_type, crawler, sheetid, ranges):
        """
        Merge cells
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param ranges: cell range to merge
        """
        try:
            merge_cells_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                              + cls.spreadsheettoken(crawler) + "/merge_cells"
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type, crawler),
                "Content-Type": "application/json; charset=utf-8"
            }
            body = {
                "range": sheetid + "!" + ranges,
                "mergeType": "MERGE_ROWS"
            }
            urllib3.disable_warnings()
            r = requests.post(url=merge_cells_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type, crawler).info("Merge cells: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type, crawler).error("Failed to merge cells: {}", e)

    # Read a cell range
    @classmethod
    def get_range_value(cls, log_type, crawler, sheetid, cell):
        """
        Read the content of a cell range
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param cell: which cell(s)
        :return: cell content
        """
        try:
            get_range_value_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                                  + cls.spreadsheettoken(crawler) + "/values/" + sheetid + "!" + cell
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type, crawler),
                "Content-Type": "application/json; charset=utf-8"
            }
            params = {
                # valueRenderOption=ToString returns plain-text values (except numeric types);
                # valueRenderOption=FormattedValue computes and formats the cell;
                # valueRenderOption=Formula returns the formula itself when the cell contains one;
                # valueRenderOption=UnformattedValue computes but does not format the cell.
                "valueRenderOption": "FormattedValue",
                # dateTimeRenderOption=FormattedString computes and formats date/time values per their
                # format (numbers are left unformatted) and returns the formatted string.
                "dateTimeRenderOption": "",
                # type of user id to return: open_id or union_id
                "user_id_type": "open_id"
            }
            urllib3.disable_warnings()
            r = requests.get(url=get_range_value_url, headers=headers, params=params, proxies=proxies, verify=False)
            # print(r.text)
            return r.json()["data"]["valueRange"]["values"][0]
        except Exception as e:
            Common.logger(log_type, crawler).error("Failed to read cell range: {}", e)

    # Get all non-empty cell values of a sheet
    @classmethod
    def get_sheet_content(cls, log_type, crawler, sheet_id):
        try:
            sheet = Feishu.get_values_batch(log_type, crawler, sheet_id)
            content_list = []
            for row in sheet:
                for cell in row:
                    if cell is not None:
                        content_list.append(cell)
            return content_list
        except Exception as e:
            Common.logger(log_type, crawler).error(f'get_sheet_content: {e}\n')

    # Delete rows or columns; ROWS or COLUMNS
    @classmethod
    def dimension_range(cls, log_type, crawler, sheetid, major_dimension, startindex, endindex):
        """
        Delete rows or columns
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: worksheet
        :param major_dimension: default ROWS; ROWS or COLUMNS
        :param startindex: start position
        :param endindex: end position
        :return:
        """
        try:
            dimension_range_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                                  + cls.spreadsheettoken(crawler) + "/dimension_range"
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type, crawler),
                "Content-Type": "application/json; charset=utf-8"
            }
            body = {
                "dimension": {
                    "sheetId": sheetid,
                    "majorDimension": major_dimension,
                    "startIndex": startindex,
                    "endIndex": endindex
                }
            }
            urllib3.disable_warnings()
            r = requests.delete(url=dimension_range_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type, crawler).info("Delete video data: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type, crawler).error("Failed to delete video data: {}", e)
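
    # Usage sketch (hypothetical worksheet id): delete rows 2..4 of a sheet
    #   Feishu.dimension_range("follow", "kanyikan", "SHEETID1", "ROWS", 2, 4)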

    # Get a user's open_id
    @classmethod
    def get_userid(cls, log_type, crawler, username):
        try:
            url = "https://open.feishu.cn/open-apis/user/v1/batch_get_id?"
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type, crawler),
                "Content-Type": "application/json; charset=utf-8"
            }
            # Map internal usernames to the mobile numbers registered with Feishu
            if username == "wangkun":
                username = "13426262515"
            elif username == "gaonannan":
                username = "18501180073"
            elif username == "xinxin":
                username = "15546206651"
            elif username == "huxinxue":
                username = "18832292015"
            elif username == "wuchaoyue":
                username = "15712941385"
            elif username == "muxinyi":
                username = '13699208058'
            data = {"mobiles": [username]}
            urllib3.disable_warnings()
            r = requests.get(url=url, headers=headers, params=data, verify=False, proxies=proxies)
            open_id = r.json()["data"]["mobile_users"][username][0]["open_id"]
            Common.logger(log_type, crawler).info(f"{username}:{open_id}")
            # print(f"{username}:{open_id}")
            return open_id
        except Exception as e:
            Common.logger(log_type, crawler).error(f"get_userid exception: {e}\n")

    # Feishu bot alert
    @classmethod
    def bot(cls, log_type, crawler, text):
        try:
            url = "https://open.feishu.cn/open-apis/bot/v2/hook/96989577-50e7-4653-9ec2-308fe3f2c5fe"
            headers = {'Content-Type': 'application/json'}
            if crawler == "kanyikan":
                content = "看一看爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == "weixinzhishu_out":
                content = "微信指数_站外指数"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnqhMRUGunIfGnGXMOBYiy4K?sheet=YVuVgQ"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "muxinyi")) + "></at>\n"
            elif crawler == "weixinzhishu_inner_sort":
                content = "微信指数_站内短期指数"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnqhMRUGunIfGnGXMOBYiy4K?sheet=DrZHpa"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "muxinyi")) + "></at>\n"
            elif crawler == "weixinzhishu_inner_long":
                content = "微信指数_站内长期指数"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnqhMRUGunIfGnGXMOBYiy4K?sheet=JpgyAv"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "muxinyi")) + "></at>\n"
            elif crawler == "xiaoniangao_hour":
                content = "小年糕_小时级_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?sheet=yatRv2"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == "xiaoniangao_person":
                content = "小年糕_用户主页_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?sheet=Wu0CeL"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == "xiaoniangao_play":
                content = "小年糕_播放量_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?sheet=c85k1C"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == 'xigua':
                content = '西瓜视频_用户主页_已下载表'
                sheet_url = 'https://w42nne6hzg.feishu.cn/sheets/shtcnvOpx2P8vBXiV91Ot1MKIw8?sheet=e075e9'
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "wuchaoyue")) + "></at>\n"
            elif crawler == 'xigua_little_video':
                content = '西瓜视频_小视频_已下载表'
                sheet_url = 'https://w42nne6hzg.feishu.cn/sheets/shtcnvOpx2P8vBXiV91Ot1MKIw8?sheet=hDSDnv'
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "wuchaoyue")) + "></at>\n"
            elif crawler == 'zhihu_hot':
                content = '知乎_热门_已下载表'
                sheet_url = 'https://w42nne6hzg.feishu.cn/sheets/shtcnkGPBmGsjaqapgzouuj8MXe?sheet=8871e3'
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == 'zhihu_follow':
                content = '知乎_定向_已下载表'
                sheet_url = 'https://w42nne6hzg.feishu.cn/sheets/shtcnkGPBmGsjaqapgzouuj8MXe?sheet=4MGuux'
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == 'haokan_hot':
                content = '好看_热榜_已下载表'
                sheet_url = 'https://w42nne6hzg.feishu.cn/sheets/shtcnaYz8Nhv8q6DbWtlL6rMEBd?sheet=5pWipX'
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "wuchaoyue")) + "></at>\n"
            elif crawler == 'haokan_channel':
                content = '好看_频道_已下载表'
                sheet_url = 'https://w42nne6hzg.feishu.cn/sheets/shtcnaYz8Nhv8q6DbWtlL6rMEBd?sheet=7f05d8'
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "wuchaoyue")) + "></at>\n"
            elif crawler == 'haokan_follow':
                content = '好看_定向_已下载表'
                sheet_url = 'https://w42nne6hzg.feishu.cn/sheets/shtcnaYz8Nhv8q6DbWtlL6rMEBd?sheet=kVaSjf'
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "wuchaoyue")) + "></at>\n"
            elif crawler == "music_album":
                content = "音乐相册爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnT6zvmfsYe1g0iv4pt7855g"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == "ssyy":
                content = "胜胜影音爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnz1ymxHL1u8WHblfqfys7qe"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == "ggdc":
                content = "刚刚都传爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnTuJgeZU2bc7VaesAqk3QJx"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == "bszf":
                content = "本山祝福爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnGh2rrsPYM4iVNEBO7OqWrb"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == "jxxf":
                content = "吉祥幸福爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnSx4nafMbLTq7xl7RHBwHBf"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == "zmyx":
                content = "众妙音信爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnbZIxstPeM0xshW07b26sve"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == "zhufumao":
                content = "祝福猫视频爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnXfIJthvkjhI5zlEJq84i6g"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == "kuaishou_follow":
                content = "快手_用户主页_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnICEfaw9llDNQkKgdymM1xf?sheet=fYdA8F"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "xinxin")) + "></at>\n"
            elif crawler == "kuaishou_recommend":
                content = "快手_推荐榜_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnICEfaw9llDNQkKgdymM1xf?sheet=3cd128"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "xinxin")) + "></at>\n"
            elif crawler == "ssnnyfq":
                content = "岁岁年年迎福气_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnyJmJSJynHDLLbLTkySfvZe?sheet=290bae"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "xinxin")) + "></at>\n"
            elif crawler == "kdjsfq":
                content = "看到就是福气_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnEokBkIjOUPAk8vbbPKnXgb?sheet=ad3b6d"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "xinxin")) + "></at>\n"
            elif crawler == "gzh":
                content = "公众号爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnexNXnpDLHhARw0QdiwbYuA"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "huxinxue")) + "></at>\n"
            elif crawler == "gongzhonghao_xinxin":
                content = "公众号_信欣_爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcna98M2mX7TbivTj9Sb7WKBN?"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "xinxin")) + "></at>\n"
            elif crawler == "weiqun":
                content = "微群爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnoKThNquYRweaylMFVyo9Hc"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "xinxin")) + "></at>\n"
            elif crawler == "weishi":
                content = "微视爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn5YSWg91JfVGzj0SFZIRRPh"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "xinxin")) + "></at>\n"
            elif crawler == "shipinhao_recommend":
                content = "视频号_推荐_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn9rOdZRAGFbRkWpn7hqEHGc?sheet=c77cf9"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "wuchaoyue")) + "></at>\n"
            elif crawler == "shipinhao_follow":
                content = "视频号_定向_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn9rOdZRAGFbRkWpn7hqEHGc?sheet=KsVtLe"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "wuchaoyue")) + "></at>\n"
            elif crawler == "youtube":
                content = "youtube_定向_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnrLyr1zbYbhhZyqpN7Xrd5f?sheet=GVxlYk"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "wuchaoyue")) + "></at>\n"
            elif crawler == "zongjiao":
                content = "宗教公众号爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn73NW0CyoOeF21HWO15KBsb"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "huxinxue")) + "></at>\n"
            else:
                content = "小年糕爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at>\n"

            data = json.dumps({
                "msg_type": "interactive",
                "card": {
                    "config": {
                        "wide_screen_mode": True,
                        "enable_forward": True
                    },
                    "elements": [{
                        "tag": "div",
                        "text": {
                            "content": users + text,
                            "tag": "lark_md"
                        }
                    }, {
                        "actions": [{
                            "tag": "button",
                            "text": {
                                "content": content,
                                "tag": "lark_md"
                            },
                            "url": sheet_url,
                            "type": "default",
                            "value": {}
                        }],
                        "tag": "action"
                    }],
                    "header": {
                        "title": {
                            "content": "📣您有新的信息,请注意查收",
                            "tag": "plain_text"
                        }
                    }
                }
            })
            urllib3.disable_warnings()
            r = requests.post(url, headers=headers, data=data, verify=False, proxies=proxies)
            Common.logger(log_type, crawler).info(f'Bot message sent: {r}, {r.json()["StatusMessage"]}')
        except Exception as e:
            Common.logger(log_type, crawler).error(f"bot exception: {e}\n")
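
    # NOTE (assumption): the f-string above expects the legacy webhook response
    # shape {"Extra": null, "StatusCode": 0, "StatusMessage": "success"}; newer
    # bot webhooks reportedly return {"code": 0, "msg": "success"} instead, in
    # which case the KeyError is swallowed by the except clause above.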


if __name__ == "__main__":
    Feishu.bot('follow', 'weixinzhishu_out', 'test:微信指数_站外指数已抓取完毕')
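
    # More usage sketches (commented out; 'SHEETID1' is a hypothetical
    # worksheet id, not one of the real sheets above):
    # print(Feishu.get_token('follow', 'kanyikan'))
    # print(Feishu.get_values_batch('follow', 'kanyikan', 'SHEETID1'))
    # print(Feishu.get_sheet_content('follow', 'kanyikan', 'SHEETID1'))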