# -*- coding: utf-8 -*-
# @Author: wangkun
# @Time: 2023/1/31
"""
Feishu sheet helpers: token auth / create-read-update-delete / bot alerts
"""
import json
import os
import sys

import requests
import urllib3

# Make modules under the current working directory importable before the
# application.* import below.
sys.path.append(os.getcwd())
from application.common.log import Local

proxies = {"http": None, "https": None}


class Feishu:
    """
    Edit Feishu cloud documents (spreadsheets).
    """
    # Kanyikan crawler data sheet
    kanyikan_url = "https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih?"
    # Kuaishou crawler data sheet
    kuaishou_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnICEfaw9llDNQkKgdymM1xf?"
    # Weishi crawler data sheet
    weishi_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn5YSWg91JfVGzj0SFZIRRPh?"
    # Xiaoniangao crawler data sheet
    xiaoniangao_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?"
    # Music album
    music_album = "https://w42nne6hzg.feishu.cn/sheets/shtcnT6zvmfsYe1g0iv4pt7855g?"
    # Benshanzhufu data sheet
    crawler_benshanzhufu = "https://w42nne6hzg.feishu.cn/sheets/shtcnGh2rrsPYM4iVNEBO7OqWrb?"
    # Official-account (gzh) crawler sheet
    gzh_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnexNXnpDLHhARw0QdiwbYuA?"
    # Data-monitoring sheet
    crawler_monitor = "https://w42nne6hzg.feishu.cn/sheets/shtcnlZWYazInhf7Z60jkbLRJyd?"
    # WeChat-group video crawler sheet
    crawler_weiqun_video = "https://w42nne6hzg.feishu.cn/sheets/shtcnoKThNquYRweaylMFVyo9Hc?"
    # Shipinhao (WeChat Channels) crawler sheet
    crawler_shipinhao = "https://w42nne6hzg.feishu.cn/sheets/shtcn9rOdZRAGFbRkWpn7hqEHGc?"
    # Xigua video
    crawler_xigua = "https://w42nne6hzg.feishu.cn/sheets/shtcnvOpx2P8vBXiV91Ot1MKIw8?"
    # Zhihu (PC)
    crawler_zhihu = "https://w42nne6hzg.feishu.cn/sheets/shtcnkGPBmGsjaqapgzouuj8MXe?"
    # Jixiangxingfu
    crawler_jixiangxingfu = "https://w42nne6hzg.feishu.cn/sheets/shtcnSx4nafMbLTq7xl7RHBwHBf?"
    # Fuxiaoshun
    crawler_fuxiaoshun = "https://w42nne6hzg.feishu.cn/sheets/CoXEsl6MDhMaKKt6GUBcvLwsnWb?"
    # Zhongmiaoyinxin
    crawler_zmyx = "https://w42nne6hzg.feishu.cn/sheets/shtcnbZIxstPeM0xshW07b26sve?"
    # Suisuiniannianyingfuqi
    crawler_ssnnyfq = "https://w42nne6hzg.feishu.cn/sheets/shtcnyJmJSJynHDLLbLTkySfvZe?"
    # Zhufumao video
    crawler_zhufumao = "https://w42nne6hzg.feishu.cn/sheets/shtcnXfIJthvkjhI5zlEJq84i6g?"
    # Religious official accounts
    crawler_zongjiao = "https://w42nne6hzg.feishu.cn/sheets/shtcn73NW0CyoOeF21HWO15KBsb?"
    # Haokan video
    crawler_haokan = "https://w42nne6hzg.feishu.cn/sheets/shtcnaYz8Nhv8q6DbWtlL6rMEBd"
    # Kandaojiushifuqi
    crawler_kandaojiushifuqi = "https://w42nne6hzg.feishu.cn/sheets/shtcnEokBkIjOUPAk8vbbPKnXgb"
    # Shengshengyingyin
    crawler_shengshengyingyin = "https://w42nne6hzg.feishu.cn/sheets/shtcnz1ymxHL1u8WHblfqfys7qe"
    # Ganggangdouchuan
    crawler_ganggangdouchuan = "https://w42nne6hzg.feishu.cn/sheets/shtcnTuJgeZU2bc7VaesAqk3QJx"
    # Zhiqingtiantiankan
    crawler_zhiqingtiantiankan = "https://w42nne6hzg.feishu.cn/sheets/shtcnjmhKdJOKdqnEzJcZb5xaHc?"
    # Official account _ Xinxin
    crawler_gongzhonghao = "https://w42nne6hzg.feishu.cn/sheets/shtcna98M2mX7TbivTj9Sb7WKBN?"
    # YouTube
    crawler_youtube = "https://w42nne6hzg.feishu.cn/sheets/shtcnrLyr1zbYbhhZyqpN7Xrd5f?"
    # WeChat Index
    weixinzhishu = "https://w42nne6hzg.feishu.cn/sheets/shtcnqhMRUGunIfGnGXMOBYiy4K?"
    # WeChat Index search terms
    weixinzhishu_search_word = "https://w42nne6hzg.feishu.cn/sheets/shtcnHxCj6dZBYMuK1Q3tIJVlqg?"
    # Haitunzhufu
    crawler_haitunzhufu = "https://w42nne6hzg.feishu.cn/sheets/VbyAsUGq3h9TQ7tG3GpczGjhn1M?"

    # Feishu spreadsheet token (the path segment of each sheet URL)
    @classmethod
    def spreadsheettoken(cls, crawler):
        """
        :param crawler: which crawler
        :return: the spreadsheet token, or None for an unknown crawler
        """
        crawler_tokens = {
            "kanyikan": "shtcngRPoDYAi24x52j2nDuHMih",
            "kuaishou": "shtcnICEfaw9llDNQkKgdymM1xf",
            "weishi": "shtcn5YSWg91JfVGzj0SFZIRRPh",
            "xiaoniangao": "shtcnYxiyQ1wLklo1W5Kdqc9cGh",
            "control": "shtcnlZWYazInhf7Z60jkbLRJyd",
            "music_album": "shtcnT6zvmfsYe1g0iv4pt7855g",
            "benshanzhufu": "shtcnGh2rrsPYM4iVNEBO7OqWrb",
            "gzh": "shtcnexNXnpDLHhARw0QdiwbYuA",
            "weiqun": "shtcnoKThNquYRweaylMFVyo9Hc",
            "shipinhao": "shtcn9rOdZRAGFbRkWpn7hqEHGc",
            "xigua": "shtcnvOpx2P8vBXiV91Ot1MKIw8",
            "zhihu": "shtcnkGPBmGsjaqapgzouuj8MXe",
            "jixiangxingfu": "shtcnSx4nafMbLTq7xl7RHBwHBf",
            "fuxiaoshun": "CoXEsl6MDhMaKKt6GUBcvLwsnWb",
            "zhongmiaoyinxin": "shtcnbZIxstPeM0xshW07b26sve",
            "suisuiniannianyingfuqi": "shtcnyJmJSJynHDLLbLTkySfvZe",
            "zhufumao": "shtcnXfIJthvkjhI5zlEJq84i6g",
            "zongjiao": "shtcn73NW0CyoOeF21HWO15KBsb",
            "haokan": "shtcnaYz8Nhv8q6DbWtlL6rMEBd",
            "kandaojiushifuqi": "shtcnEokBkIjOUPAk8vbbPKnXgb",
            "shengshengyingyin": "shtcnz1ymxHL1u8WHblfqfys7qe",
            "ganggangdouchuan": "shtcnTuJgeZU2bc7VaesAqk3QJx",
            "youtube": "shtcnrLyr1zbYbhhZyqpN7Xrd5f",
            "weixinzhishu": "shtcnqhMRUGunIfGnGXMOBYiy4K",
            "weixinzhishu_search_word": "shtcnHxCj6dZBYMuK1Q3tIJVlqg",
            "gongzhonghao": "shtcna98M2mX7TbivTj9Sb7WKBN",
            "douyin": "shtcnhq63MoXOpqbkuLuoapYIAh",
            "zhiqingtiantiankan": "shtcnjmhKdJOKdqnEzJcZb5xaHc",
            "haitunzhufu": "VbyAsUGq3h9TQ7tG3GpczGjhn1M",
        }
        # Unknown crawler names return None, matching the old if/elif chain.
        return crawler_tokens.get(crawler)
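
    # Usage sketch: map a crawler name to its sheet token, e.g.
    #     Feishu.spreadsheettoken("xigua")  # -> "shtcnvOpx2P8vBXiV91Ot1MKIw8"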

    # Fetch a Feishu API token
    @classmethod
    def get_token(cls, log_type, crawler):
        """
        Fetch a tenant_access_token from the Feishu open API.
        :return: the tenant_access_token string
        """
        url = "https://open.feishu.cn/open-apis/auth/v3/tenant_access_token/internal/"
        post_data = {"app_id": "cli_a13ad2afa438d00b",  # app_id / app_secret of the published Feishu app
                     "app_secret": "4tK9LY9VbiQlY5umhE42dclBFo6t4p5O"}
        try:
            urllib3.disable_warnings()
            response = requests.post(url=url, data=post_data, proxies=proxies, verify=False)
            tenant_access_token = response.json()["tenant_access_token"]
            return tenant_access_token
        except Exception as e:
            Local.logger(log_type, crawler).error("获取飞书 api token 异常:{}", e)
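
    # Usage sketch: tenant_access_token is short-lived (about two hours per the
    # Feishu open API), so every helper below fetches a fresh one per request:
    #     headers = {"Authorization": "Bearer " + Feishu.get_token("recommend", "xigua")}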

    # Fetch spreadsheet metadata
    @classmethod
    def get_metainfo(cls, log_type, crawler):
        """
        Fetch the spreadsheet's metadata.
        :return: the metainfo response dict
        """
        try:
            get_metainfo_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                               + cls.spreadsheettoken(crawler) + "/metainfo"
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type, crawler),
                "Content-Type": "application/json; charset=utf-8"
            }
            params = {
                "extFields": "protectedRange",  # extra fields to return; protectedRange adds protected row/column info
                "user_id_type": "open_id"  # type of user id to return: open_id or union_id
            }
            urllib3.disable_warnings()
            r = requests.get(url=get_metainfo_url, headers=headers, params=params, proxies=proxies, verify=False)
            response = json.loads(r.content.decode("utf8"))
            return response
        except Exception as e:
            Local.logger(log_type, crawler).error("获取表格元数据异常:{}", e)
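
    # Usage sketch: list every worksheet id/title in the Xigua spreadsheet
    # (field names follow the sheets v2 metainfo response):
    #     meta = Feishu.get_metainfo("recommend", "xigua")
    #     for sheet in meta["data"]["sheets"]:
    #         print(sheet["sheetId"], sheet["title"])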

    # Read all data from a worksheet
    @classmethod
    def get_values_batch(cls, log_type, crawler, sheetid):
        """
        Read all data from a worksheet.
        :param log_type: which log to use
        :param crawler: which crawler
        :param sheetid: which worksheet
        :return: all rows of the worksheet
        """
        try:
            get_values_batch_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                                   + cls.spreadsheettoken(crawler) + "/values_batch_get"
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type, crawler),
                "Content-Type": "application/json; charset=utf-8"
            }
            params = {
                # Multiple query ranges, e.g. url?ranges=range1,range2; each range is a sheetId plus an optional cell range
                "ranges": sheetid,
                # valueRenderOption=ToString returns plain-text values (except numeric types);
                # valueRenderOption=FormattedValue computes and formats the cell;
                # valueRenderOption=Formula returns the formula itself if the cell contains one;
                # valueRenderOption=UnformattedValue computes but does not format the cell
                "valueRenderOption": "ToString",
                # dateTimeRenderOption=FormattedString computes and formats dates/times by their cell format
                # (numbers are not formatted) and returns the formatted string
                "dateTimeRenderOption": "",
                # type of user id to return: open_id or union_id
                "user_id_type": "open_id"
            }
            urllib3.disable_warnings()
            r = requests.get(url=get_values_batch_url, headers=headers, params=params, proxies=proxies, verify=False)
            response = json.loads(r.content.decode("utf8"))
            values = response["data"]["valueRanges"][0]["values"]
            return values
        except Exception as e:
            Local.logger(log_type, crawler).error("读取工作表所有数据异常:{}", e)
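
    # Usage sketch: read every row of the Xigua "recommend" worksheet
    # (the worksheet id "ZzsClu" comes from the bot() mapping below):
    #     for row in Feishu.get_values_batch("recommend", "xigua", "ZzsClu"):
    #         print(row)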

    # Insert rows or columns into a worksheet
    @classmethod
    def insert_columns(cls, log_type, crawler, sheetid, majordimension, startindex, endindex):
        """
        Insert rows or columns into a worksheet.
        :param log_type: log path
        :param crawler: which crawler's cloud document
        :param sheetid: which worksheet
        :param majordimension: rows or columns, ROWS / COLUMNS
        :param startindex: start position
        :param endindex: end position
        """
        try:
            insert_columns_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                                 + cls.spreadsheettoken(crawler) + "/insert_dimension_range"
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type, crawler),
                "Content-Type": "application/json; charset=utf-8"
            }
            body = {
                "dimension": {
                    "sheetId": sheetid,
                    "majorDimension": majordimension,  # defaults to ROWS; ROWS or COLUMNS
                    "startIndex": startindex,  # start position
                    "endIndex": endindex  # end position
                },
                "inheritStyle": "AFTER"  # BEFORE or AFTER; omit to not inherit style
            }
            urllib3.disable_warnings()
            r = requests.post(url=insert_columns_url, headers=headers, json=body, proxies=proxies, verify=False)
            Local.logger(log_type, crawler).info("插入行或列:{}", r.json()["msg"])
        except Exception as e:
            Local.logger(log_type, crawler).error("插入行或列异常:{}", e)
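
    # Usage sketch (indices per the insert_dimension_range API): insert one
    # blank row between row 1 (the header) and the old row 2:
    #     Feishu.insert_columns("recommend", "xigua", "ZzsClu", "ROWS", 1, 2)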

    # Write data
    @classmethod
    def update_values(cls, log_type, crawler, sheetid, ranges, values):
        """
        Write data into a worksheet.
        :param log_type: log path
        :param crawler: which crawler's cloud document
        :param sheetid: which worksheet
        :param ranges: cell range
        :param values: the data to write (a list of rows)
        """
        try:
            update_values_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                                + cls.spreadsheettoken(crawler) + "/values_batch_update"
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type, crawler),
                "Content-Type": "application/json; charset=utf-8"
            }
            body = {
                "valueRanges": [
                    {
                        "range": sheetid + "!" + ranges,
                        "values": values
                    },
                ],
            }
            urllib3.disable_warnings()
            r = requests.post(url=update_values_url, headers=headers, json=body, proxies=proxies, verify=False)
            Local.logger(log_type, crawler).info("写入数据:{}", r.json()["msg"])
        except Exception as e:
            Local.logger(log_type, crawler).error("写入数据异常:{}", e)
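
    # Usage sketch: write one row into A2:C2; values is a list of rows, each
    # row a list of cells (column names here are hypothetical):
    #     Feishu.update_values("recommend", "xigua", "ZzsClu", "A2:C2",
    #                          [["video_title", "video_url", "duration"]])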

    # Merge cells
    @classmethod
    def merge_cells(cls, log_type, crawler, sheetid, ranges):
        """
        Merge cells.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param ranges: the cell range to merge
        """
        try:
            merge_cells_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                              + cls.spreadsheettoken(crawler) + "/merge_cells"
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type, crawler),
                "Content-Type": "application/json; charset=utf-8"
            }
            body = {
                "range": sheetid + "!" + ranges,
                "mergeType": "MERGE_ROWS"
            }
            urllib3.disable_warnings()
            r = requests.post(url=merge_cells_url, headers=headers, json=body, proxies=proxies, verify=False)
            Local.logger(log_type, crawler).info("合并单元格:{}", r.json()["msg"])
        except Exception as e:
            Local.logger(log_type, crawler).error("合并单元格异常:{}", e)
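
    # Usage sketch: merge the cells of A2:C2 into one (the method always sends
    # mergeType MERGE_ROWS, i.e. cells are merged within each row of the range):
    #     Feishu.merge_cells("recommend", "xigua", "ZzsClu", "A2:C2")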

    # Read cell data
    @classmethod
    def get_range_value(cls, log_type, crawler, sheetid, cell):
        """
        Read the contents of a cell range.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param cell: which cell range
        :return: the cell contents
        """
        try:
            get_range_value_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                                  + cls.spreadsheettoken(crawler) + "/values/" + sheetid + "!" + cell
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type, crawler),
                "Content-Type": "application/json; charset=utf-8"
            }
            params = {
                # valueRenderOption=ToString returns plain-text values (except numeric types);
                # valueRenderOption=FormattedValue computes and formats the cell;
                # valueRenderOption=Formula returns the formula itself if the cell contains one;
                # valueRenderOption=UnformattedValue computes but does not format the cell.
                "valueRenderOption": "FormattedValue",
                # dateTimeRenderOption=FormattedString computes and formats dates/times by their cell format
                # (numbers are not formatted) and returns the formatted string.
                "dateTimeRenderOption": "",
                # type of user id to return: open_id or union_id
                "user_id_type": "open_id"
            }
            urllib3.disable_warnings()
            r = requests.get(url=get_range_value_url, headers=headers, params=params, proxies=proxies, verify=False)
            return r.json()["data"]["valueRange"]["values"][0]
        except Exception as e:
            Local.logger(log_type, crawler).error("读取单元格数据异常:{}", e)
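
    # Usage sketch: read a single block of cells; the method returns the first
    # row of the range, so a one-row range yields a flat list of cell values:
    #     cells = Feishu.get_range_value("recommend", "xigua", "ZzsClu", "A2:C2")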

    # Get a worksheet's content as a flat list
    @classmethod
    def get_sheet_content(cls, log_type, crawler, sheet_id):
        try:
            sheet = Feishu.get_values_batch(log_type, crawler, sheet_id)
            content_list = []
            for row in sheet:
                for cell in row:
                    if cell is not None:
                        content_list.append(cell)
            return content_list
        except Exception as e:
            Local.logger(log_type, crawler).error(f"get_sheet_content:{e}\n")
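
    # Usage sketch: flatten every non-empty cell of a worksheet into one list,
    # e.g. to load a keyword list kept in a sheet:
    #     words = Feishu.get_sheet_content("recommend", "xigua", "ZzsClu")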

    # Delete rows or columns (ROWS or COLUMNS)
    @classmethod
    def dimension_range(cls, log_type, crawler, sheetid, major_dimension, startindex, endindex):
        """
        Delete rows or columns.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param major_dimension: ROWS (default) or COLUMNS
        :param startindex: start position
        :param endindex: end position
        :return:
        """
        try:
            dimension_range_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                                  + cls.spreadsheettoken(crawler) + "/dimension_range"
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type, crawler),
                "Content-Type": "application/json; charset=utf-8"
            }
            body = {
                "dimension": {
                    "sheetId": sheetid,
                    "majorDimension": major_dimension,
                    "startIndex": startindex,
                    "endIndex": endindex
                }
            }
            urllib3.disable_warnings()
            r = requests.delete(url=dimension_range_url, headers=headers, json=body, proxies=proxies, verify=False)
            Local.logger(log_type, crawler).info("删除视频数据:{}", r.json()["msg"])
        except Exception as e:
            Local.logger(log_type, crawler).error("删除视频数据异常:{}", e)
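
    # Usage sketch: drop rows 2-3 after processing them (indices mirror how
    # insert_columns addresses positions):
    #     Feishu.dimension_range("recommend", "xigua", "ZzsClu", "ROWS", 2, 3)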

    # Get a user's open_id
    @classmethod
    def get_userid(cls, log_type, crawler, username):
        try:
            url = "https://open.feishu.cn/open-apis/user/v1/batch_get_id?"
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type, crawler),
                "Content-Type": "application/json; charset=utf-8"
            }
            name_phone_dict = {
                "xinxin": "15546206651",
                "muxinyi": "13699208058",
                "wangxueke": "13513479926",
                "yuzhuoyi": "18624010360",
                "luojunhui": "18801281360",
                "fanjun": "15200827642",
                "zhangyong": "17600025055"
            }
            # NOTE: bot() also @-mentions names such as "wangkun", "gaonannan",
            # "wuchaoyue" and "huxinxue" that are missing from this map; those
            # lookups fall through to the except branch below and return None.
            username = name_phone_dict.get(username)
            data = {"mobiles": [username]}
            urllib3.disable_warnings()
            r = requests.get(url=url, headers=headers, params=data, verify=False, proxies=proxies)
            open_id = r.json()["data"]["mobile_users"][username][0]["open_id"]
            return open_id
        except Exception as e:
            Local.logger(log_type, crawler).error(f"get_userid异常:{e}\n")
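
    # Usage sketch: resolve a teammate's open_id for the @-mentions used in bot():
    #     open_id = Feishu.get_userid("bot", "xigua", "luojunhui")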

    # Feishu bot alert
    @classmethod
    def bot(cls, log_type, crawler, text):
        try:
            url = "https://open.feishu.cn/open-apis/bot/v2/hook/96989577-50e7-4653-9ec2-308fe3f2c5fe"
            headers = {"Content-Type": "application/json"}
            if crawler == "kanyikan":
                content = "看一看爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == "xiaoniangao_hour":
                content = "小年糕_小时级_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?sheet=yatRv2"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "luojunhui")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "zhangyong")) + "></at>\n"
            elif crawler == "xiaoniangao_person":
                content = "小年糕_用户主页_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?sheet=Wu0CeL"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "luojunhui")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "zhangyong")) + "></at>\n"
            elif crawler == "xiaoniangao_play":
                content = "小年糕_播放量_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?sheet=c85k1C"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "luojunhui")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "zhangyong")) + "></at>\n"
            elif crawler == "xigua" and log_type == "recommend":
                content = "西瓜视频_推荐_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnvOpx2P8vBXiV91Ot1MKIw8?sheet=ZzsClu"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "luojunhui")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "wangxueke")) + "></at>\n"
            elif crawler == "zhihu_hot":
                content = "知乎_热门_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnkGPBmGsjaqapgzouuj8MXe?sheet=8871e3"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == "zhihu_follow":
                content = "知乎_定向_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnkGPBmGsjaqapgzouuj8MXe?sheet=4MGuux"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == "haokan_hot":
                content = "好看_热榜_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnaYz8Nhv8q6DbWtlL6rMEBd?sheet=5pWipX"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "wuchaoyue")) + "></at>\n"
            elif crawler == "haokan_channel":
                content = "好看_频道_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnaYz8Nhv8q6DbWtlL6rMEBd?sheet=7f05d8"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "wuchaoyue")) + "></at>\n"
            elif crawler == "haokan_follow":
                content = "好看_定向_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnaYz8Nhv8q6DbWtlL6rMEBd?sheet=kVaSjf"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "wuchaoyue")) + "></at>\n"
            elif crawler == "music_album":
                content = "音乐相册爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnT6zvmfsYe1g0iv4pt7855g"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == "ssyy":
                content = "胜胜影音爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnz1ymxHL1u8WHblfqfys7qe"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == "ggdc":
                content = "刚刚都传爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnTuJgeZU2bc7VaesAqk3QJx"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "luojunhui")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "zhangyong")) + "></at>\n"
            elif crawler == "bszf":
                content = "本山祝福爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnGh2rrsPYM4iVNEBO7OqWrb"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "luojunhui")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "zhangyong")) + "></at>\n"
            elif crawler == "jxxf":
                content = "吉祥幸福爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnSx4nafMbLTq7xl7RHBwHBf"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "luojunhui")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "zhangyong")) + "></at>\n"
            elif crawler == "zmyx":
                content = "众妙音信爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnbZIxstPeM0xshW07b26sve"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "luojunhui")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "zhangyong")) + "></at>\n"
            elif crawler == "zhufumao":
                content = "祝福猫视频爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnXfIJthvkjhI5zlEJq84i6g"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "gaonannan")) + "></at>\n"
            elif crawler == "kuaishou_follow":
                content = "快手_用户主页_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnICEfaw9llDNQkKgdymM1xf?sheet=fYdA8F"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "xinxin")) + "></at>\n"
            elif crawler == "kuaishou_recommend":
                content = "快手_推荐榜_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnICEfaw9llDNQkKgdymM1xf?sheet=3cd128"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "xinxin")) + "></at>\n"
            elif crawler == "ssnnyfq":
                content = "岁岁年年迎福气_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnyJmJSJynHDLLbLTkySfvZe?sheet=290bae"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "luojunhui")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "xinxin")) + "></at>\n"
            elif crawler == "kdjsfq":
                content = "看到就是福气_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnEokBkIjOUPAk8vbbPKnXgb?sheet=ad3b6d"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "xinxin")) + "></at>\n"
            elif crawler == "gzh":
                content = "公众号爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnexNXnpDLHhARw0QdiwbYuA"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "huxinxue")) + "></at>\n"
            elif crawler == "gongzhonghao":
                content = "公众号_信欣_爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcna98M2mX7TbivTj9Sb7WKBN?"
                users = f"\n<at id={str(cls.get_userid(log_type, crawler, 'fanjun'))}></at> <at id={str(cls.get_userid(log_type, crawler, 'wangxueke'))}></at> <at id={str(cls.get_userid(log_type, crawler, 'luojunhui'))}></at>\n"
            elif crawler == "weiqun":
                content = "微群爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnoKThNquYRweaylMFVyo9Hc"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "xinxin")) + "></at>\n"
            elif crawler == "weishi":
                content = "微视爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn5YSWg91JfVGzj0SFZIRRPh"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "xinxin")) + "></at>\n"
            elif crawler == "shipinhao_recommend":
                content = "视频号_推荐_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn9rOdZRAGFbRkWpn7hqEHGc?sheet=c77cf9"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "wuchaoyue")) + "></at>\n"
            elif crawler == "shipinhao_follow":
                content = "视频号_定向_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn9rOdZRAGFbRkWpn7hqEHGc?sheet=KsVtLe"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "wuchaoyue")) + "></at>\n"
            elif crawler == "youtube":
                content = "youtube_定向_已下载表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnrLyr1zbYbhhZyqpN7Xrd5f?sheet=GVxlYk"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "wuchaoyue")) + "></at>\n"
            elif crawler == "zongjiao":
                content = "宗教公众号爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn73NW0CyoOeF21HWO15KBsb"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at> <at id=" + str(
                    cls.get_userid(log_type, crawler, "huxinxue")) + "></at>\n"
            else:
                content = "小年糕爬虫表"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh"
                users = "\n<at id=" + str(cls.get_userid(log_type, crawler, "wangkun")) + "></at>\n"
            data = json.dumps({
                "msg_type": "interactive",
                "card": {
                    "config": {
                        "wide_screen_mode": True,
                        "enable_forward": True
                    },
                    "elements": [{
                        "tag": "div",
                        "text": {
                            "content": users + text,
                            "tag": "lark_md"
                        }
                    }, {
                        "actions": [{
                            "tag": "button",
                            "text": {
                                "content": content,
                                "tag": "lark_md"
                            },
                            "url": sheet_url,
                            "type": "default",
                            "value": {}
                        }],
                        "tag": "action"
                    }],
                    "header": {
                        "title": {
                            "content": "📣您有新的信息,请注意查收",
                            "tag": "plain_text"
                        }
                    }
                }
            })
            urllib3.disable_warnings()
            r = requests.post(url, headers=headers, data=data, verify=False, proxies=proxies)
            Local.logger(log_type, crawler).info(f"触发机器人消息:{r.status_code}, {text}")
        except Exception as e:
            Local.logger(log_type, crawler).error(f"bot异常:{e}\n")


if __name__ == "__main__":
    Feishu.bot("recommend", "xigua", "测试: 西瓜推荐,登录失效")
    # print(Feishu.get_userid('bot', 'weixinzhishu', 'wangkun'))
    # print(Feishu.get_userid('bot', 'weixinzhishu', 'yuzhuoyi'))