feishu_lib.py

# -*- coding: utf-8 -*-
# @Author: wangkun
# @Time: 2022/8/9
import json

import requests
import urllib3

from main.common import Common

proxies = {"http": None, "https": None}


class Feishu:
    """
    Edit Feishu cloud spreadsheets
    """
    # Kanyikan crawler data sheet
    kanyikan_url = "https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih?"
    # Kuaishou crawler data sheet
    kuaishou_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnICEfaw9llDNQkKgdymM1xf?"
    # Weishi crawler data sheet
    weishi_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn5YSWg91JfVGzj0SFZIRRPh?"
    # Xiaoniangao crawler data sheet
    xiaoniangao_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?"
    # Music album sheet
    music_album = "https://w42nne6hzg.feishu.cn/sheets/shtcnT6zvmfsYe1g0iv4pt7855g?"
    # Benshanzhufu data sheet
    crawler_benshanzhufu = "https://w42nne6hzg.feishu.cn/sheets/shtcnGh2rrsPYM4iVNEBO7OqWrb?"
    # Official-account (gzh) crawler sheet
    gzh_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnexNXnpDLHhARw0QdiwbYuA?"
    # Data-monitoring sheet
    crawler_monitor = "https://w42nne6hzg.feishu.cn/sheets/shtcnlZWYazInhf7Z60jkbLRJyd?"
    # Weiqun video crawler sheet
    crawler_weiqun_video = "https://w42nne6hzg.feishu.cn/sheets/shtcnoKThNquYRweaylMFVyo9Hc?"
    # Shipinhao crawler sheet
    crawler_shipinhao = "https://w42nne6hzg.feishu.cn/sheets/shtcn9rOdZRAGFbRkWpn7hqEHGc?"

    # Phone numbers (used to look up Feishu open_ids)
    wangkun = "13426262515"
    gaonannan = "18501180073"
    xinxin = "15546206651"
    huxinxue = "18832292015"

    # Feishu spreadsheet tokens
    @classmethod
    def spreadsheettoken(cls, crawler):
        """
        :param crawler: which crawler
        :return: the spreadsheet token for that crawler (None for unknown names)
        """
        if crawler == "kanyikan":
            return "shtcngRPoDYAi24x52j2nDuHMih"
        elif crawler == "kuaishou":
            return "shtcnICEfaw9llDNQkKgdymM1xf"
        elif crawler == "weishi":
            return "shtcn5YSWg91JfVGzj0SFZIRRPh"
        elif crawler == "xiaoniangao":
            return "shtcnYxiyQ1wLklo1W5Kdqc9cGh"
        elif crawler == "monitor":
            return "shtcnlZWYazInhf7Z60jkbLRJyd"
        elif crawler == "music_album":
            return "shtcnT6zvmfsYe1g0iv4pt7855g"
        elif crawler == "bszf":
            return "shtcnGh2rrsPYM4iVNEBO7OqWrb"
        elif crawler == "gzh":
            return "shtcnexNXnpDLHhARw0QdiwbYuA"
        elif crawler == "weiqun":
            return "shtcnoKThNquYRweaylMFVyo9Hc"
        elif crawler == "shipinhao":
            return "shtcn9rOdZRAGFbRkWpn7hqEHGc"
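
    # Usage sketch (illustrative; not called anywhere in this file). An
    # unrecognized name falls through every branch and returns None:
    #   token = Feishu.spreadsheettoken("kuaishou")  # "shtcnICEfaw9llDNQkKgdymM1xf"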

    # Get a Feishu API token
    @classmethod
    def get_token(cls, log_type):
        """
        Get a Feishu API tenant_access_token
        :return:
        """
        url = "https://open.feishu.cn/open-apis/auth/v3/tenant_access_token/internal/"
        post_data = {"app_id": "cli_a13ad2afa438d00b",  # credentials of the published app's backend account
                     "app_secret": "4tK9LY9VbiQlY5umhE42dclBFo6t4p5O"}
        try:
            urllib3.disable_warnings()
            response = requests.post(url=url, data=post_data, proxies=proxies, verify=False)
            tenant_access_token = response.json()["tenant_access_token"]
            return tenant_access_token
        except Exception as e:
            Common.logger(log_type).error("Failed to get Feishu API token: {}", e)
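
    # Every request below builds its auth header from this token; a minimal
    # sketch (the "demo" log_type is illustrative):
    #   headers = {
    #       "Authorization": "Bearer " + Feishu.get_token("demo"),
    #       "Content-Type": "application/json; charset=utf-8"
    #   }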

    # Get spreadsheet metadata
    @classmethod
    def get_metainfo(cls, log_type, crawler):
        """
        Get spreadsheet metadata
        :return:
        """
        get_metainfo_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                           + cls.spreadsheettoken(crawler) + "/metainfo"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            "extFields": "protectedRange",  # extra fields to return; protectedRange returns row/column protection info
            "user_id_type": "open_id"  # type of user id to return: open_id or union_id
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_metainfo_url, headers=headers, params=params, proxies=proxies, verify=False)
            response = json.loads(r.content.decode("utf8"))
            return response
        except Exception as e:
            Common.logger(log_type).error("Failed to get spreadsheet metadata: {}", e)
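
    # Usage sketch, assuming the v2 metainfo response carries a
    # data.sheets[] list with sheetId/title fields (verify against the
    # Feishu docs; log_type "demo" is illustrative):
    #   meta = Feishu.get_metainfo("demo", "kanyikan")
    #   for sheet in meta["data"]["sheets"]:
    #       print(sheet["sheetId"], sheet["title"])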

    # Read all data from a worksheet
    @classmethod
    def get_values_batch(cls, log_type, crawler, sheetid):
        """
        Read all data from a worksheet
        :param log_type: which log to write to
        :param crawler: which crawler's spreadsheet
        :param sheetid: which worksheet
        :return: all rows
        """
        get_values_batch_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                               + cls.spreadsheettoken(crawler) + "/values_batch_get"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            # Multiple ranges, e.g. url?ranges=range1,range2; each range combines a sheetId and a cell range
            "ranges": sheetid,
            # valueRenderOption=ToString returns plain-text values (except numeric types);
            # valueRenderOption=FormattedValue computes and formats the cell;
            # valueRenderOption=Formula returns the formula itself if the cell contains one;
            # valueRenderOption=UnformattedValue computes but does not format the cell
            "valueRenderOption": "ToString",
            # dateTimeRenderOption=FormattedString computes and formats dates/times per their format
            # (numbers are not formatted) and returns the formatted string
            "dateTimeRenderOption": "",
            # type of user id to return: open_id or union_id
            "user_id_type": "open_id"
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_values_batch_url, headers=headers, params=params, proxies=proxies, verify=False)
            # print(r.text)
            response = json.loads(r.content.decode("utf8"))
            values = response["data"]["valueRanges"][0]["values"]
            return values
        except Exception as e:
            Common.logger(log_type).error("Failed to read worksheet data: {}", e)
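
    # Usage sketch ("yatRv2" is the Xiaoniangao hourly tab id seen in the
    # bot() URLs below; assuming the first row is a header):
    #   rows = Feishu.get_values_batch("demo", "xiaoniangao", "yatRv2")
    #   for row in rows[1:]:
    #       print(row)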

    # Insert rows or columns into a worksheet
    @classmethod
    def insert_columns(cls, log_type, crawler, sheetid, majordimension, startindex, endindex):
        """
        Insert rows or columns into a worksheet
        :param log_type: which log to write to
        :param crawler: which crawler's spreadsheet
        :param sheetid: which worksheet
        :param majordimension: ROWS or COLUMNS
        :param startindex: start position
        :param endindex: end position
        """
        insert_columns_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                             + cls.spreadsheettoken(crawler) + "/insert_dimension_range"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "dimension": {
                "sheetId": sheetid,
                "majorDimension": majordimension,  # default ROWS; ROWS or COLUMNS
                "startIndex": startindex,  # start position
                "endIndex": endindex  # end position
            },
            "inheritStyle": "AFTER"  # BEFORE or AFTER; omit to not inherit style
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=insert_columns_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Insert rows/columns: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to insert rows/columns: {}", e)
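
    # Usage sketch, assuming the endpoint inserts endIndex - startIndex new
    # rows after row startIndex (verify against the Feishu docs); tab id and
    # log_type are illustrative:
    #   Feishu.insert_columns("demo", "xiaoniangao", "yatRv2", "ROWS", 1, 2)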

    # Write data
    @classmethod
    def update_values(cls, log_type, crawler, sheetid, ranges, values):
        """
        Write data
        :param log_type: which log to write to
        :param crawler: which crawler's spreadsheet
        :param sheetid: which worksheet
        :param ranges: cell range
        :param values: the data to write, as a list
        """
        update_values_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                            + cls.spreadsheettoken(crawler) + "/values_batch_update"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "valueRanges": [
                {
                    "range": sheetid + "!" + ranges,
                    "values": values
                },
            ],
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=update_values_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Write data: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to write data: {}", e)
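
    # Usage sketch: values is a list of rows, each itself a list of cells,
    # and its shape should match ranges (the cell values here are
    # illustrative):
    #   Feishu.update_values("demo", "xiaoniangao", "yatRv2", "A2:B2",
    #                        [["video_title", "video_url"]])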

    # Merge cells
    @classmethod
    def merge_cells(cls, log_type, crawler, sheetid, ranges):
        """
        Merge cells
        :param log_type: which log to write to
        :param crawler: which crawler's spreadsheet
        :param sheetid: which worksheet
        :param ranges: the cell range to merge
        """
        merge_cells_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                          + cls.spreadsheettoken(crawler) + "/merge_cells"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "range": sheetid + "!" + ranges,
            "mergeType": "MERGE_ROWS"
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=merge_cells_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Merge cells: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to merge cells: {}", e)
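
    # Usage sketch; note mergeType is hard-coded to MERGE_ROWS above, which
    # (per the Feishu API) merges the range row by row rather than into a
    # single cell:
    #   Feishu.merge_cells("demo", "xiaoniangao", "yatRv2", "A1:C1")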

    # Read cell data
    @classmethod
    def get_range_value(cls, log_type, crawler, sheetid, cell):
        """
        Read the contents of a cell
        :param log_type: which log to write to
        :param crawler: which crawler's spreadsheet
        :param sheetid: which worksheet
        :param cell: which cell
        :return: cell contents
        """
        get_range_value_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                              + cls.spreadsheettoken(crawler) + "/values/" + sheetid + "!" + cell
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            # valueRenderOption=ToString returns plain-text values (except numeric types);
            # valueRenderOption=FormattedValue computes and formats the cell;
            # valueRenderOption=Formula returns the formula itself if the cell contains one;
            # valueRenderOption=UnformattedValue computes but does not format the cell.
            "valueRenderOption": "FormattedValue",
            # dateTimeRenderOption=FormattedString computes and formats dates/times per their format
            # (numbers are not formatted) and returns the formatted string.
            "dateTimeRenderOption": "",
            # type of user id to return: open_id or union_id
            "user_id_type": "open_id"
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_range_value_url, headers=headers, params=params, proxies=proxies, verify=False)
            # print(r.text)
            return r.json()["data"]["valueRange"]["values"][0]
        except Exception as e:
            Common.logger(log_type).error("Failed to read cell data: {}", e)
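
    # Usage sketch: the method returns the first row of the range
    # (values[0] above), so a single cell comes back as a one-element list:
    #   value = Feishu.get_range_value("demo", "xiaoniangao", "yatRv2", "B3:B3")
    #   print(value[0])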

    # Delete rows or columns (ROWS or COLUMNS)
    @classmethod
    def dimension_range(cls, log_type, crawler, sheetid, major_dimension, startindex, endindex):
        """
        Delete rows or columns
        :param log_type: which log to write to
        :param crawler: which crawler's spreadsheet
        :param sheetid: which worksheet
        :param major_dimension: default ROWS; ROWS or COLUMNS
        :param startindex: start position
        :param endindex: end position
        :return:
        """
        dimension_range_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                              + cls.spreadsheettoken(crawler) + "/dimension_range"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "dimension": {
                "sheetId": sheetid,
                "majorDimension": major_dimension,
                "startIndex": startindex,
                "endIndex": endindex
            }
        }
        try:
            urllib3.disable_warnings()
            r = requests.delete(url=dimension_range_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Delete video data: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to delete video data: {}", e)
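
    # Usage sketch, assuming this DELETE endpoint reads startIndex/endIndex
    # as an inclusive 1-based range (verify against the Feishu docs), so
    # (2, 2) would remove the second row; tab id and log_type illustrative:
    #   Feishu.dimension_range("demo", "xiaoniangao", "yatRv2", "ROWS", 2, 2)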

    # Get a user's open_id
    @classmethod
    def get_userid(cls, log_type, username):
        try:
            url = "https://open.feishu.cn/open-apis/user/v1/batch_get_id?"
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type),
                "Content-Type": "application/json; charset=utf-8"
            }
            # Map a known username to its phone number
            if username == "wangkun":
                username = cls.wangkun
            elif username == "gaonannan":
                username = cls.gaonannan
            elif username == "xinxin":
                username = cls.xinxin
            elif username == "huxinxue":
                username = cls.huxinxue
            data = {"mobiles": [username]}
            urllib3.disable_warnings()
            r = requests.get(url=url, headers=headers, params=data, verify=False, proxies=proxies)
            open_id = r.json()["data"]["mobile_users"][username][0]["open_id"]
            Common.logger(log_type).info("{}:{}", username, open_id)
            # print(f"{username}:{open_id}")
            return open_id
        except Exception as e:
            Common.logger(log_type).error("get_userid exception: {}", e)

    # Feishu bot
    @classmethod
    def bot(cls, log_type, crawler, text):
        try:
            url = "https://open.feishu.cn/open-apis/bot/v2/hook/96989577-50e7-4653-9ec2-308fe3f2c5fe"
            headers = {
                'Content-Type': 'application/json'
            }
            # Pick the button label and sheet link for the given crawler
            if crawler == "kanyikan":
                content = "Kanyikan crawler sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih"
            elif crawler == "xiaoniangao_hour":
                content = "Xiaoniangao hourly downloaded sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?sheet=yatRv2"
            elif crawler == "xiaoniangao_person":
                content = "Xiaoniangao user-homepage downloaded sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?sheet=Wu0CeL"
            elif crawler == "xiaoniangao_play":
                content = "Xiaoniangao play-count downloaded sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?sheet=c85k1C"
            elif crawler == "music_album":
                content = "Music album crawler sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnT6zvmfsYe1g0iv4pt7855g"
            elif crawler == "bszf":
                content = "Benshanzhufu crawler sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnGh2rrsPYM4iVNEBO7OqWrb"
            elif crawler == "kuaishou":
                content = "Kuaishou crawler sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnICEfaw9llDNQkKgdymM1xf"
            elif crawler == "gzh":
                content = "Official-account crawler sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnexNXnpDLHhARw0QdiwbYuA"
            elif crawler == "weiqun":
                content = "Weiqun crawler sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnoKThNquYRweaylMFVyo9Hc"
            elif crawler == "weishi":
                content = "Weishi crawler sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn5YSWg91JfVGzj0SFZIRRPh"
            elif crawler == "shipinhao":
                content = "Shipinhao crawler sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn9rOdZRAGFbRkWpn7hqEHGc"
            else:
                content = "Xiaoniangao crawler sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh"
            # Interactive card: an @-mention plus the alert text, and a button linking to the sheet
            data = json.dumps({
                "msg_type": "interactive",
                "card": {
                    "config": {
                        "wide_screen_mode": True,
                        "enable_forward": True
                    },
                    "elements": [{
                        "tag": "div",
                        "text": {
                            "content": "\n<at id=" + str(cls.get_userid(log_type, "wangkun")) + "></at>\n" + text,
                            "tag": "lark_md"
                        }
                    }, {
                        "actions": [{
                            "tag": "button",
                            "text": {
                                "content": content,
                                "tag": "lark_md"
                            },
                            "url": sheet_url,
                            "type": "default",
                            "value": {}
                        }],
                        "tag": "action"
                    }],
                    "header": {
                        "title": {
                            "content": "📣 You have a new alert, please check",
                            "tag": "plain_text"
                        }
                    }
                }
            })
            urllib3.disable_warnings()
            r = requests.post(url, headers=headers, data=data, verify=False, proxies=proxies)
            Common.logger(log_type).info("Bot message triggered: {}, {}", r, r.json()["StatusMessage"])
        except Exception as e:
            Common.logger(log_type).error("bot exception: {}", e)


if __name__ == "__main__":
    Feishu.bot("bot", "xiaoniangao_hour", "Hey. Heh heh. Heh heh heh.")
    # Feishu.get_userid("kuaishou", "huxinxue")
    pass