feishu_lib.py

# -*- coding: utf-8 -*-
# @Author: wangkun
# @Time: 2022/8/9
import json

import requests
import urllib3

from main.common import Common

proxies = {"http": None, "https": None}


class Feishu:
    """
    Edit Feishu cloud documents (spreadsheets).
    """
    # Kanyikan crawler data sheet
    kanyikan_url = "https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih?"
    # Kuaishou crawler data sheet
    # kuaishou_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnp4SaJt37q6OOOrYzPMjQkg?"
    kuaishou_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnICEfaw9llDNQkKgdymM1xf?"
    # Weishi crawler data sheet
    weishi_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn5YSWg91JfVGzj0SFZIRRPh?"
    # Xiaoniangao crawler data sheet
    xiaoniangao_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?"
    # Music album sheet
    music_album = "https://w42nne6hzg.feishu.cn/sheets/shtcnT6zvmfsYe1g0iv4pt7855g?"
    # Benshanzhufu data sheet
    crawler_benshanzhufu = "https://w42nne6hzg.feishu.cn/sheets/shtcnGh2rrsPYM4iVNEBO7OqWrb?"
    # Official-account (gzh) crawler sheet
    gzh_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnexNXnpDLHhARw0QdiwbYuA?"
    # Data monitoring sheet
    crawler_monitor = "https://w42nne6hzg.feishu.cn/sheets/shtcnlZWYazInhf7Z60jkbLRJyd?"
    # Phone numbers
    wangkun = "13426262515"
    gaonannan = "18501180073"
    xinxin = "15546206651"
    huxinxue = "18832292015"

    # Feishu spreadsheet tokens (the path segment of each sheet URL above)
    @classmethod
    def spreadsheettoken(cls, crawler):
        """
        :param crawler: which crawler
        """
        if crawler == "kanyikan":
            return "shtcngRPoDYAi24x52j2nDuHMih"
        elif crawler == "kuaishou":
            # return "shtcnp4SaJt37q6OOOrYzPMjQkg"
            return "shtcnICEfaw9llDNQkKgdymM1xf"
        elif crawler == "weishi":
            return "shtcn5YSWg91JfVGzj0SFZIRRPh"
        elif crawler == "xiaoniangao":
            return "shtcnYxiyQ1wLklo1W5Kdqc9cGh"
        elif crawler == "monitor":
            return "shtcnlZWYazInhf7Z60jkbLRJyd"
        elif crawler == "music_album":
            return "shtcnT6zvmfsYe1g0iv4pt7855g"
        elif crawler == "bszf":
            return "shtcnGh2rrsPYM4iVNEBO7OqWrb"
        elif crawler == "gzh":
            return "shtcnexNXnpDLHhARw0QdiwbYuA"

    # Get a Feishu API token
    @classmethod
    def get_token(cls, log_type):
        """
        Get a Feishu API tenant_access_token.
        :return: the token string, or None on failure
        """
        url = "https://open.feishu.cn/open-apis/auth/v3/tenant_access_token/internal/"
        post_data = {"app_id": "cli_a13ad2afa438d00b",  # credentials of the app published from the admin console
                     "app_secret": "4tK9LY9VbiQlY5umhE42dclBFo6t4p5O"}
        try:
            urllib3.disable_warnings()
            response = requests.post(url=url, data=post_data, proxies=proxies, verify=False)
            tenant_access_token = response.json()["tenant_access_token"]
            return tenant_access_token
        except Exception as e:
            Common.logger(log_type).error("Failed to get Feishu API token: {}", e)

    # Get spreadsheet metadata
    @classmethod
    def get_metainfo(cls, log_type, crawler):
        """
        Get spreadsheet metadata.
        :return: the metadata response as a dict
        """
        get_metainfo_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                           + cls.spreadsheettoken(crawler) + "/metainfo"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            "extFields": "protectedRange",  # extra fields to return; protectedRange returns protected row/column info
            "user_id_type": "open_id"  # type of user id to return: open_id or union_id
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_metainfo_url, headers=headers, params=params, proxies=proxies, verify=False)
            response = json.loads(r.content.decode("utf8"))
            return response
        except Exception as e:
            Common.logger(log_type).error("Failed to get spreadsheet metadata: {}", e)

    # Read all values from a worksheet
    @classmethod
    def get_values_batch(cls, log_type, crawler, sheetid):
        """
        Read all values from a worksheet.
        :param log_type: which log to use
        :param crawler: which crawler
        :param sheetid: which worksheet
        :return: all values
        """
        get_values_batch_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                               + cls.spreadsheettoken(crawler) + "/values_batch_get"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            # Multiple query ranges, e.g. url?ranges=range1,range2; each range is a sheetId plus an optional cell range
            "ranges": sheetid,
            # valueRenderOption=ToString returns plain-text values (except numeric types);
            # valueRenderOption=FormattedValue computes and formats cells;
            # valueRenderOption=Formula returns the formula itself for cells that contain one;
            # valueRenderOption=UnformattedValue computes but does not format cells
            "valueRenderOption": "ToString",
            # dateTimeRenderOption=FormattedString formats date/time values per their cell format
            # (numbers are left unformatted) and returns the formatted string
            "dateTimeRenderOption": "",
            # type of user id to return: open_id or union_id
            "user_id_type": "open_id"
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_values_batch_url, headers=headers, params=params, proxies=proxies, verify=False)
            # print(r.text)
            response = json.loads(r.content.decode("utf8"))
            values = response["data"]["valueRanges"][0]["values"]
            return values
        except Exception as e:
            Common.logger(log_type).error("Failed to read worksheet values: {}", e)
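
    # A minimal read sketch (the worksheet id "20ce0c" is borrowed from the
    # kanyikan entry in bot() below; any worksheet id of the target spreadsheet
    # would work):
    #
    #     rows = Feishu.get_values_batch("demo", "kanyikan", "20ce0c")
    #     for row in rows[1:]:  # skip the header row
    #         print(row)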

    # Insert rows or columns into a worksheet
    @classmethod
    def insert_columns(cls, log_type, crawler, sheetid, majordimension, startindex, endindex):
        """
        Insert rows or columns into a worksheet.
        :param log_type: log path
        :param crawler: which crawler's cloud document
        :param sheetid: which worksheet
        :param majordimension: ROWS or COLUMNS
        :param startindex: start position
        :param endindex: end position
        """
        insert_columns_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                             + cls.spreadsheettoken(crawler) + "/insert_dimension_range"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "dimension": {
                "sheetId": sheetid,
                "majorDimension": majordimension,  # defaults to ROWS; ROWS or COLUMNS
                "startIndex": startindex,  # start position
                "endIndex": endindex  # end position
            },
            "inheritStyle": "AFTER"  # BEFORE or AFTER; omit to not inherit style
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=insert_columns_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Insert rows/columns: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to insert rows/columns: {}", e)

    # Write values
    @classmethod
    def update_values(cls, log_type, crawler, sheetid, ranges, values):
        """
        Write values.
        :param log_type: log path
        :param crawler: which crawler's cloud document
        :param sheetid: which worksheet
        :param ranges: cell range
        :param values: the values to write, as a list
        """
        update_values_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                            + cls.spreadsheettoken(crawler) + "/values_batch_update"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "valueRanges": [
                {
                    "range": sheetid + "!" + ranges,
                    "values": values
                },
            ],
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=update_values_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Write values: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to write values: {}", e)
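
    # An "insert, then write" sketch (illustrative arguments: worksheet id
    # "20ce0c" from bot() below, hypothetical cell values). Inserting a blank
    # row under the header before writing keeps the newest record in row 2:
    #
    #     Feishu.insert_columns("demo", "kanyikan", "20ce0c", "ROWS", 1, 2)
    #     Feishu.update_values("demo", "kanyikan", "20ce0c", "A2:C2",
    #                          [["2022-08-09", "video_id_123", "video title"]])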

    # Merge cells
    @classmethod
    def merge_cells(cls, log_type, crawler, sheetid, ranges):
        """
        Merge cells.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param ranges: the cell range to merge
        """
        merge_cells_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                          + cls.spreadsheettoken(crawler) + "/merge_cells"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "range": sheetid + "!" + ranges,
            "mergeType": "MERGE_ROWS"
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=merge_cells_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Merge cells: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to merge cells: {}", e)

    # Read a single cell
    @classmethod
    def get_range_value(cls, log_type, crawler, sheetid, cell):
        """
        Read the content of a single cell.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param cell: which cell
        :return: the cell content
        """
        get_range_value_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                              + cls.spreadsheettoken(crawler) + "/values/" + sheetid + "!" + cell
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            # valueRenderOption=ToString returns plain-text values (except numeric types);
            # valueRenderOption=FormattedValue computes and formats cells;
            # valueRenderOption=Formula returns the formula itself for cells that contain one;
            # valueRenderOption=UnformattedValue computes but does not format cells.
            "valueRenderOption": "FormattedValue",
            # dateTimeRenderOption=FormattedString formats date/time values per their cell format
            # (numbers are left unformatted) and returns the formatted string.
            "dateTimeRenderOption": "",
            # type of user id to return: open_id or union_id
            "user_id_type": "open_id"
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_range_value_url, headers=headers, params=params, proxies=proxies, verify=False)
            # print(r.text)
            return r.json()["data"]["valueRange"]["values"][0]
        except Exception as e:
            Common.logger(log_type).error("Failed to read cell value: {}", e)

    # Delete rows or columns (ROWS or COLUMNS)
    @classmethod
    def dimension_range(cls, log_type, crawler, sheetid, major_dimension, startindex, endindex):
        """
        Delete rows or columns.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: worksheet
        :param major_dimension: defaults to ROWS; ROWS or COLUMNS
        :param startindex: start position
        :param endindex: end position
        :return:
        """
        dimension_range_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                              + cls.spreadsheettoken(crawler) + "/dimension_range"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "dimension": {
                "sheetId": sheetid,
                "majorDimension": major_dimension,
                "startIndex": startindex,
                "endIndex": endindex
            }
        }
        try:
            urllib3.disable_warnings()
            r = requests.delete(url=dimension_range_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Delete video data: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to delete video data: {}", e)
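
    # A deletion sketch (illustrative arguments; worksheet id "20ce0c" is from
    # the kanyikan entry in bot() below, and the exact index semantics follow
    # Feishu's dimension_range API docs):
    #
    #     Feishu.dimension_range("demo", "kanyikan", "20ce0c", "ROWS", 2, 2)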

    # Get a user's open_id
    @classmethod
    def get_userid(cls, log_type, username):
        try:
            url = "https://open.feishu.cn/open-apis/user/v1/batch_get_id?"
            headers = {
                "Authorization": "Bearer " + cls.get_token(log_type),
                "Content-Type": "application/json; charset=utf-8"
            }
            # Map a known username to its phone number
            if username == "wangkun":
                username = cls.wangkun
            elif username == "gaonannan":
                username = cls.gaonannan
            elif username == "xinxin":
                username = cls.xinxin
            elif username == "huxinxue":
                username = cls.huxinxue
            data = {"mobiles": [username]}
            urllib3.disable_warnings()
            r = requests.get(url=url, headers=headers, params=data, verify=False, proxies=proxies)
            open_id = r.json()["data"]["mobile_users"][username][0]["open_id"]
            Common.logger(log_type).info("{}: {}", username, open_id)
            # print(f"{username}:{open_id}")
            return open_id
        except Exception as e:
            Common.logger(log_type).error("get_userid failed: {}", e)

    # Feishu bot
    @classmethod
    def bot(cls, log_type, crawler, text):
        try:
            url = "https://open.feishu.cn/open-apis/bot/v2/hook/96989577-50e7-4653-9ec2-308fe3f2c5fe"
            headers = {
                'Content-Type': 'application/json'
            }
            if crawler == "kanyikan":
                content = "Kanyikan crawler sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih?sheet=20ce0c"
            elif crawler == "xiaoniangao":
                content = "Xiaoniangao crawler sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?sheet=yatRv2"
            elif crawler == "music_album":
                content = "Music album crawler sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnT6zvmfsYe1g0iv4pt7855g?sheet=f5a76e"
            elif crawler == "bszf":
                content = "Benshanzhufu crawler sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnGh2rrsPYM4iVNEBO7OqWrb?sheet=440018"
            elif crawler == "kuaishou":
                content = "Kuaishou crawler sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnICEfaw9llDNQkKgdymM1xf?sheet=3cd128"
            elif crawler == "gzh":
                content = "Official-account crawler sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnexNXnpDLHhARw0QdiwbYuA?sheet=fCs3BT"
            else:
                content = "Xiaoniangao crawler sheet"
                sheet_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?sheet=yatRv2"
            data = json.dumps({
                "msg_type": "interactive",
                "card": {
                    "config": {
                        "wide_screen_mode": True,
                        "enable_forward": True
                    },
                    "elements": [{
                        "tag": "div",
                        "text": {
                            "content": "\n<at id=" + str(cls.get_userid(log_type, "wangkun")) + "></at>\n" + text,
                            "tag": "lark_md"
                        }
                    }, {
                        "actions": [{
                            "tag": "button",
                            "text": {
                                "content": content,
                                "tag": "lark_md"
                            },
                            "url": sheet_url,
                            "type": "default",
                            "value": {}
                        }],
                        "tag": "action"
                    }],
                    "header": {
                        "title": {
                            "content": "📣 You have a new alert, please check it",
                            "tag": "plain_text"
                        }
                    }
                }
            })
            urllib3.disable_warnings()
            r = requests.post(url, headers=headers, data=data, verify=False, proxies=proxies)
            Common.logger(log_type).info("Triggered bot message: {}, {}", r, r.json()["StatusMessage"])
        except Exception as e:
            Common.logger(log_type).error("bot failed: {}", e)


if __name__ == "__main__":
    Feishu.bot("bot", "kuaishou", "Kuaishou test message, please ignore")
    # Feishu.get_userid("kuaishou", "huxinxue")
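    # More sketches (arguments are illustrative):
    # print(Feishu.get_token("bot"))
    # print(Feishu.get_metainfo("bot", "kuaishou"))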