# feishu_lib.py

# -*- coding: utf-8 -*-
# @Author: wangkun
# @Time: 2022/11/7
import json

import requests
import urllib3

from main.common import Common

proxies = {"http": None, "https": None}


class Feishu:
    """
    Edit Feishu cloud documents (spreadsheets).
    """
    # 看一看 crawler data sheet
    kanyikan_url = "https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih?"
    # 快手 crawler data sheet
    kuaishou_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnp4SaJt37q6OOOrYzPMjQkg?"
    # 微视 crawler data sheet
    weishi_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn5YSWg91JfVGzj0SFZIRRPh?"
    # 小年糕 crawler data sheet
    xiaoniangao_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?"
    # Data monitoring sheet
    crawler_monitor = "https://w42nne6hzg.feishu.cn/sheets/shtcnlZWYazInhf7Z60jkbLRJyd?"
    # 本山祝福 data sheet
    crawler_benshanzhufu = "https://w42nne6hzg.feishu.cn/sheets/shtcnGh2rrsPYM4iVNEBO7OqWrb?"
    # 公众号 crawler sheet
    gzh_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnexNXnpDLHhARw0QdiwbYuA?"
    # 视频号 sheet
    shipinhao_url = 'https://w42nne6hzg.feishu.cn/sheets/shtcn9rOdZRAGFbRkWpn7hqEHGc?'
    # 知青总群 sheet
    zhiqingzongqun_url = 'https://w42nne6hzg.feishu.cn/sheets/shtcnjmhKdJOKdqnEzJcZb5xaHc?'
    # 众妙音信 sheet
    zmyx_url = 'https://w42nne6hzg.feishu.cn/sheets/shtcnbZIxstPeM0xshW07b26sve?'
    # 岁岁年年迎福气 sheet
    ssnnyfq_url = 'https://w42nne6hzg.feishu.cn/sheets/shtcnyJmJSJynHDLLbLTkySfvZe'

    # Feishu spreadsheet token (the path segment of each sheet URL)
    @classmethod
    def spreadsheettoken(cls, crawler):
        """
        :param crawler: which crawler
        """
        if crawler == "kanyikan":
            return "shtcngRPoDYAi24x52j2nDuHMih"
        elif crawler == "kuaishou":
            return "shtcnp4SaJt37q6OOOrYzPMjQkg"
        elif crawler == "weishi":
            return "shtcn5YSWg91JfVGzj0SFZIRRPh"
        elif crawler == "xiaoniangao":
            return "shtcnYxiyQ1wLklo1W5Kdqc9cGh"
        elif crawler == "monitor":
            return "shtcnlZWYazInhf7Z60jkbLRJyd"
        elif crawler == "bszf":
            return "shtcnGh2rrsPYM4iVNEBO7OqWrb"
        elif crawler == "gzh":
            return "shtcnexNXnpDLHhARw0QdiwbYuA"
        elif crawler == "shipinhao":
            return "shtcn9rOdZRAGFbRkWpn7hqEHGc"
        elif crawler == "zhiqingzongqun":
            return "shtcnjmhKdJOKdqnEzJcZb5xaHc"
        elif crawler == "zmyx":
            return "shtcnbZIxstPeM0xshW07b26sve"
        elif crawler == "ssnnyfq":
            return "shtcnyJmJSJynHDLLbLTkySfvZe"

    # Get a Feishu API token
    @classmethod
    def get_token(cls, log_type):
        """
        Get a Feishu API tenant_access_token.
        :return:
        """
        url = "https://open.feishu.cn/open-apis/auth/v3/tenant_access_token/internal/"
        post_data = {"app_id": "cli_a13ad2afa438d00b",  # credentials of the published app's backend
                     "app_secret": "4tK9LY9VbiQlY5umhE42dclBFo6t4p5O"}
        try:
            urllib3.disable_warnings()
            response = requests.post(url=url, data=post_data, proxies=proxies, verify=False)
            tenant_access_token = response.json()["tenant_access_token"]
            return tenant_access_token
        except Exception as e:
            Common.logger(log_type).error("Failed to get Feishu API token: {}", e)

    # Get spreadsheet metadata
    @classmethod
    def get_metainfo(cls, log_type, crawler):
        """
        Get spreadsheet metadata.
        :return:
        """
        get_metainfo_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                           + cls.spreadsheettoken(crawler) + "/metainfo"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            "extFields": "protectedRange",  # extra fields to return; protectedRange adds row/column protection info
            "user_id_type": "open_id"  # type of user ID to return: open_id or union_id
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_metainfo_url, headers=headers, params=params, proxies=proxies, verify=False)
            response = json.loads(r.content.decode("utf8"))
            return response
        except Exception as e:
            Common.logger(log_type).error("Failed to get spreadsheet metadata: {}", e)

    # Read all values from a worksheet
    @classmethod
    def get_values_batch(cls, log_type, crawler, sheetid):
        """
        Read all values from a worksheet.
        :param log_type: which log to use
        :param crawler: which crawler
        :param sheetid: which worksheet
        :return: all values
        """
        get_values_batch_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                               + cls.spreadsheettoken(crawler) + "/values_batch_get"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            # Multiple query ranges, e.g. url?ranges=range1,range2; each range is a sheetId plus a cell range
            "ranges": sheetid,
            # valueRenderOption=ToString returns plain-text values (except numeric types);
            # valueRenderOption=FormattedValue computes and formats the cell;
            # valueRenderOption=Formula returns the formula itself when a cell contains one;
            # valueRenderOption=UnformattedValue computes but does not format the cell
            "valueRenderOption": "ToString",
            # dateTimeRenderOption=FormattedString formats date/time values according to their format
            # (numbers are not formatted) and returns the formatted string
            "dateTimeRenderOption": "",
            # type of user ID to return: open_id or union_id
            "user_id_type": "open_id"
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_values_batch_url, headers=headers, params=params, proxies=proxies, verify=False)
            # print(r.text)
            response = json.loads(r.content.decode("utf8"))
            values = response["data"]["valueRanges"][0]["values"]
            return values
        except Exception as e:
            Common.logger(log_type).error("Failed to read worksheet values: {}", e)

    # Insert rows or columns into a worksheet
    @classmethod
    def insert_columns(cls, log_type, crawler, sheetid, majordimension, startindex, endindex):
        """
        Insert rows or columns into a worksheet.
        :param log_type: log path
        :param crawler: which crawler's cloud document
        :param sheetid: which worksheet
        :param majordimension: rows or columns, ROWS or COLUMNS
        :param startindex: start position
        :param endindex: end position
        """
        insert_columns_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                             + cls.spreadsheettoken(crawler) + "/insert_dimension_range"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "dimension": {
                "sheetId": sheetid,
                "majorDimension": majordimension,  # defaults to ROWS; ROWS or COLUMNS
                "startIndex": startindex,  # start position
                "endIndex": endindex  # end position
            },
            "inheritStyle": "AFTER"  # BEFORE or AFTER; omit to not inherit style
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=insert_columns_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Insert rows or columns: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to insert rows or columns: {}", e)

    # Write values
    @classmethod
    def update_values(cls, log_type, crawler, sheetid, ranges, values):
        """
        Write values to a worksheet.
        :param log_type: log path
        :param crawler: which crawler's cloud document
        :param sheetid: which worksheet
        :param ranges: cell range
        :param values: the data to write, as a list
        """
        update_values_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                            + cls.spreadsheettoken(crawler) + "/values_batch_update"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "valueRanges": [
                {
                    "range": sheetid + "!" + ranges,
                    "values": values
                },
            ],
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=update_values_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Write values: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to write values: {}", e)

    # Merge cells
    @classmethod
    def merge_cells(cls, log_type, crawler, sheetid, ranges):
        """
        Merge cells.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param ranges: the cell range to merge
        """
        merge_cells_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                          + cls.spreadsheettoken(crawler) + "/merge_cells"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "range": sheetid + "!" + ranges,
            "mergeType": "MERGE_ROWS"
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=merge_cells_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Merge cells: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to merge cells: {}", e)

    # Read data from a single cell range
    @classmethod
    def get_range_value(cls, log_type, crawler, sheetid, cell):
        """
        Read the contents of a cell range.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param cell: which cell
        :return: cell contents
        """
        get_range_value_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                              + cls.spreadsheettoken(crawler) + "/values/" + sheetid + "!" + cell
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            # valueRenderOption=ToString returns plain-text values (except numeric types);
            # valueRenderOption=FormattedValue computes and formats the cell;
            # valueRenderOption=Formula returns the formula itself when a cell contains one;
            # valueRenderOption=UnformattedValue computes but does not format the cell.
            "valueRenderOption": "FormattedValue",
            # dateTimeRenderOption=FormattedString formats date/time values according to their format
            # (numbers are not formatted) and returns the formatted string.
            "dateTimeRenderOption": "",
            # type of user ID to return: open_id or union_id
            "user_id_type": "open_id"
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_range_value_url, headers=headers, params=params, proxies=proxies, verify=False)
            # print(r.text)
            return r.json()["data"]["valueRange"]["values"][0]
        except Exception as e:
            Common.logger(log_type).error("Failed to read cell values: {}", e)

    # Delete rows or columns; ROWS or COLUMNS
    @classmethod
    def dimension_range(cls, log_type, crawler, sheetid, major_dimension, startindex, endindex):
        """
        Delete rows or columns.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: worksheet
        :param major_dimension: defaults to ROWS; ROWS or COLUMNS
        :param startindex: start position
        :param endindex: end position
        :return:
        """
        dimension_range_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                              + cls.spreadsheettoken(crawler) + "/dimension_range"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "dimension": {
                "sheetId": sheetid,
                "majorDimension": major_dimension,
                "startIndex": startindex,
                "endIndex": endindex
            }
        }
        try:
            urllib3.disable_warnings()
            r = requests.delete(url=dimension_range_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Delete video data: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to delete video data: {}", e)


if __name__ == "__main__":
    pass
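
    # Minimal usage sketch (left commented out). It is only illustrative: the log type "kanyikan", the
    # worksheet ID "xxxxxx", and the cell range/values below are hypothetical placeholders, and it assumes
    # the app credentials hard-coded in get_token() are still valid. A common pattern with these helpers
    # would be to insert a blank row first and then write into it.
    #
    # token = Feishu.get_token("kanyikan")
    # print(token)
    # all_values = Feishu.get_values_batch("kanyikan", "kanyikan", "xxxxxx")
    # print(all_values)
    # Feishu.insert_columns("kanyikan", "kanyikan", "xxxxxx", "ROWS", 1, 2)
    # Feishu.update_values("kanyikan", "kanyikan", "xxxxxx", "A2:B2", [["demo_title", "demo_video_url"]])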