# -*- coding: utf-8 -*-
# @Author: wangkun
# @Time: 2022/8/1
import json

import requests
import urllib3

from main.common import Common

proxies = {"http": None, "https": None}


class Feishu:
    """
    Edit Feishu (Lark) cloud spreadsheet documents.
    """
    # Kanyikan crawler data sheet
    kanyikan_url = "https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih?"
    # Kuaishou crawler data sheet
    kuaishou_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnp4SaJt37q6OOOrYzPMjQkg?"
    # Weishi crawler data sheet
    weishi_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn5YSWg91JfVGzj0SFZIRRPh?"
    # Xiaoniangao crawler data sheet
    xiaoniangao_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?"
    # Data monitoring sheet
    crawler_monitor = "https://w42nne6hzg.feishu.cn/sheets/shtcnlZWYazInhf7Z60jkbLRJyd?"
    # Benshan Zhufu data sheet
    crawler_benshanzhufu = "https://w42nne6hzg.feishu.cn/sheets/shtcnGh2rrsPYM4iVNEBO7OqWrb?"
    # Official Accounts (gzh) crawler sheet
    gzh_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnexNXnpDLHhARw0QdiwbYuA?"

    # Feishu spreadsheet token for each crawler's document
    @classmethod
    def spreadsheettoken(cls, crawler):
        """
        :param crawler: which crawler
        """
        if crawler == "kanyikan":
            return "shtcngRPoDYAi24x52j2nDuHMih"
        elif crawler == "kuaishou":
            return "shtcnp4SaJt37q6OOOrYzPMjQkg"
        elif crawler == "weishi":
            return "shtcn5YSWg91JfVGzj0SFZIRRPh"
        elif crawler == "xiaoniangao":
            return "shtcnYxiyQ1wLklo1W5Kdqc9cGh"
        elif crawler == "monitor":
            return "shtcnlZWYazInhf7Z60jkbLRJyd"
        elif crawler == "bszf":
            return "shtcnGh2rrsPYM4iVNEBO7OqWrb"
        elif crawler == "gzh":
            return "shtcnexNXnpDLHhARw0QdiwbYuA"

    # Get a Feishu API token
    @classmethod
    def get_token(cls, log_type):
        """
        Get a Feishu API tenant_access_token.
        :return:
        """
        url = "https://open.feishu.cn/open-apis/auth/v3/tenant_access_token/internal/"
        post_data = {"app_id": "cli_a13ad2afa438d00b",  # credentials of the published app's backend account
                     "app_secret": "4tK9LY9VbiQlY5umhE42dclBFo6t4p5O"}
        try:
            urllib3.disable_warnings()
            response = requests.post(url=url, data=post_data, proxies=proxies, verify=False)
            tenant_access_token = response.json()["tenant_access_token"]
            return tenant_access_token
        except Exception as e:
            Common.logger(log_type).error("Exception while getting Feishu API token: {}", e)
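
    # Usage sketch (illustrative, not part of the original module): on success the
    # tenant_access_token endpoint is expected to return JSON roughly like
    # {"code": 0, "msg": "ok", "tenant_access_token": "t-...", "expire": 7200};
    # on any failure the exception is logged above and the method returns None.
    #   token = Feishu.get_token("gzh")
    #   headers = {"Authorization": "Bearer " + token}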

    # Get spreadsheet metadata
    @classmethod
    def get_metainfo(cls, log_type, crawler):
        """
        Get spreadsheet metadata.
        :return:
        """
        get_metainfo_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                           + cls.spreadsheettoken(crawler) + "/metainfo"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            "extFields": "protectedRange",  # extra fields to return; protectedRange returns protected row/column info
            "user_id_type": "open_id"  # type of user id to return: open_id or union_id
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_metainfo_url, headers=headers, params=params, proxies=proxies, verify=False)
            response = json.loads(r.content.decode("utf8"))
            return response
        except Exception as e:
            Common.logger(log_type).error("Exception while getting spreadsheet metadata: {}", e)
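
    # Usage sketch (illustrative; assumes the sheets v2 metainfo response lists
    # worksheets under data.sheets, each with a sheetId and title):
    #   metainfo = Feishu.get_metainfo("gzh", "gzh")
    #   for sheet in metainfo["data"]["sheets"]:
    #       print(sheet["sheetId"], sheet["title"])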

    # Read all data from a worksheet
    @classmethod
    def get_values_batch(cls, log_type, crawler, sheetid):
        """
        Read all data from a worksheet.
        :param log_type: which log to use
        :param crawler: which crawler
        :param sheetid: which worksheet
        :return: all rows
        """
        get_values_batch_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                               + cls.spreadsheettoken(crawler) + "/values_batch_get"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            # Multiple query ranges, e.g. url?ranges=range1,range2, where each range
            # consists of a sheetId plus an optional cell range
            "ranges": sheetid,
            # valueRenderOption=ToString returns plain-text values (except numeric types);
            # valueRenderOption=FormattedValue computes and formats the cell;
            # valueRenderOption=Formula returns the formula itself when the cell contains one;
            # valueRenderOption=UnformattedValue computes but does not format the cell
            "valueRenderOption": "ToString",
            # dateTimeRenderOption=FormattedString computes dates/times and formats them according
            # to their cell format (numbers are not formatted), returning the formatted string
            "dateTimeRenderOption": "",
            # Type of user id to return: open_id or union_id
            "user_id_type": "open_id"
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_values_batch_url, headers=headers, params=params, proxies=proxies, verify=False)
            # print(r.text)
            response = json.loads(r.content.decode("utf8"))
            values = response["data"]["valueRanges"][0]["values"]
            return values
        except Exception as e:
            Common.logger(log_type).error("Exception while reading worksheet data: {}", e)
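
    # Usage sketch (illustrative; "a1b2c3" stands in for a real worksheet id):
    #   rows = Feishu.get_values_batch("gzh", "gzh", "a1b2c3")
    #   for i, row in enumerate(rows):
    #       print(i, row)  # each row is a list of cell values, header row included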

    # Insert rows or columns into a worksheet
    @classmethod
    def insert_columns(cls, log_type, crawler, sheetid, majordimension, startindex, endindex):
        """
        Insert rows or columns into a worksheet.
        :param log_type: log path
        :param crawler: which crawler's document
        :param sheetid: which worksheet
        :param majordimension: rows or columns, ROWS / COLUMNS
        :param startindex: start position
        :param endindex: end position
        """
        insert_columns_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                             + cls.spreadsheettoken(crawler) + "/insert_dimension_range"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "dimension": {
                "sheetId": sheetid,
                "majorDimension": majordimension,  # defaults to ROWS; ROWS or COLUMNS
                "startIndex": startindex,  # start position
                "endIndex": endindex  # end position
            },
            "inheritStyle": "AFTER"  # BEFORE or AFTER; omit to not inherit style
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=insert_columns_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Insert rows/columns: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Exception while inserting rows/columns: {}", e)
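
    # Usage sketch (illustrative): insert one blank row right below the header row of
    # worksheet "a1b2c3" (a placeholder id), e.g.
    #   Feishu.insert_columns("gzh", "gzh", "a1b2c3", "ROWS", 1, 2)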

    # Write data
    @classmethod
    def update_values(cls, log_type, crawler, sheetid, ranges, values):
        """
        Write data.
        :param log_type: log path
        :param crawler: which crawler's document
        :param sheetid: which worksheet
        :param ranges: cell range
        :param values: the data to write, as a list
        """
        update_values_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                            + cls.spreadsheettoken(crawler) + "/values_batch_update"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "valueRanges": [
                {
                    "range": sheetid + "!" + ranges,
                    "values": values
                },
            ],
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=update_values_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Write data: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Exception while writing data: {}", e)
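
    # Usage sketch (illustrative; "a1b2c3" is a placeholder worksheet id): e.g. insert
    # a blank row first, then fill it with one row of values:
    #   Feishu.insert_columns("gzh", "gzh", "a1b2c3", "ROWS", 1, 2)
    #   Feishu.update_values("gzh", "gzh", "a1b2c3", "A2:C2",
    #                        [["2022-08-01", "video_title", "video_url"]])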

    # Merge cells
    @classmethod
    def merge_cells(cls, log_type, crawler, sheetid, ranges):
        """
        Merge cells.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param ranges: cell range to merge
        """
        merge_cells_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                          + cls.spreadsheettoken(crawler) + "/merge_cells"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "range": sheetid + "!" + ranges,
            "mergeType": "MERGE_ROWS"
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=merge_cells_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Merge cells: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Exception while merging cells: {}", e)
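
    # Usage sketch (illustrative): merge A2:A4 of worksheet "a1b2c3" (a placeholder id);
    # note the request body above hard-codes mergeType to MERGE_ROWS:
    #   Feishu.merge_cells("gzh", "gzh", "a1b2c3", "A2:A4")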

    # Read cell data
    @classmethod
    def get_range_value(cls, log_type, crawler, sheetid, cell):
        """
        Read the content of a cell.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param cell: which cell
        :return: cell content
        """
        get_range_value_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                              + cls.spreadsheettoken(crawler) + "/values/" + sheetid + "!" + cell
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            # valueRenderOption=ToString returns plain-text values (except numeric types);
            # valueRenderOption=FormattedValue computes and formats the cell;
            # valueRenderOption=Formula returns the formula itself when the cell contains one;
            # valueRenderOption=UnformattedValue computes but does not format the cell.
            "valueRenderOption": "FormattedValue",
            # dateTimeRenderOption=FormattedString computes dates/times and formats them according
            # to their cell format (numbers are not formatted), returning the formatted string.
            "dateTimeRenderOption": "",
            # Type of user id to return: open_id or union_id
            "user_id_type": "open_id"
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_range_value_url, headers=headers, params=params, proxies=proxies, verify=False)
            # print(r.text)
            return r.json()["data"]["valueRange"]["values"][0]
        except Exception as e:
            Common.logger(log_type).error("Exception while reading cell data: {}", e)
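
    # Usage sketch (illustrative): read cell B2 of worksheet "a1b2c3" (a placeholder id);
    # the return value is the first row of the requested range, i.e. a list of cell values:
    #   cell_values = Feishu.get_range_value("gzh", "gzh", "a1b2c3", "B2:B2")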

    # Delete rows or columns; ROWS or COLUMNS
    @classmethod
    def dimension_range(cls, log_type, crawler, sheetid, major_dimension, startindex, endindex):
        """
        Delete rows or columns.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: worksheet
        :param major_dimension: defaults to ROWS; ROWS or COLUMNS
        :param startindex: start position
        :param endindex: end position
        :return:
        """
        dimension_range_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                              + cls.spreadsheettoken(crawler) + "/dimension_range"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "dimension": {
                "sheetId": sheetid,
                "majorDimension": major_dimension,
                "startIndex": startindex,
                "endIndex": endindex
            }
        }
        try:
            urllib3.disable_warnings()
            r = requests.delete(url=dimension_range_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Delete video data: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Exception while deleting video data: {}", e)
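
    # Usage sketch (illustrative; assumes the API's row indexing is 1-based and inclusive):
    # deleting row 3 of worksheet "a1b2c3" (a placeholder id) would look roughly like
    #   Feishu.dimension_range("gzh", "gzh", "a1b2c3", "ROWS", 3, 3)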


if __name__ == "__main__":
    print(Feishu.get_token('gzh'))
    pass