feishu_lib.py

# -*- coding: utf-8 -*-
# @Author: wangkun
# @Time: 2023/1/9
import json

import requests
import urllib3

from main.ganggangdouchuan_common import Common

proxies = {"http": None, "https": None}

class Feishu:
    """
    Edit Feishu cloud spreadsheet documents.
    """
    # Ganggangdouchuan spreadsheet
    crawler_ganggangdouchuan = 'https://w42nne6hzg.feishu.cn/sheets/shtcnTuJgeZU2bc7VaesAqk3QJx'

    # Feishu spreadsheet token
    @classmethod
    def spreadsheettoken(cls, crawler):
        """
        :param crawler: which crawler
        """
        if crawler == "kanyikan":
            return "shtcngRPoDYAi24x52j2nDuHMih"
        elif crawler == "kuaishou":
            return "shtcnp4SaJt37q6OOOrYzPMjQkg"
        elif crawler == "weishi":
            return "shtcn5YSWg91JfVGzj0SFZIRRPh"
        elif crawler == "xiaoniangao":
            return "shtcnYxiyQ1wLklo1W5Kdqc9cGh"
        elif crawler == "monitor":
            return "shtcnlZWYazInhf7Z60jkbLRJyd"
        elif crawler == "bszf":
            return "shtcnGh2rrsPYM4iVNEBO7OqWrb"
        elif crawler == "ssyy":
            return "shtcnz1ymxHL1u8WHblfqfys7qe"
        elif crawler == "ggdc":
            return "shtcnTuJgeZU2bc7VaesAqk3QJx"
    # Get a Feishu API token
    @classmethod
    def get_token(cls, log_type):
        """
        Get a Feishu API tenant access token.
        :return:
        """
        url = "https://open.feishu.cn/open-apis/auth/v3/tenant_access_token/internal/"
        post_data = {"app_id": "cli_a13ad2afa438d00b",  # credentials of the backend account the app was published under
                     "app_secret": "4tK9LY9VbiQlY5umhE42dclBFo6t4p5O"}
        try:
            urllib3.disable_warnings()
            response = requests.post(url=url, data=post_data, proxies=proxies, verify=False)
            tenant_access_token = response.json()["tenant_access_token"]
            return tenant_access_token
        except Exception as e:
            Common.logger(log_type).error("Failed to get Feishu API token: {}", e)
    # Get spreadsheet metadata
    @classmethod
    def get_metainfo(cls, log_type, crawler):
        """
        Get spreadsheet metadata.
        :return:
        """
        get_metainfo_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                           + cls.spreadsheettoken(crawler) + "/metainfo"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            "extFields": "protectedRange",  # extra fields to return; extFields=protectedRange returns protected row/column info
            "user_id_type": "open_id"  # type of user id to return; one of open_id, union_id
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_metainfo_url, headers=headers, params=params, proxies=proxies, verify=False)
            response = json.loads(r.content.decode("utf8"))
            return response
        except Exception as e:
            Common.logger(log_type).error("Failed to get spreadsheet metadata: {}", e)
    # Read all values from a worksheet
    @classmethod
    def get_values_batch(cls, log_type, crawler, sheetid):
        """
        Read all values from a worksheet.
        :param log_type: which log to use
        :param crawler: which crawler
        :param sheetid: which worksheet
        :return: all values
        """
        get_values_batch_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                               + cls.spreadsheettoken(crawler) + "/values_batch_get"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            # Multiple query ranges, e.g. url?ranges=range1,range2, where each range
            # consists of a sheetId plus a cell range.
            "ranges": sheetid,
            # valueRenderOption=ToString returns plain-text values (except numeric types);
            # valueRenderOption=FormattedValue computes and formats the cells;
            # valueRenderOption=Formula returns the formula itself when a cell contains one;
            # valueRenderOption=UnformattedValue computes but does not format the cells.
            "valueRenderOption": "ToString",
            # dateTimeRenderOption=FormattedString formats dates/times according to their
            # format (numbers are left unformatted) and returns the formatted string.
            "dateTimeRenderOption": "",
            # Type of user id to return; one of open_id, union_id.
            "user_id_type": "open_id"
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_values_batch_url, headers=headers, params=params, proxies=proxies, verify=False)
            # print(r.text)
            response = json.loads(r.content.decode("utf8"))
            values = response["data"]["valueRanges"][0]["values"]
            return values
        except Exception as e:
            Common.logger(log_type).error("Failed to read all worksheet values: {}", e)
    # Insert rows or columns into a worksheet
    @classmethod
    def insert_columns(cls, log_type, crawler, sheetid, majordimension, startindex, endindex):
        """
        Insert rows or columns into a worksheet.
        :param log_type: log path
        :param crawler: which crawler's cloud document
        :param sheetid: which worksheet
        :param majordimension: rows or columns; ROWS or COLUMNS
        :param startindex: start position
        :param endindex: end position
        """
        insert_columns_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                             + cls.spreadsheettoken(crawler) + "/insert_dimension_range"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "dimension": {
                "sheetId": sheetid,
                "majorDimension": majordimension,  # default ROWS; one of ROWS, COLUMNS
                "startIndex": startindex,  # start position
                "endIndex": endindex  # end position
            },
            "inheritStyle": "AFTER"  # BEFORE or AFTER; omit to not inherit style
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=insert_columns_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Insert rows/columns: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to insert rows/columns: {}", e)
    # Write values
    @classmethod
    def update_values(cls, log_type, crawler, sheetid, ranges, values):
        """
        Write values.
        :param log_type: log path
        :param crawler: which crawler's cloud document
        :param sheetid: which worksheet
        :param ranges: cell range
        :param values: the values to write, as a list
        """
        update_values_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                            + cls.spreadsheettoken(crawler) + "/values_batch_update"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "valueRanges": [
                {
                    "range": sheetid + "!" + ranges,
                    "values": values
                },
            ],
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=update_values_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Write values: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to write values: {}", e)
    # Merge cells
    @classmethod
    def merge_cells(cls, log_type, crawler, sheetid, ranges):
        """
        Merge cells.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param ranges: the cell range to merge
        """
        merge_cells_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                          + cls.spreadsheettoken(crawler) + "/merge_cells"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "range": sheetid + "!" + ranges,
            "mergeType": "MERGE_ROWS"
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=merge_cells_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Merge cells: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to merge cells: {}", e)
    # Read a cell's value
    @classmethod
    def get_range_value(cls, log_type, crawler, sheetid, cell):
        """
        Read the contents of a cell.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param cell: which cell
        :return: cell contents
        """
        get_range_value_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                              + cls.spreadsheettoken(crawler) + "/values/" + sheetid + "!" + cell
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            # valueRenderOption=ToString returns plain-text values (except numeric types);
            # valueRenderOption=FormattedValue computes and formats the cells;
            # valueRenderOption=Formula returns the formula itself when a cell contains one;
            # valueRenderOption=UnformattedValue computes but does not format the cells.
            "valueRenderOption": "FormattedValue",
            # dateTimeRenderOption=FormattedString formats dates/times according to their
            # format (numbers are left unformatted) and returns the formatted string.
            "dateTimeRenderOption": "",
            # Type of user id to return; one of open_id, union_id.
            "user_id_type": "open_id"
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_range_value_url, headers=headers, params=params, proxies=proxies, verify=False)
            # print(r.text)
            return r.json()["data"]["valueRange"]["values"][0]
        except Exception as e:
            Common.logger(log_type).error("Failed to read cell value: {}", e)
    # Delete rows or columns; one of ROWS, COLUMNS
    @classmethod
    def dimension_range(cls, log_type, crawler, sheetid, major_dimension, startindex, endindex):
        """
        Delete rows or columns.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: worksheet
        :param major_dimension: default ROWS; one of ROWS, COLUMNS
        :param startindex: start position
        :param endindex: end position
        :return:
        """
        dimension_range_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                              + cls.spreadsheettoken(crawler) + "/dimension_range"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "dimension": {
                "sheetId": sheetid,
                "majorDimension": major_dimension,
                "startIndex": startindex,
                "endIndex": endindex
            }
        }
        try:
            urllib3.disable_warnings()
            r = requests.delete(url=dimension_range_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Delete video data: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to delete video data: {}", e)

if __name__ == "__main__":
    feishu = Feishu()
    pass
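    # Minimal usage sketch, kept commented out: it assumes the "ggdc" spreadsheet is
    # reachable with the credentials above, and both the "demo" log type and the
    # "<sheet_id>" worksheet id are illustrative placeholders, not values from this file.
    # values = Feishu.get_values_batch("demo", "ggdc", "<sheet_id>")
    # print(values)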