# feishu_lib.py
# -*- coding: utf-8 -*-
# @Author: wangkun
# @Time: 2022/5/9
import json
import requests
import urllib3
from main.common import Common

proxies = {"http": None, "https": None}


class Feishu:
    """
    Edit Feishu cloud spreadsheets.
    """
    # "Kanyikan" crawler data sheet
    kanyikan_url = "https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih?"
    # "Kuaishou" crawler data sheet
    # kuaishou_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnp4SaJt37q6OOOrYzPMjQkg?"
    kuaishou_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnICEfaw9llDNQkKgdymM1xf?"
    # "Weishi" crawler data sheet
    weishi_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn5YSWg91JfVGzj0SFZIRRPh?"
    # "Xiaoniangao" crawler data sheet
    xiaoniangao_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?"
    # Data-monitoring sheet
    crawler_monitor = "https://w42nne6hzg.feishu.cn/sheets/shtcnlZWYazInhf7Z60jkbLRJyd?"
    # Spreadsheet token for each crawler's Feishu document
    @classmethod
    def spreadsheettoken(cls, crawler):
        """
        :param crawler: which crawler
        """
        if crawler == "kanyikan":
            return "shtcngRPoDYAi24x52j2nDuHMih"
        elif crawler == "kuaishou":
            # return "shtcnp4SaJt37q6OOOrYzPMjQkg"
            return "shtcnICEfaw9llDNQkKgdymM1xf"
        elif crawler == "weishi":
            return "shtcn5YSWg91JfVGzj0SFZIRRPh"
        elif crawler == "xiaoniangao":
            return "shtcnYxiyQ1wLklo1W5Kdqc9cGh"
        elif crawler == "monitor":
            return "shtcnlZWYazInhf7Z60jkbLRJyd"
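
    # A minimal alternative sketch: the if/elif chain above could be a dict
    # lookup over the same tokens (the _SPREADSHEET_TOKENS name is
    # illustrative, not part of the original code):
    #
    #     _SPREADSHEET_TOKENS = {
    #         "kanyikan": "shtcngRPoDYAi24x52j2nDuHMih",
    #         "kuaishou": "shtcnICEfaw9llDNQkKgdymM1xf",
    #         "weishi": "shtcn5YSWg91JfVGzj0SFZIRRPh",
    #         "xiaoniangao": "shtcnYxiyQ1wLklo1W5Kdqc9cGh",
    #         "monitor": "shtcnlZWYazInhf7Z60jkbLRJyd",
    #     }
    #     return _SPREADSHEET_TOKENS.get(crawler)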

    # Fetch a Feishu API token
    @classmethod
    def get_token(cls, log_type):
        """
        Fetch a Feishu tenant access token.
        :return:
        """
        url = "https://open.feishu.cn/open-apis/auth/v3/tenant_access_token/internal/"
        post_data = {"app_id": "cli_a13ad2afa438d00b",  # app id and secret from the admin backend of the published app
                     "app_secret": "4tK9LY9VbiQlY5umhE42dclBFo6t4p5O"}
        try:
            urllib3.disable_warnings()
            response = requests.post(url=url, data=post_data, proxies=proxies, verify=False)
            tenant_access_token = response.json()["tenant_access_token"]
            return tenant_access_token
        except Exception as e:
            Common.logger(log_type).error("Failed to fetch Feishu API token: {}", e)
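
    # For reference, a successful response from the tenant_access_token
    # endpoint has the shape below (values are illustrative):
    #
    #     {"code": 0, "msg": "ok", "tenant_access_token": "t-xxxx", "expire": 7200}
    #
    # Note that get_token() returns None on failure, so the
    # "Bearer " + cls.get_token(...) calls below would raise a TypeError in
    # that case.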

    # Fetch spreadsheet metadata
    @classmethod
    def get_metainfo(cls, log_type, crawler):
        """
        Fetch spreadsheet metadata.
        :return:
        """
        get_metainfo_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                           + cls.spreadsheettoken(crawler) + "/metainfo"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            "extFields": "protectedRange",  # extra fields to return; extFields=protectedRange returns protected row/column info
            "user_id_type": "open_id"  # type of user id to return; open_id or union_id
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_metainfo_url, headers=headers, params=params, proxies=proxies, verify=False)
            response = json.loads(r.content.decode("utf8"))
            return response
        except Exception as e:
            Common.logger(log_type).error("Failed to fetch spreadsheet metadata: {}", e)
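
    # A minimal usage sketch, assuming the v2 metainfo response layout
    # (data.sheets is a list of worksheets carrying sheetId and title):
    #
    #     meta = Feishu.get_metainfo("person", "monitor")
    #     for sheet in meta["data"]["sheets"]:
    #         print(sheet["sheetId"], sheet["title"])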

    # Read all data from a worksheet
    @classmethod
    def get_values_batch(cls, log_type, crawler, sheetid):
        """
        Read all data from a worksheet.
        :param log_type: which log to use
        :param crawler: which crawler
        :param sheetid: which worksheet
        :return: all values in the sheet
        """
        get_values_batch_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                               + cls.spreadsheettoken(crawler) + "/values_batch_get"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            # Multiple query ranges, e.g. url?ranges=range1,range2, where each
            # range consists of a sheetId plus a cell range
            "ranges": sheetid,
            # valueRenderOption=ToString returns plain-text values (except numeric types);
            # valueRenderOption=FormattedValue computes and formats the cells;
            # valueRenderOption=Formula returns the formula itself when a cell contains one;
            # valueRenderOption=UnformattedValue computes but does not format the cells
            "valueRenderOption": "ToString",
            # dateTimeRenderOption=FormattedString computes and formats dates/times
            # according to their format (numbers are not formatted) and returns
            # the formatted string
            "dateTimeRenderOption": "",
            # type of user id to return; open_id or union_id
            "user_id_type": "open_id"
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_values_batch_url, headers=headers, params=params, proxies=proxies, verify=False)
            # print(r.text)
            response = json.loads(r.content.decode("utf8"))
            values = response["data"]["valueRanges"][0]["values"]
            return values
        except Exception as e:
            Common.logger(log_type).error("Failed to read worksheet data: {}", e)
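
    # A minimal usage sketch ("dzcWHw" is the xiaoniangao worksheet id already
    # used in the examples at the bottom of this file); the return value is a
    # list of rows, each row a list of cell values:
    #
    #     rows = Feishu.get_values_batch("person", "xiaoniangao", "dzcWHw")
    #     for row in rows:
    #         print(row)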

    # Insert rows or columns into a worksheet
    @classmethod
    def insert_columns(cls, log_type, crawler, sheetid, majordimension, startindex, endindex):
        """
        Insert rows or columns into a worksheet.
        :param log_type: log path
        :param crawler: which crawler's cloud document
        :param sheetid: which worksheet
        :param majordimension: rows or columns, ROWS or COLUMNS
        :param startindex: start position
        :param endindex: end position
        """
        insert_columns_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                             + cls.spreadsheettoken(crawler) + "/insert_dimension_range"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "dimension": {
                "sheetId": sheetid,
                "majorDimension": majordimension,  # defaults to ROWS; either ROWS or COLUMNS
                "startIndex": startindex,  # start position
                "endIndex": endindex  # end position
            },
            "inheritStyle": "AFTER"  # BEFORE or AFTER; omit to not inherit style
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=insert_columns_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Inserted rows/columns: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to insert rows/columns: {}", e)
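
    # A minimal usage sketch, assuming the insert_dimension_range semantics
    # from the Feishu docs (zero-based indexes; endIndex - startIndex rows are
    # inserted). Inserting one empty row right below the header row would be:
    #
    #     Feishu.insert_columns("person", "xiaoniangao", "dzcWHw", "ROWS", 1, 2)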

    # Write data
    @classmethod
    def update_values(cls, log_type, crawler, sheetid, ranges, values):
        """
        Write data into a worksheet.
        :param log_type: log path
        :param crawler: which crawler's cloud document
        :param sheetid: which worksheet
        :param ranges: cell range
        :param values: the data to write, as a list
        """
        update_values_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                            + cls.spreadsheettoken(crawler) + "/values_batch_update"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "valueRanges": [
                {
                    "range": sheetid + "!" + ranges,
                    "values": values
                },
            ],
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=update_values_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Wrote data: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to write data: {}", e)
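
    # A minimal usage sketch: values is a list of rows, each row a list of
    # cells, and the range must match that shape. Writing one row of two cells
    # into A2:B2 would be (the cell contents here are illustrative):
    #
    #     Feishu.update_values("person", "xiaoniangao", "dzcWHw", "A2:B2",
    #                          [["title", "https://example.com"]])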

    # Merge cells
    @classmethod
    def merge_cells(cls, log_type, crawler, sheetid, ranges):
        """
        Merge cells.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param ranges: the cell range to merge
        """
        merge_cells_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                          + cls.spreadsheettoken(crawler) + "/merge_cells"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "range": sheetid + "!" + ranges,
            "mergeType": "MERGE_ROWS"
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=merge_cells_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Merged cells: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to merge cells: {}", e)
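
    # For reference, the merge_cells API also accepts mergeType=MERGE_ALL
    # (merge the whole range into one cell) and mergeType=MERGE_COLUMNS
    # (merge column-wise); this helper hardcodes MERGE_ROWS, which merges each
    # row of the range separately.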

    # Read the contents of a cell range
    @classmethod
    def get_range_value(cls, log_type, crawler, sheetid, cell):
        """
        Read the contents of a cell.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param cell: which cell
        :return: cell contents
        """
        get_range_value_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                              + cls.spreadsheettoken(crawler) + "/values/" + sheetid + "!" + cell
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            # valueRenderOption=ToString returns plain-text values (except numeric types);
            # valueRenderOption=FormattedValue computes and formats the cells;
            # valueRenderOption=Formula returns the formula itself when a cell contains one;
            # valueRenderOption=UnformattedValue computes but does not format the cells.
            "valueRenderOption": "FormattedValue",
            # dateTimeRenderOption=FormattedString computes and formats dates/times
            # according to their format (numbers are not formatted) and returns
            # the formatted string.
            "dateTimeRenderOption": "",
            # type of user id to return; open_id or union_id
            "user_id_type": "open_id"
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_range_value_url, headers=headers, params=params, proxies=proxies, verify=False)
            # print(r.text)
            return r.json()["data"]["valueRange"]["values"][0]
        except Exception as e:
            Common.logger(log_type).error("Failed to read cell data: {}", e)

    # Delete rows or columns; either ROWS or COLUMNS
    @classmethod
    def dimension_range(cls, log_type, crawler, sheetid, major_dimension, startindex, endindex):
        """
        Delete rows or columns.
        :param log_type: log path
        :param crawler: which crawler
        :param sheetid: worksheet
        :param major_dimension: defaults to ROWS; either ROWS or COLUMNS
        :param startindex: start position
        :param endindex: end position
        :return:
        """
        dimension_range_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                              + cls.spreadsheettoken(crawler) + "/dimension_range"
        headers = {
            "Authorization": "Bearer " + cls.get_token(log_type),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "dimension": {
                "sheetId": sheetid,
                "majorDimension": major_dimension,
                "startIndex": startindex,
                "endIndex": endindex
            }
        }
        try:
            urllib3.disable_warnings()
            r = requests.delete(url=dimension_range_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger(log_type).info("Deleted rows/columns: {}", r.json()["msg"])
        except Exception as e:
            Common.logger(log_type).error("Failed to delete rows/columns: {}", e)


if __name__ == "__main__":
    feishu = Feishu()
    # print(feishu.get_range_value("person", "xiaoniangao", "dzcWHw", "B4:B4")[0])
    # print(feishu.get_range_value("person", "xiaoniangao", "dzcWHw", "C5:C5")[0][0]["link"])
    # print(feishu.get_range_value("person", "xiaoniangao", "dzcWHw", "B6:B6")[0])
    # print(feishu.get_range_value("person", "xiaoniangao", "dzcWHw", "B7:B7")[0])
    pass
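
    # A minimal end-to-end sketch, assuming the credentials baked into
    # get_token() are still valid and "dzcWHw" is a live worksheet of the
    # xiaoniangao document (both taken from the examples above):
    #
    #     token = Feishu.get_token("person")
    #     if token is not None:
    #         rows = Feishu.get_values_batch("person", "xiaoniangao", "dzcWHw")
    #         print(len(rows), "rows read")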