feishu_lib.py
# -*- coding: utf-8 -*-
# @Author: wangkun
# @Time: 2022/5/11
import json
import time
import requests
import urllib3
from main.common import Common

proxies = {"http": None, "https": None}


class Feishu:
    """
    Edit Feishu cloud documents.
    """
    # Kanyikan crawler data sheet
    kanyikan_url = "https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih?"
    # Kuaishou crawler data sheet
    kuaishou_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnp4SaJt37q6OOOrYzPMjQkg?"
    # Weishi crawler data sheet
    weishi_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn5YSWg91JfVGzj0SFZIRRPh?"
    # Xiaoniangao crawler data sheet
    xiaoniangao_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?"

    # Feishu spreadsheet tokens
    @classmethod
    def spreadsheetToken(cls, crawler):
        """
        :param crawler: which crawler
        :return: the spreadsheet token for that crawler's sheet
        """
        if crawler == "kanyikan":
            return "shtcngRPoDYAi24x52j2nDuHMih"
        elif crawler == "kuaishou":
            return "shtcnp4SaJt37q6OOOrYzPMjQkg"
        elif crawler == "weishi":
            return "shtcn5YSWg91JfVGzj0SFZIRRPh"
        elif crawler == "xiaoniangao":
            return "shtcnYxiyQ1wLklo1W5Kdqc9cGh"
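
    # Illustrative alternative, not part of the original file: the same lookup
    # as a mapping. A dict access raises KeyError on a misspelled crawler name
    # instead of silently returning None (the names below are hypothetical):
    #
    #     _SPREADSHEET_TOKENS = {
    #         "kanyikan": "shtcngRPoDYAi24x52j2nDuHMih",
    #         "kuaishou": "shtcnp4SaJt37q6OOOrYzPMjQkg",
    #         "weishi": "shtcn5YSWg91JfVGzj0SFZIRRPh",
    #         "xiaoniangao": "shtcnYxiyQ1wLklo1W5Kdqc9cGh",
    #     }
    #     return _SPREADSHEET_TOKENS[crawler]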

    # Get a Feishu API token
    @classmethod
    def get_token(cls):
        """
        Get a Feishu API tenant_access_token.
        :return: the token string
        """
        url = "https://open.feishu.cn/open-apis/auth/v3/tenant_access_token/internal/"
        post_data = {"app_id": "cli_a13ad2afa438d00b",  # credentials of the app's admin backend account
                     "app_secret": "4tK9LY9VbiQlY5umhE42dclBFo6t4p5O"}
        try:
            urllib3.disable_warnings()
            response = requests.post(url=url, data=post_data, proxies=proxies, verify=False)
            tenant_access_token = response.json()["tenant_access_token"]
            return tenant_access_token
        except Exception as e:
            Common.logger().error("Failed to get Feishu API token: {}", e)
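
    # Illustrative sketch, not part of the original file: get_token() above is
    # re-fetched on every request. Feishu tokens expire after a limited time
    # (the endpoint's response carries an "expire" field in seconds; the 7200s
    # default below is an assumption), so a minimal class-level cache avoids a
    # round trip per call. _cached_token / _token_deadline / get_token_cached
    # are hypothetical names.
    _cached_token = None
    _token_deadline = 0.0

    @classmethod
    def get_token_cached(cls):
        """Return a cached tenant_access_token, refreshing 60s before expiry."""
        if cls._cached_token is None or time.time() > cls._token_deadline - 60:
            cls._cached_token = cls.get_token()
            cls._token_deadline = time.time() + 7200  # assumed token lifetime
        return cls._cached_token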

    # Get spreadsheet metadata
    @classmethod
    def get_metainfo(cls, crawler):
        """
        Get the spreadsheet's metadata.
        :param crawler: which crawler
        :return: the metadata response
        """
        get_metainfo_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                           + cls.spreadsheetToken(crawler) + "/metainfo"
        headers = {
            "Authorization": "Bearer " + cls.get_token(),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            "extFields": "protectedRange",  # extra fields to return; protectedRange returns protected row/column info
            "user_id_type": "open_id"  # type of user id to return: open_id or union_id
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_metainfo_url, headers=headers, params=params, proxies=proxies, verify=False)
            response = json.loads(r.content.decode("utf8"))
            return response
        except Exception as e:
            Common.logger().error("Failed to get spreadsheet metadata: {}", e)
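
    # Usage sketch: listing the worksheet ids of a spreadsheet. The response
    # layout (data.sheets[*].sheetId) is an assumption based on the Feishu
    # metainfo endpoint; verify it before relying on it.
    #
    #     meta = Feishu.get_metainfo("kanyikan")
    #     sheet_ids = [s["sheetId"] for s in meta["data"]["sheets"]]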

    # Read all data from a worksheet
    @classmethod
    def get_values_batch(cls, crawler, sheetid):
        """
        Read all data from a worksheet.
        :param crawler: which crawler
        :param sheetid: which worksheet
        :return: all values
        """
        get_values_batch_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                               + cls.spreadsheetToken(crawler) + "/values_batch_get"
        headers = {
            "Authorization": "Bearer " + cls.get_token(),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            # Multiple query ranges, e.g. url?ranges=range1,range2, where each range
            # consists of a sheetId plus a cell range
            "ranges": sheetid,
            # valueRenderOption=ToString returns plain-text values (except numeric types);
            # valueRenderOption=FormattedValue computes and formats the cell;
            # valueRenderOption=Formula returns the formula itself if the cell contains one;
            # valueRenderOption=UnformattedValue computes but does not format the cell
            "valueRenderOption": "ToString",
            # dateTimeRenderOption=FormattedString computes and formats dates/times according
            # to their format, but does not format numbers; returns the formatted string.
            "dateTimeRenderOption": "",
            # type of user id to return: open_id or union_id
            "user_id_type": "open_id"
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_values_batch_url, headers=headers, params=params, proxies=proxies, verify=False)
            response = json.loads(r.content.decode("utf8"))
            values = response["data"]["valueRanges"][0]["values"]
            return values
        except Exception as e:
            Common.logger().error("Failed to read all worksheet data: {}", e)
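
    # Usage sketch (sheet id "ba0da4" comes from the __main__ block below):
    # each returned row is a list of cell values, so iterating past a single
    # header row looks like:
    #
    #     for row in Feishu.get_values_batch("xiaoniangao", "ba0da4")[1:]:
    #         print(row)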

    # Insert rows or columns into a worksheet
    @classmethod
    def insert_columns(cls, crawler, sheetid, majordimension, startindex, endindex):
        """
        Insert rows or columns into a worksheet.
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param majordimension: rows or columns
        :param startindex: start position
        :param endindex: end position
        """
        insert_columns_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                             + cls.spreadsheetToken(crawler) + "/insert_dimension_range"
        headers = {
            "Authorization": "Bearer " + cls.get_token(),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "dimension": {
                "sheetId": sheetid,
                "majorDimension": majordimension,  # defaults to ROWS; ROWS or COLUMNS
                "startIndex": startindex,  # start position
                "endIndex": endindex  # end position
            },
            "inheritStyle": "AFTER"  # BEFORE or AFTER; omit to not inherit style
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=insert_columns_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger().info("Insert rows/columns: {}", r.json()["msg"])
        except Exception as e:
            Common.logger().error("Failed to insert rows/columns: {}", e)
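
    # Usage sketch (the index semantics are an assumption; check the Feishu
    # insert_dimension_range docs): endIndex - startIndex blank rows are
    # inserted starting after row startindex, so this would add one row below
    # the header row of worksheet "k2rKkv":
    #
    #     Feishu.insert_columns("kanyikan", "k2rKkv", "ROWS", 1, 2)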

    # Write data
    @classmethod
    def update_values(cls, crawler, sheetid, ranges, values):
        """
        Write data into a worksheet.
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param ranges: cell range
        :param values: the data to write, a list
        """
        update_values_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                            + cls.spreadsheetToken(crawler) + "/values_batch_update"
        headers = {
            "Authorization": "Bearer " + cls.get_token(),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "valueRanges": [
                {
                    "range": sheetid + "!" + ranges,
                    "values": values
                },
            ],
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=update_values_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger().info("Write data: {}", r.json()["msg"])
        except Exception as e:
            Common.logger().error("Failed to write data: {}", e)
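
    # Usage sketch: values is a list of rows, each row a list of cells, and its
    # shape must match ranges. The live call in __main__ below writes a single
    # cell; a two-cell row would look like:
    #
    #     Feishu.update_values("xiaoniangao", "ba0da4", "A4:B4", [["a4", "b4"]])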

    # Merge cells
    @classmethod
    def merge_cells(cls, crawler, sheetid, ranges):
        """
        Merge cells.
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param ranges: the cell range to merge
        """
        merge_cells_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                          + cls.spreadsheetToken(crawler) + "/merge_cells"
        headers = {
            "Authorization": "Bearer " + cls.get_token(),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "range": sheetid + "!" + ranges,
            "mergeType": "MERGE_ROWS"
        }
        try:
            urllib3.disable_warnings()
            r = requests.post(url=merge_cells_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger().info("Merge cells: {}", r.json()["msg"])
        except Exception as e:
            Common.logger().error("Failed to merge cells: {}", e)
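
    # Note: mergeType is hardcoded to MERGE_ROWS here (merge row-by-row within
    # the range); the endpoint also accepts MERGE_ALL and MERGE_COLUMNS, per
    # the Feishu merge_cells docs (stated as an assumption worth verifying).
    # Example, using the range from the __main__ block below:
    #
    #     Feishu.merge_cells("kanyikan", "k2rKkv", "G1:I1")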

    # Read cell data
    @classmethod
    def get_range_value(cls, crawler, sheetid, cell):
        """
        Read the contents of a cell.
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param cell: which cell
        :return: the cell contents
        """
        get_range_value_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                              + cls.spreadsheetToken(crawler) + "/values/" + sheetid + "!" + cell
        headers = {
            "Authorization": "Bearer " + cls.get_token(),
            "Content-Type": "application/json; charset=utf-8"
        }
        params = {
            # valueRenderOption=ToString returns plain-text values (except numeric types);
            # valueRenderOption=FormattedValue computes and formats the cell;
            # valueRenderOption=Formula returns the formula itself if the cell contains one;
            # valueRenderOption=UnformattedValue computes but does not format the cell.
            "valueRenderOption": "FormattedValue",
            # dateTimeRenderOption=FormattedString computes and formats dates/times according
            # to their format, but does not format numbers; returns the formatted string.
            "dateTimeRenderOption": "",
            # type of user id to return: open_id or union_id
            "user_id_type": "open_id"
        }
        try:
            urllib3.disable_warnings()
            r = requests.get(url=get_range_value_url, headers=headers, params=params, proxies=proxies, verify=False)
            return r.json()["data"]["valueRange"]["values"][0]
        except Exception as e:
            Common.logger().error("Failed to read cell data: {}", e)
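
    # Usage sketch (adapted from the commented examples in __main__ below): the
    # method returns the first row of the requested range, so a single-cell
    # read indexes [0]:
    #
    #     cell = Feishu.get_range_value("kanyikan", "k2rKkv", "F3:F3")[0]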

    # Delete rows or columns; ROWS or COLUMNS
    @classmethod
    def dimension_range(cls, crawler, sheetid, major_dimension, startindex, endindex):
        """
        Delete rows or columns.
        :param crawler: which crawler
        :param sheetid: which worksheet
        :param major_dimension: defaults to ROWS; ROWS or COLUMNS
        :param startindex: start position
        :param endindex: end position
        :return:
        """
        dimension_range_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
                              + cls.spreadsheetToken(crawler) + "/dimension_range"
        headers = {
            "Authorization": "Bearer " + cls.get_token(),
            "Content-Type": "application/json; charset=utf-8"
        }
        body = {
            "dimension": {
                "sheetId": sheetid,
                "majorDimension": major_dimension,
                "startIndex": startindex,
                "endIndex": endindex
            }
        }
        try:
            urllib3.disable_warnings()
            r = requests.delete(url=dimension_range_url, headers=headers, json=body, proxies=proxies, verify=False)
            Common.logger().info("Delete video data: {}", r.json()["msg"])
        except Exception as e:
            Common.logger().error("Failed to delete video data: {}", e)
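
    # Usage sketch: deletion is destructive, which is presumably why the
    # __main__ example below stays commented out. Deleting row 3 of worksheet
    # "k2rKkv" would look like:
    #
    #     Feishu.dimension_range("kanyikan", "k2rKkv", "ROWS", 3, 3)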


if __name__ == "__main__":
    feishu = Feishu()

    # # Get a Feishu API token
    # feishu.get_token()
    # Get spreadsheet metadata
    # feishu.get_metainfo()
    # Read all data from a worksheet
    # print(feishu.get_values_batch("xiaoniangao", "ba0da4"))
    # print(len(feishu.get_values_batch("k2rKkv")))
    # for i in range(3, len(feishu.get_values_batch("k2rKkv"))+1):
    #     print(feishu.get_range_value("k2rKkv", "A" + str(i) + ":" + "A" + str(i))[0])
    #     print(feishu.update_hour_list_values("k2rKkv", "G" + str(i) + ":" + "H" + str(i), [["333"]]))
    #     time.sleep(0.5)
    # feishu.get_range_value("k2rKkv", "F3:F3")[0]
    # print(type(feishu.get_range_value("k2rKkv", "H19:H19")[0].split(" ")[-1].split(":")[0]))
    # print(feishu.get_range_value("k2rKkv", "H19:H19")[0])
    # print(int(feishu.get_range_value("xiaoniangao", "ba0da4", "G6:G6")[0].split(" ")[-1].split(":")[0]))
    # print(feishu.get_range_value("xiaoniangao", "ba0da4", "G6:G6")[0].split(" ")[0])
    feishu.update_values("xiaoniangao", "ba0da4", "H4:H4", [["2022-05-18 21:14:27"]])

    # Kanyikan+ worksheet: insert first row
    # print(feishu.insert_columns("k2rKkv", "COLUMNS", 6, 9))
    # print(feishu.update_hour_list_values("k2rKkv"))
    # print(feishu.merge_cells("k2rKkv", "G1:I1"))
    #
    # # Kanyikan+ worksheet: write data into the first row
    # print(feishu.update_values("Y8N3Vl", "a1", "b1", "c1", "d1", "e1", "f1", "g1",
    #                            "h1", "i1", "j1", "k1", "l1", "m1", "n1", "o1"))
    # Query cell contents
    # print(type(feishu.get_range_value("k2rKkv", "G1:G1")[0]))
    #
    # Delete rows or columns; ROWS or COLUMNS
    # feishu.dimension_range("k2rKkv", "ROWS", 3, 3)
    pass