# -*- coding: utf-8 -*-
# File: feishu_lib.py
# @Author: wangkun
# @Time: 2022/5/11
import json
import os

import requests
import urllib3

from main.common import Common
  8. proxies = {"http": None, "https": None}
  9. class Feishu:
  10. """
  11. 编辑飞书云文档
  12. """
  13. # 看一看爬虫数据表
  14. kanyikan_url = "https://w42nne6hzg.feishu.cn/sheets/shtcngRPoDYAi24x52j2nDuHMih?"
  15. # 快手爬虫数据表
  16. kuaishou_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnp4SaJt37q6OOOrYzPMjQkg?"
  17. # 微视爬虫数据表
  18. weishi_url = "https://w42nne6hzg.feishu.cn/sheets/shtcn5YSWg91JfVGzj0SFZIRRPh?"
  19. # 小年糕爬虫数据表
  20. xiaoniangao_url = "https://w42nne6hzg.feishu.cn/sheets/shtcnYxiyQ1wLklo1W5Kdqc9cGh?"
  21. # 飞书路径token
  22. @classmethod
  23. def spreadsheettoken(cls, crawler):
  24. """
  25. :param crawler: 哪个爬虫
  26. """
  27. if crawler == "kanyikan":
  28. return "shtcngRPoDYAi24x52j2nDuHMih"
  29. elif crawler == "kuaishou":
  30. return "shtcnp4SaJt37q6OOOrYzPMjQkg"
  31. elif crawler == "weishi":
  32. return "shtcn5YSWg91JfVGzj0SFZIRRPh"
  33. elif crawler == "xiaoniangao":
  34. return "shtcnYxiyQ1wLklo1W5Kdqc9cGh"
  35. # 获取飞书api token
  36. @classmethod
  37. def get_token(cls, log_path):
  38. """
  39. 获取飞书api token
  40. :return:
  41. """
  42. url = "https://open.feishu.cn/open-apis/auth/v3/tenant_access_token/internal/"
  43. post_data = {"app_id": "cli_a13ad2afa438d00b", # 这里账号密码是发布应用的后台账号及密码
  44. "app_secret": "4tK9LY9VbiQlY5umhE42dclBFo6t4p5O"}
  45. try:
  46. urllib3.disable_warnings()
  47. response = requests.post(url=url, data=post_data, proxies=proxies, verify=False)
  48. tenant_access_token = response.json()["tenant_access_token"]
  49. return tenant_access_token
  50. except Exception as e:
  51. if log_path == "logs":
  52. Common.logger().error("获取飞书 api token 异常:{}", e)
  53. elif log_path == "person-logs":
  54. Common.person_logger().error("获取飞书 api token 异常:{}", e)
  55. # 获取表格元数据
  56. @classmethod
  57. def get_metainfo(cls, log_path, crawler):
  58. """
  59. 获取表格元数据
  60. :return:
  61. """
  62. get_metainfo_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
  63. + cls.spreadsheettoken(crawler) + "/metainfo"
  64. headers = {
  65. "Authorization": "Bearer " + cls.get_token(log_path),
  66. "Content-Type": "application/json; charset=utf-8"
  67. }
  68. params = {
  69. "extFields": "protectedRange", # 额外返回的字段,extFields=protectedRange时返回保护行列信息
  70. "user_id_type": "open_id" # 返回的用户id类型,可选open_id,union_id
  71. }
  72. try:
  73. urllib3.disable_warnings()
  74. r = requests.get(url=get_metainfo_url, headers=headers, params=params, proxies=proxies, verify=False)
  75. response = json.loads(r.content.decode("utf8"))
  76. return response
  77. except Exception as e:
  78. if log_path == "logs":
  79. Common.logger().error("获取表格元数据异常:{}", e)
  80. elif log_path == "person-logs":
  81. Common.person_logger().error("获取表格元数据异常:{}", e)
  82. # 读取工作表中所有数据
  83. @classmethod
  84. def get_values_batch(cls, log_path, crawler, sheetid):
  85. """
  86. 读取工作表中所有数据
  87. :param log_path: 启用哪个 log
  88. :param crawler: 哪个爬虫
  89. :param sheetid: 哪张表
  90. :return: 所有数据
  91. """
  92. get_values_batch_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
  93. + cls.spreadsheettoken(crawler) + "/values_batch_get"
  94. headers = {
  95. "Authorization": "Bearer " + cls.get_token(log_path),
  96. "Content-Type": "application/json; charset=utf-8"
  97. }
  98. params = {
  99. # 多个查询范围 如 url?ranges=range1,range2 ,其中 range 包含 sheetId 与单元格范围两部分
  100. "ranges": sheetid,
  101. # valueRenderOption=ToString 可返回纯文本的值(数值类型除外);
  102. # valueRenderOption=FormattedValue 计算并格式化单元格;
  103. # valueRenderOption=Formula单元格中含有公式时返回公式本身;
  104. # valueRenderOption=UnformattedValue计算但不对单元格进行格式化
  105. "valueRenderOption": "ToString",
  106. # dateTimeRenderOption=FormattedString 计算并将时间日期按照其格式进行格式化,但不会对数字进行格式化,返回格式化后的字符串。
  107. "dateTimeRenderOption": "",
  108. # 返回的用户id类型,可选open_id,union_id
  109. "user_id_type": "open_id"
  110. }
  111. try:
  112. urllib3.disable_warnings()
  113. r = requests.get(url=get_values_batch_url, headers=headers, params=params, proxies=proxies, verify=False)
  114. response = json.loads(r.content.decode("utf8"))
  115. values = response["data"]["valueRanges"][0]["values"]
  116. return values
  117. except Exception as e:
  118. if log_path == "logs":
  119. Common.logger().error("读取工作表所有数据异常:{}", e)
  120. elif log_path == "person-logs":
  121. Common.person_logger().error("读取工作表所有数据异常:{}", e)
  122. # 工作表,插入行或列
  123. @classmethod
  124. def insert_columns(cls, log_path, crawler, sheetid, majordimension, startindex, endindex):
  125. """
  126. 工作表插入行或列
  127. :param log_path: 日志路径
  128. :param crawler: 哪个爬虫
  129. :param sheetid:哪张工作表
  130. :param majordimension:行或者列
  131. :param startindex:开始位置
  132. :param endindex:结束位置
  133. """
  134. insert_columns_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
  135. + cls.spreadsheettoken(crawler) + "/insert_dimension_range"
  136. headers = {
  137. "Authorization": "Bearer " + cls.get_token(log_path),
  138. "Content-Type": "application/json; charset=utf-8"
  139. }
  140. body = {
  141. "dimension": {
  142. "sheetId": sheetid,
  143. "majorDimension": majordimension, # 默认 ROWS ,可选 ROWS、COLUMNS
  144. "startIndex": startindex, # 开始的位置
  145. "endIndex": endindex # 结束的位置
  146. },
  147. "inheritStyle": "AFTER" # BEFORE 或 AFTER,不填为不继承 style
  148. }
  149. try:
  150. urllib3.disable_warnings()
  151. r = requests.post(url=insert_columns_url, headers=headers, json=body, proxies=proxies, verify=False)
  152. if log_path == "logs":
  153. Common.logger().info("插入行或列:{}", r.json()["msg"])
  154. elif log_path == "person-logs":
  155. Common.person_logger().info("插入行或列:{}", r.json()["msg"])
  156. except Exception as e:
  157. if log_path == "logs":
  158. Common.logger().error("插入行或列异常:{}", e)
  159. elif log_path == "person-logs":
  160. Common.person_logger().error("插入行或列异常:{}", e)
  161. # 写入数据
  162. @classmethod
  163. def update_values(cls, log_path, crawler, sheetid, ranges, values):
  164. """
  165. 写入数据
  166. :param log_path: 日志路径
  167. :param crawler: 哪个爬虫
  168. :param sheetid:哪张工作表
  169. :param ranges:单元格范围
  170. :param values:写入的具体数据,list
  171. """
  172. update_values_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
  173. + cls.spreadsheettoken(crawler) + "/values_batch_update"
  174. headers = {
  175. "Authorization": "Bearer " + cls.get_token(log_path),
  176. "Content-Type": "application/json; charset=utf-8"
  177. }
  178. body = {
  179. "valueRanges": [
  180. {
  181. "range": sheetid + "!" + ranges,
  182. "values": values
  183. },
  184. ],
  185. }
  186. try:
  187. urllib3.disable_warnings()
  188. r = requests.post(url=update_values_url, headers=headers, json=body, proxies=proxies, verify=False)
  189. if log_path == "logs":
  190. Common.logger().info("写入数据:{}", r.json()["msg"])
  191. elif log_path == "person-logs":
  192. Common.person_logger().info("写入数据:{}", r.json()["msg"])
  193. except Exception as e:
  194. if log_path == "logs":
  195. Common.logger().error("写入数据异常:{}", e)
  196. elif log_path == "person-logs":
  197. Common.person_logger().error("写入数据异常:{}", e)
  198. # 合并单元格
  199. @classmethod
  200. def merge_cells(cls, log_path, crawler, sheetid, ranges):
  201. """
  202. 合并单元格
  203. :param log_path: 日志路径
  204. :param crawler: 哪个爬虫
  205. :param sheetid:哪张工作表
  206. :param ranges:需要合并的单元格范围
  207. """
  208. merge_cells_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
  209. + cls.spreadsheettoken(crawler) + "/merge_cells"
  210. headers = {
  211. "Authorization": "Bearer " + cls.get_token(log_path),
  212. "Content-Type": "application/json; charset=utf-8"
  213. }
  214. body = {
  215. "range": sheetid + "!" + ranges,
  216. "mergeType": "MERGE_ROWS"
  217. }
  218. try:
  219. urllib3.disable_warnings()
  220. r = requests.post(url=merge_cells_url, headers=headers, json=body, proxies=proxies, verify=False)
  221. if log_path == "logs":
  222. Common.logger().info("合并单元格:{}", r.json()["msg"])
  223. elif log_path == "person-logs":
  224. Common.person_logger().info("合并单元格:{}", r.json()["msg"])
  225. except Exception as e:
  226. if log_path == "logs":
  227. Common.logger().error("合并单元格异常:{}", e)
  228. elif log_path == "person-logs":
  229. Common.person_logger().error("合并单元格异常:{}", e)
  230. # 读取单元格数据
  231. @classmethod
  232. def get_range_value(cls, log_path, crawler, sheetid, cell):
  233. """
  234. 读取单元格内容
  235. :param log_path: 日志路径
  236. :param crawler: 哪个爬虫
  237. :param sheetid: 哪张工作表
  238. :param cell: 哪个单元格
  239. :return: 单元格内容
  240. """
  241. get_range_value_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
  242. + cls.spreadsheettoken(crawler) + "/values/" + sheetid + "!" + cell
  243. headers = {
  244. "Authorization": "Bearer " + cls.get_token(log_path),
  245. "Content-Type": "application/json; charset=utf-8"
  246. }
  247. params = {
  248. # valueRenderOption=ToString 可返回纯文本的值(数值类型除外);
  249. # valueRenderOption=FormattedValue 计算并格式化单元格;
  250. # valueRenderOption=Formula 单元格中含有公式时返回公式本身;
  251. # valueRenderOption=UnformattedValue 计算但不对单元格进行格式化。
  252. "valueRenderOption": "FormattedValue",
  253. # dateTimeRenderOption=FormattedString 计算并对时间日期按照其格式进行格式化,但不会对数字进行格式化,返回格式化后的字符串。
  254. "dateTimeRenderOption": "",
  255. # 返回的用户id类型,可选open_id,union_id
  256. "user_id_type": "open_id"
  257. }
  258. try:
  259. urllib3.disable_warnings()
  260. r = requests.get(url=get_range_value_url, headers=headers, params=params, proxies=proxies, verify=False)
  261. return r.json()["data"]["valueRange"]["values"][0]
  262. except Exception as e:
  263. if log_path == "logs":
  264. Common.logger().error("读取单元格数据异常:{}", e)
  265. elif log_path == "person-logs":
  266. Common.person_logger().error("读取单元格数据异常:{}", e)
  267. # 删除行或列,可选 ROWS、COLUMNS
  268. @classmethod
  269. def dimension_range(cls, log_path, crawler, sheetid, major_dimension, startindex, endindex):
  270. """
  271. 删除行或列
  272. :param log_path: 日志路径
  273. :param crawler: 哪个爬虫
  274. :param sheetid:工作表
  275. :param major_dimension:默认 ROWS ,可选 ROWS、COLUMNS
  276. :param startindex:开始的位置
  277. :param endindex:结束的位置
  278. :return:
  279. """
  280. dimension_range_url = "https://open.feishu.cn/open-apis/sheets/v2/spreadsheets/" \
  281. + cls.spreadsheettoken(crawler) + "/dimension_range"
  282. headers = {
  283. "Authorization": "Bearer " + cls.get_token(log_path),
  284. "Content-Type": "application/json; charset=utf-8"
  285. }
  286. body = {
  287. "dimension": {
  288. "sheetId": sheetid,
  289. "majorDimension": major_dimension,
  290. "startIndex": startindex,
  291. "endIndex": endindex
  292. }
  293. }
  294. try:
  295. urllib3.disable_warnings()
  296. r = requests.delete(url=dimension_range_url, headers=headers, json=body, proxies=proxies, verify=False)
  297. if log_path == "logs":
  298. Common.logger().info("删除视频数据:{}", r.json()["msg"])
  299. elif log_path == "person-logs":
  300. Common.person_logger().info("删除视频数据:{}", r.json()["msg"])
  301. except Exception as e:
  302. if log_path == "logs":
  303. Common.logger().error("删除视频数据异常:{}", e)
  304. elif log_path == "person-logs":
  305. Common.person_logger().error("删除视频数据异常:{}", e)
  306. if __name__ == "__main__":
  307. feishu = Feishu()
  308. print(feishu.get_range_value("person-log", "xiaoniangao", "dzcWHw", "B3:B3")[0])
  309. print(feishu.get_range_value("person-log", "xiaoniangao", "dzcWHw", "B4:B4")[0])
  310. print(feishu.get_range_value("person-log", "xiaoniangao", "dzcWHw", "C5:C5")[0][0]["link"])
  311. print(feishu.get_range_value("person-log", "xiaoniangao", "dzcWHw", "B6:B6")[0])
  312. print(feishu.get_range_value("person-log", "xiaoniangao", "dzcWHw", "B7:B7")[0])
  313. # # 获取飞书api token
  314. # feishu.get_token()
  315. # 获取表格元数据
  316. # feishu.get_metainfo()
  317. # 读取工作表中所有数据
  318. # print(feishu.get_values_batch("xiaoniangao", "ba0da4"))
  319. # print(len(feishu.get_values_batch("k2rKkv")))
  320. # for i in range(3, len(feishu.get_values_batch("k2rKkv"))+1):
  321. # print(feishu.get_range_value("k2rKkv", "A" + str(i) + ":" + "A" + str(i))[0])
  322. # print(feishu.update_hour_list_values("k2rKkv", "G" + str(i) + ":" + "H" + str(i), [["333"]]))
  323. # time.sleep(0.5)
  324. # feishu.get_range_value("k2rKkv", "F3:F3")[0]
  325. # print(type(feishu.get_range_value("k2rKkv", "H19:H19")[0].split(" ")[-1].split(":")[0]))
  326. # print(feishu.get_range_value("k2rKkv", "H19:H19")[0])
  327. # print(int(feishu.get_range_value("xiaoniangao", "ba0da4", "G6:G6")[0].split(" ")[-1].split(":")[0]))
  328. # print(feishu.get_range_value("xiaoniangao", "ba0da4", "G6:G6")[0].split(" ")[0])
  329. # feishu.update_values("logs", "xiaoniangao", "ba0da4", "H4:H4", [["2022-05-18 21:14:27"]])
  330. # 看一看+工作表,插入首行
  331. # print(feishu.insert_columns("k2rKkv", "COLUMNS", 6, 9))
  332. # print(feishu.update_hour_list_values("k2rKkv"))
  333. # print(feishu.merge_cells("k2rKkv", "G1:I1"))
  334. #
  335. # # 看一看+工作表,首行写入数据
  336. # print(feishu.update_values("Y8N3Vl", "a1", "b1", "c1", "d1", "e1", "f1", "g1",
  337. # "h1", "i1", "j1", "k1", "l1", "m1", "n1", "o1"))
  338. # 查询单元格内容
  339. # print(type(feishu.get_range_value("k2rKkv", "G1:G1")[0]))
  340. #
  341. # 删除行或列,可选 ROWS、COLUMNS
  342. # feishu.dimension_range("k2rKkv", "ROWS", 3, 3)
  343. pass