|
@@ -22,7 +22,7 @@ from common.scheduling_db import MysqlHelper
|
|
|
from common.common import Common
|
|
|
from common.feishu import Feishu
|
|
|
from common.publish import Publish
|
|
|
-from common.public import get_config_from_mysql, download_rule
|
|
|
+from common.public import get_config_from_mysql, download_rule, get_title_score
|
|
|
from common.userAgent import get_random_user_agent
|
|
|
|
|
|
|
|
@@ -645,11 +645,19 @@ class XiguasearchScheduling:
|
|
|
Common.logger(log_type, crawler).info('视频已下载\n')
|
|
|
Common.logging(log_type, crawler, env, '视频已下载\n')
|
|
|
else:
|
|
|
+ title_score = get_title_score(log_type, "kuaishou", "16QspO", "0usaDk", video_dict["video_title"])
|
|
|
+ if title_score <= 0.3:
|
|
|
+ Common.logger(log_type, crawler).info(f"权重分:{title_score}<=0.3\n")
|
|
|
+ Common.logging(log_type, crawler, env, f"权重分:{title_score}<=0.3\n")
|
|
|
+ continue
|
|
|
+ Common.logger(log_type, crawler).info(f"权重分:{title_score}>0.3\n")
|
|
|
+ Common.logging(log_type, crawler, env, f"权重分:{title_score}>0.3\n")
|
|
|
cls.download_publish(log_type=log_type,
|
|
|
crawler=crawler,
|
|
|
user_dict=user_dict,
|
|
|
video_dict=video_dict,
|
|
|
rule_dict=rule_dict,
|
|
|
+ title_score=title_score,
|
|
|
env=env)
|
|
|
except Exception as e:
|
|
|
Common.logger(log_type, crawler).warning(f"抓取单条视频异常:{e}\n")
|
|
@@ -668,7 +676,7 @@ class XiguasearchScheduling:
|
|
|
|
|
|
# 下载 / 上传
|
|
|
@classmethod
|
|
|
- def download_publish(cls, log_type, crawler, user_dict, video_dict, rule_dict, env):
|
|
|
+ def download_publish(cls, log_type, crawler, user_dict, video_dict, rule_dict, title_score, env):
|
|
|
|
|
|
Common.download_method(log_type=log_type, crawler=crawler, text='xigua_video',
|
|
|
title=video_dict['video_title'], url=video_dict['video_url'])
|
|
@@ -769,7 +777,8 @@ class XiguasearchScheduling:
|
|
|
|
|
|
# 视频信息写入飞书
|
|
|
Feishu.insert_columns(log_type, crawler, "BUNvGC", "ROWS", 1, 2)
|
|
|
- values = [[user_dict["link"],
|
|
|
+ values = [[title_score,
|
|
|
+ user_dict["link"],
|
|
|
time.strftime("%Y-%m-%d %H:%M:%S", time.localtime(int(time.time()))),
|
|
|
"关键词搜索",
|
|
|
video_dict['video_title'],
|
|
@@ -790,7 +799,7 @@ class XiguasearchScheduling:
|
|
|
video_dict['video_url'],
|
|
|
video_dict['audio_url']]]
|
|
|
time.sleep(0.5)
|
|
|
- Feishu.update_values(log_type, crawler, "BUNvGC", "E2:Z2", values)
|
|
|
+ Feishu.update_values(log_type, crawler, "BUNvGC", "D2:Z2", values)
|
|
|
Common.logger(log_type, crawler).info('视频信息写入飞书完成\n')
|
|
|
Common.logging(log_type, crawler, env, '视频信息写入飞书完成\n')
|
|
|
|