|
@@ -30,8 +30,9 @@ class KanyikanRecommend:
|
|
def get_videoList(cls, log_type, crawler, our_uid, rule_dict, env):
|
|
def get_videoList(cls, log_type, crawler, our_uid, rule_dict, env):
|
|
mq = MQ(topic_name="topic_crawler_etl_" + env)
|
|
mq = MQ(topic_name="topic_crawler_etl_" + env)
|
|
try:
|
|
try:
|
|
- Common.logger(log_type, crawler).info(f"正在抓取列表页")
|
|
|
|
|
|
+ Common.logger(log_type, crawler).info(f"正在抓取列表页{crawler}")
|
|
Common.logging(log_type, crawler, env, f"正在抓取列表页")
|
|
Common.logging(log_type, crawler, env, f"正在抓取列表页")
|
|
|
|
+ Common.logger(log_type, crawler).info(f"Test{crawler}")
|
|
session = Common.get_session(log_type, crawler, env)
|
|
session = Common.get_session(log_type, crawler, env)
|
|
if session is None:
|
|
if session is None:
|
|
time.sleep(1)
|
|
time.sleep(1)
|
|
@@ -62,6 +63,7 @@ class KanyikanRecommend:
|
|
}
|
|
}
|
|
urllib3.disable_warnings()
|
|
urllib3.disable_warnings()
|
|
response = requests.get(url=url, headers=header, params=params, proxies=proxies, verify=False)
|
|
response = requests.get(url=url, headers=header, params=params, proxies=proxies, verify=False)
|
|
|
|
+ # print(response)
|
|
if "data" not in response.text:
|
|
if "data" not in response.text:
|
|
Common.logger(log_type, crawler).info("获取视频list时,session过期,随机睡眠 31-50 秒")
|
|
Common.logger(log_type, crawler).info("获取视频list时,session过期,随机睡眠 31-50 秒")
|
|
Common.logging(log_type, crawler, env, "获取视频list时,session过期,随机睡眠 31-50 秒")
|
|
Common.logging(log_type, crawler, env, "获取视频list时,session过期,随机睡眠 31-50 秒")
|
|
@@ -164,9 +166,16 @@ class KanyikanRecommend:
|
|
|
|
|
|
|
|
|
|
if __name__ == "__main__":
|
|
if __name__ == "__main__":
|
|
- print(get_config_from_mysql(log_type="recommend",
|
|
|
|
- source="kanyikan",
|
|
|
|
- env="dev",
|
|
|
|
- text="filter",
|
|
|
|
- action=""))
|
|
|
|
- pass
|
|
|
|
|
|
+ KanyikanRecommend.get_videoList(
|
|
|
|
+ log_type="recommend",
|
|
|
|
+ crawler="kanyikan",
|
|
|
|
+ env="prod",
|
|
|
|
+ rule_dict={'share_cnt': {'min': 300, 'max': 0}},
|
|
|
|
+ our_uid=64080779
|
|
|
|
+ )
|
|
|
|
+ # print(get_config_from_mysql(log_type="recommend",
|
|
|
|
+ # source="kanyikan",
|
|
|
|
+ # env="dev",
|
|
|
|
+ # text="filter",
|
|
|
|
+ # action=""))
|
|
|
|
+ # pass
|