|
@@ -101,7 +101,9 @@ class XiaoNianGaoAuthor:
|
|
try:
|
|
try:
|
|
message = f"扫描到一条视频"
|
|
message = f"扫描到一条视频"
|
|
print(message)
|
|
print(message)
|
|
- self.process_video_obj(video_obj, user_dict)
|
|
|
|
|
|
+ flag = self.process_video_obj(video_obj, user_dict)
|
|
|
|
+ if not flag:
|
|
|
|
+ return
|
|
except Exception as e:
|
|
except Exception as e:
|
|
message = "抓取单条视频异常, 报错原因是: {}".format(e)
|
|
message = "抓取单条视频异常, 报错原因是: {}".format(e)
|
|
print(message)
|
|
print(message)
|
|
@@ -160,7 +162,15 @@ class XiaoNianGaoAuthor:
|
|
"strategy": self.mode,
|
|
"strategy": self.mode,
|
|
"out_video_id": video_obj.get("vid", ""),
|
|
"out_video_id": video_obj.get("vid", ""),
|
|
}
|
|
}
|
|
- print(video_dict)
|
|
|
|
|
|
+ if (
|
|
|
|
+ int(time.time()) - publish_time_stamp
|
|
|
|
+ > 3600 * 24 * int(self.rule_dict.get("period", {}).get("max", 1000))
|
|
|
|
+ ):
|
|
|
|
+ message = "发布时间超过{}天".format(
|
|
|
|
+ int(self.rule_dict.get("period", {}).get("max", 1000))
|
|
|
|
+ )
|
|
|
|
+ print(message)
|
|
|
|
+ return False
|
|
pipeline = PiaoQuanPipelineTest(
|
|
pipeline = PiaoQuanPipelineTest(
|
|
platform=self.platform,
|
|
platform=self.platform,
|
|
mode=self.mode,
|
|
mode=self.mode,
|
|
@@ -176,11 +186,12 @@ class XiaoNianGaoAuthor:
|
|
video_dict["crawler_rule"] = json.dumps(self.rule_dict)
|
|
video_dict["crawler_rule"] = json.dumps(self.rule_dict)
|
|
video_dict["user_id"] = user_dict["uid"]
|
|
video_dict["user_id"] = user_dict["uid"]
|
|
video_dict["publish_time"] = video_dict["publish_time_str"]
|
|
video_dict["publish_time"] = video_dict["publish_time_str"]
|
|
- # print(video_dict)
|
|
|
|
- self.mq.send_msg(video_dict)
|
|
|
|
|
|
+ print(video_dict)
|
|
|
|
+ # self.mq.send_msg(video_dict)
|
|
self.download_count += 1
|
|
self.download_count += 1
|
|
message = "成功发送 MQ 至 ETL"
|
|
message = "成功发送 MQ 至 ETL"
|
|
print(message)
|
|
print(message)
|
|
|
|
+ return True
|
|
|
|
|
|
|
|
|
|
if __name__ == "__main__":
|
|
if __name__ == "__main__":
|