|
@@ -14,7 +14,7 @@ class KS:
|
|
|
|
|
|
@classmethod
|
|
|
def get_share_count(cls, v_id):
|
|
|
- url = "http://8.217.190.241:8888/crawler/kuai_shou/detail"
|
|
|
+ url = "http://47.236.68.175:8889/crawler/kuai_shou/detail"
|
|
|
|
|
|
payload = json.dumps({
|
|
|
"content_id": v_id
|
|
@@ -109,40 +109,39 @@ class KS:
|
|
|
video_id = feeds[i].get("photo", {}).get("id", "")
|
|
|
status = sqlCollect.is_used(task_mark, video_id, mark, channel_id)
|
|
|
|
|
|
- # share_count = cls.get_share_count(video_id)
|
|
|
+ share_count = cls.get_share_count(video_id)
|
|
|
old_title = feeds[i].get("photo", {}).get("caption")
|
|
|
cover_url = feeds[i].get('photo', {}).get('coverUrl', "")
|
|
|
video_url = feeds[i].get('photo', {}).get('photoUrl', "")
|
|
|
view_count = int(feeds[i].get('photo', {}).get('viewCount', 0))
|
|
|
realLikeCount = int(feeds[i].get('photo', {}).get('realLikeCount', 0))
|
|
|
- # video_percent = '%.4f' % (share_count / view_count)
|
|
|
- video_percent = 0
|
|
|
+ video_percent = '%.4f' % (share_count / view_count)
|
|
|
|
|
|
duration = dataHelp.video_duration(video_url)
|
|
|
- # log_data = f"user:{url_id},,video_id:{video_id},,video_url:{video_url},,original_title:{old_title},,share_count:{share_count},,view_count:{view_count},,duration:{duration}"
|
|
|
- log_data = f"user:{url_id},,video_id:{video_id},,video_url:{video_url},,original_title:{old_title},,view_count:{view_count},,duration:{duration}"
|
|
|
+ log_data = f"user:{url_id},,video_id:{video_id},,video_url:{video_url},,original_title:{old_title},,share_count:{share_count},,view_count:{view_count},,duration:{duration}"
|
|
|
+ # log_data = f"user:{url_id},,video_id:{video_id},,video_url:{video_url},,original_title:{old_title},,view_count:{view_count},,duration:{duration}"
|
|
|
|
|
|
AliyunLogger.logging(channel_id, name, url_id, video_id, "扫描到一条视频", "2001", log_data)
|
|
|
- # Common.logger("ks").info(
|
|
|
- # f"扫描:{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
|
|
|
+ Common.logger("ks").info(
|
|
|
+ f"扫描:{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
|
|
|
if status:
|
|
|
AliyunLogger.logging(channel_id, name, url_id, video_id, "该视频已改造过", "2001", log_data)
|
|
|
continue
|
|
|
special = float(0.001)
|
|
|
- # if float(video_percent) < special:
|
|
|
- # AliyunLogger.logging(channel_id, name, url_id, video_id, "不符合规则:分享/浏览小于0.001", "2003", log_data)
|
|
|
- # Common.logger("ks").info(
|
|
|
- # f"不符合规则:{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
|
|
|
- # continue
|
|
|
- # if share_count < 500:
|
|
|
- # AliyunLogger.logging(channel_id, name, url_id, video_id, "不符合规则:分享小于500", "2003", log_data)
|
|
|
- # Common.logger("ks").info(
|
|
|
- # f"不符合规则:{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
|
|
|
- # continue
|
|
|
+ if float(video_percent) < special:
|
|
|
+ AliyunLogger.logging(channel_id, name, url_id, video_id, "不符合规则:分享/浏览小于0.001", "2003", log_data)
|
|
|
+ Common.logger("ks").info(
|
|
|
+ f"不符合规则:{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
|
|
|
+ continue
|
|
|
+ if share_count < 500:
|
|
|
+ AliyunLogger.logging(channel_id, name, url_id, video_id, "不符合规则:分享小于500", "2003", log_data)
|
|
|
+ Common.logger("ks").info(
|
|
|
+ f"不符合规则:{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
|
|
|
+ continue
|
|
|
if duration < 30 or duration > 720:
|
|
|
AliyunLogger.logging(channel_id, name, url_id, video_id, "不符合规则:时长不符合规则大于720秒/小于30秒", "2003", log_data)
|
|
|
- # Common.logger("ks").info(
|
|
|
- # f"不符合规则:{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
|
|
|
+ Common.logger("ks").info(
|
|
|
+ f"不符合规则:{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
|
|
|
continue
|
|
|
AliyunLogger.logging(channel_id, name, url_id, video_id, "符合规则等待改造", "2004", log_data)
|
|
|
all_data = {"video_id": video_id, "cover": cover_url, "video_url": video_url, "rule": video_percent, "old_title": old_title}
|