1 gadu atpakaļ · c5749d3e68
--- a/data_channel/dy_keyword.py
+++ b/data_channel/dy_keyword.py
@@ -15,7 +15,7 @@ class DyKeyword:
 
				         share_count_rule = 0
			
 
				         special = 0
			
 
				         short_duration_rule = 0
			
 
				-        url = "http://8.217.190.241:8888/crawler/dou_yin/keyword"
			
 
				+        url = "http://47.236.68.175:8889/crawler/dou_yin/keyword"
			
 
				         list = []
			
 
				         payload = json.dumps({
			
 
				             "keyword": keyword,
			
--- a/data_channel/dy_ls.py
+++ b/data_channel/dy_ls.py
@@ -11,7 +11,7 @@ from common.sql_help import sqlCollect
 
				 class DYLS:
			
 
				     @classmethod
			
 
				     def get_dy_zr_list(cls, task_mark, url_id, number, mark, channel_id, name):
			
 
				-        url = "http://8.217.190.241:8888/crawler/dou_yin/blogger"
			
 
				+        url = "http://47.236.68.175:8889/crawler/dou_yin/blogger"
			
 
				         list = []
			
 
				         next_cursor = ''
			
 
				         for i in range(20):
			
@@ -105,7 +105,7 @@ class DYLS:
 
				             list = []
			
 
				             try:
			
 
				                 #  抖查查
			
 
				-                url = "http://8.217.190.241:8888/crawler/dou_yin/blogger"
			
 
				+                url = "http://47.236.68.175:8889/crawler/dou_yin/blogger"
			
 
				                 payload = json.dumps({
			
 
				                     "account_id": url_id,
			
 
				                     "source": "抖查查",
			
@@ -165,7 +165,7 @@ class DYLS:
 
				 
			
 
				     @classmethod
			
 
				     def get_video(cls, video_id):
			
 
				-        url = "http://8.217.190.241:8888/crawler/dou_yin/detail"
			
 
				+        url = "http://47.236.68.175:8889/crawler/dou_yin/detail"
			
 
				         for i in range(3):
			
 
				             payload = json.dumps({
			
 
				                 "content_id": str(video_id)
			
--- a/data_channel/ks_keyword.py
+++ b/data_channel/ks_keyword.py
@@ -18,7 +18,7 @@ class KsKeyword:
 
				         special = 0
			
 
				         short_duration_rule = 0
			
 
				 
			
 
				-        url = "http://8.217.190.241:8888/crawler/kuai_shou/keyword"
			
 
				+        url = "http://47.236.68.175:8889/crawler/kuai_shou/keyword"
			
 
				         list = []
			
 
				 
			
 
				         payload = json.dumps({
			
@@ -116,7 +116,7 @@ class KsKeyword:
 
				 
			
 
				     @classmethod
			
 
				     def get_video(cls, video_id):
			
 
				-        url = "http://8.217.190.241:8888/crawler/kuai_shou/detail"
			
 
				+        url = "http://47.236.68.175:8889/crawler/kuai_shou/detail"
			
 
				 
			
 
				         payload = json.dumps({
			
 
				             "content_id": str(video_id)
			
--- a/data_channel/ks_ls.py
+++ b/data_channel/ks_ls.py
@@ -10,7 +10,7 @@ class KSLS:
 
				     @classmethod
			
 
				     def get_ksls_list(cls, task_mark, url_id, number, mark, channel_id, name):
			
 
				         #  快手app
			
 
				-        url = "http://8.217.190.241:8888/crawler/kuai_shou/blogger"
			
 
				+        url = "http://47.236.68.175:8889/crawler/kuai_shou/blogger"
			
 
				         next_cursor = ""
			
 
				         for i in range(20):
			
 
				             payload = json.dumps({
			
@@ -93,7 +93,7 @@ class KSLS:
 
				 
			
 
				     @classmethod
			
 
				     def get_video(cls, video_id):
			
 
				-        url = "http://8.217.190.241:8888/crawler/kuai_shou/detail"
			
 
				+        url = "http://47.236.68.175:8889/crawler/kuai_shou/detail"
			
 
				 
			
 
				         payload = json.dumps({
			
 
				             "content_id": str(video_id)
			
--- a/data_channel/kuaishou.py
+++ b/data_channel/kuaishou.py
@@ -14,7 +14,7 @@ class KS:
 
				 
			
 
				     @classmethod
			
 
				     def get_share_count(cls, v_id):
			
 
				-        url = "http://8.217.190.241:8888/crawler/kuai_shou/detail"
			
 
				+        url = "http://47.236.68.175:8889/crawler/kuai_shou/detail"
			
 
				 
			
 
				         payload = json.dumps({
			
 
				             "content_id": v_id
			
@@ -109,40 +109,39 @@ class KS:
 
				                     video_id = feeds[i].get("photo", {}).get("id", "")
			
 
				                     status = sqlCollect.is_used(task_mark, video_id, mark, channel_id)
			
 
				 
			
 
				-                    # share_count = cls.get_share_count(video_id)
			
 
				+                    share_count = cls.get_share_count(video_id)
			
 
				                     old_title = feeds[i].get("photo", {}).get("caption")
			
 
				                     cover_url = feeds[i].get('photo', {}).get('coverUrl', "")
			
 
				                     video_url = feeds[i].get('photo', {}).get('photoUrl', "")
			
 
				                     view_count = int(feeds[i].get('photo', {}).get('viewCount', 0))
			
 
				                     realLikeCount = int(feeds[i].get('photo', {}).get('realLikeCount', 0))
			
 
				-                    # video_percent = '%.4f' % (share_count / view_count)
			
 
				-                    video_percent = 0
			
 
				+                    video_percent = '%.4f' % (share_count / view_count if view_count else 0)  # viewCount defaults to 0; avoid ZeroDivisionError
			
 
				 
			
 
				                     duration = dataHelp.video_duration(video_url)
			
 
				-                    # log_data = f"user:{url_id},,video_id:{video_id},,video_url:{video_url},,original_title:{old_title},,share_count:{share_count},,view_count:{view_count},,duration:{duration}"
			
 
				-                    log_data = f"user:{url_id},,video_id:{video_id},,video_url:{video_url},,original_title:{old_title},,view_count:{view_count},,duration:{duration}"
			
 
				+                    log_data = f"user:{url_id},,video_id:{video_id},,video_url:{video_url},,original_title:{old_title},,share_count:{share_count},,view_count:{view_count},,duration:{duration}"
			
 
				+                    # log_data = f"user:{url_id},,video_id:{video_id},,video_url:{video_url},,original_title:{old_title},,view_count:{view_count},,duration:{duration}"
			
 
				 
			
 
				                     AliyunLogger.logging(channel_id, name, url_id, video_id, "扫描到一条视频", "2001", log_data)
			
 
				-                    # Common.logger("ks").info(
			
 
				-                    #     f"扫描：{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
			
 
				+                    Common.logger("ks").info(
			
 
				+                        f"扫描：{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
			
 
				                     if status:
			
 
				                         AliyunLogger.logging(channel_id, name, url_id, video_id, "该视频已改造过", "2001", log_data)
			
 
				                         continue
			
 
				                     special = float(0.001)
			
 
				-                    # if float(video_percent) < special:
			
 
				-                    #     AliyunLogger.logging(channel_id, name, url_id, video_id, "不符合规则:分享/浏览小于0.001", "2003", log_data)
			
 
				-                    #     Common.logger("ks").info(
			
 
				-                    #         f"不符合规则：{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
			
 
				-                    #     continue
			
 
				-                    # if share_count < 500:
			
 
				-                    #     AliyunLogger.logging(channel_id, name, url_id, video_id, "不符合规则:分享小于500", "2003", log_data)
			
 
				-                    #     Common.logger("ks").info(
			
 
				-                    #         f"不符合规则：{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
			
 
				-                    #     continue
			
 
				+                    if float(video_percent) < special:
			
 
				+                        AliyunLogger.logging(channel_id, name, url_id, video_id, "不符合规则:分享/浏览小于0.001", "2003", log_data)
			
 
				+                        Common.logger("ks").info(
			
 
				+                            f"不符合规则：{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
			
 
				+                        continue
			
 
				+                    if share_count < 500:
			
 
				+                        AliyunLogger.logging(channel_id, name, url_id, video_id, "不符合规则:分享小于500", "2003", log_data)
			
 
				+                        Common.logger("ks").info(
			
 
				+                            f"不符合规则：{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
			
 
				+                        continue
			
 
				                     if duration < 30 or duration > 720:
			
 
				                         AliyunLogger.logging(channel_id, name, url_id, video_id, "不符合规则:时长不符合规则大于720秒/小于30秒", "2003", log_data)
			
 
				-                        # Common.logger("ks").info(
			
 
				-                        #     f"不符合规则：{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
			
 
				+                        Common.logger("ks").info(
			
 
				+                            f"不符合规则：{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
			
 
				                         continue
			
 
				                     AliyunLogger.logging(channel_id, name, url_id, video_id, "符合规则等待改造", "2004", log_data)
			
 
				                     all_data = {"video_id": video_id, "cover": cover_url, "video_url": video_url, "rule": video_percent, "old_title": old_title}