zhangyong 5 mēneši atpakaļ
vecāks
revīzija
c5749d3e68

+ 1 - 1
data_channel/dy_keyword.py

@@ -15,7 +15,7 @@ class DyKeyword:
         share_count_rule = 0
         special = 0
         short_duration_rule = 0
-        url = "http://8.217.190.241:8888/crawler/dou_yin/keyword"
+        url = "http://47.236.68.175:8889/crawler/dou_yin/keyword"
         list = []
         payload = json.dumps({
             "keyword": keyword,

+ 3 - 3
data_channel/dy_ls.py

@@ -11,7 +11,7 @@ from common.sql_help import sqlCollect
 class DYLS:
     @classmethod
     def get_dy_zr_list(cls, task_mark, url_id, number, mark, channel_id, name):
-        url = "http://8.217.190.241:8888/crawler/dou_yin/blogger"
+        url = "http://47.236.68.175:8889/crawler/dou_yin/blogger"
         list = []
         next_cursor = ''
         for i in range(20):
@@ -105,7 +105,7 @@ class DYLS:
             list = []
             try:
                 #  抖查查
-                url = "http://8.217.190.241:8888/crawler/dou_yin/blogger"
+                url = "http://47.236.68.175:8889/crawler/dou_yin/blogger"
                 payload = json.dumps({
                     "account_id": url_id,
                     "source": "抖查查",
@@ -165,7 +165,7 @@ class DYLS:
 
     @classmethod
     def get_video(cls, video_id):
-        url = "http://8.217.190.241:8888/crawler/dou_yin/detail"
+        url = "http://47.236.68.175:8889/crawler/dou_yin/detail"
         for i in range(3):
             payload = json.dumps({
                 "content_id": str(video_id)

+ 2 - 2
data_channel/ks_keyword.py

@@ -18,7 +18,7 @@ class KsKeyword:
         special = 0
         short_duration_rule = 0
 
-        url = "http://8.217.190.241:8888/crawler/kuai_shou/keyword"
+        url = "http://47.236.68.175:8889/crawler/kuai_shou/keyword"
         list = []
 
         payload = json.dumps({
@@ -116,7 +116,7 @@ class KsKeyword:
 
     @classmethod
     def get_video(cls, video_id):
-        url = "http://8.217.190.241:8888/crawler/kuai_shou/detail"
+        url = "http://47.236.68.175:8889/crawler/kuai_shou/detail"
 
         payload = json.dumps({
             "content_id": str(video_id)

+ 2 - 2
data_channel/ks_ls.py

@@ -10,7 +10,7 @@ class KSLS:
     @classmethod
     def get_ksls_list(cls, task_mark, url_id, number, mark, channel_id, name):
         #  快手app
-        url = "http://8.217.190.241:8888/crawler/kuai_shou/blogger"
+        url = "http://47.236.68.175:8889/crawler/kuai_shou/blogger"
         next_cursor = ""
         for i in range(20):
             payload = json.dumps({
@@ -93,7 +93,7 @@ class KSLS:
 
     @classmethod
     def get_video(cls, video_id):
-        url = "http://8.217.190.241:8888/crawler/kuai_shou/detail"
+        url = "http://47.236.68.175:8889/crawler/kuai_shou/detail"
 
         payload = json.dumps({
             "content_id": str(video_id)

+ 19 - 20
data_channel/kuaishou.py

@@ -14,7 +14,7 @@ class KS:
 
     @classmethod
     def get_share_count(cls, v_id):
-        url = "http://8.217.190.241:8888/crawler/kuai_shou/detail"
+        url = "http://47.236.68.175:8889/crawler/kuai_shou/detail"
 
         payload = json.dumps({
             "content_id": v_id
@@ -109,40 +109,39 @@ class KS:
                     video_id = feeds[i].get("photo", {}).get("id", "")
                     status = sqlCollect.is_used(task_mark, video_id, mark, channel_id)
 
-                    # share_count = cls.get_share_count(video_id)
+                    share_count = cls.get_share_count(video_id)
                     old_title = feeds[i].get("photo", {}).get("caption")
                     cover_url = feeds[i].get('photo', {}).get('coverUrl', "")
                     video_url = feeds[i].get('photo', {}).get('photoUrl', "")
                     view_count = int(feeds[i].get('photo', {}).get('viewCount', 0))
                     realLikeCount = int(feeds[i].get('photo', {}).get('realLikeCount', 0))
-                    # video_percent = '%.4f' % (share_count / view_count)
-                    video_percent = 0
+                    video_percent = '%.4f' % (share_count / view_count)
 
                     duration = dataHelp.video_duration(video_url)
-                    # log_data = f"user:{url_id},,video_id:{video_id},,video_url:{video_url},,original_title:{old_title},,share_count:{share_count},,view_count:{view_count},,duration:{duration}"
-                    log_data = f"user:{url_id},,video_id:{video_id},,video_url:{video_url},,original_title:{old_title},,view_count:{view_count},,duration:{duration}"
+                    log_data = f"user:{url_id},,video_id:{video_id},,video_url:{video_url},,original_title:{old_title},,share_count:{share_count},,view_count:{view_count},,duration:{duration}"
+                    # log_data = f"user:{url_id},,video_id:{video_id},,video_url:{video_url},,original_title:{old_title},,view_count:{view_count},,duration:{duration}"
 
                     AliyunLogger.logging(channel_id, name, url_id, video_id, "扫描到一条视频", "2001", log_data)
-                    # Common.logger("ks").info(
-                    #     f"扫描:{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
+                    Common.logger("ks").info(
+                        f"扫描:{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
                     if status:
                         AliyunLogger.logging(channel_id, name, url_id, video_id, "该视频已改造过", "2001", log_data)
                         continue
                     special = float(0.001)
-                    # if float(video_percent) < special:
-                    #     AliyunLogger.logging(channel_id, name, url_id, video_id, "不符合规则:分享/浏览小于0.001", "2003", log_data)
-                    #     Common.logger("ks").info(
-                    #         f"不符合规则:{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
-                    #     continue
-                    # if share_count < 500:
-                    #     AliyunLogger.logging(channel_id, name, url_id, video_id, "不符合规则:分享小于500", "2003", log_data)
-                    #     Common.logger("ks").info(
-                    #         f"不符合规则:{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
-                    #     continue
+                    if float(video_percent) < special:
+                        AliyunLogger.logging(channel_id, name, url_id, video_id, "不符合规则:分享/浏览小于0.001", "2003", log_data)
+                        Common.logger("ks").info(
+                            f"不符合规则:{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
+                        continue
+                    if share_count < 500:
+                        AliyunLogger.logging(channel_id, name, url_id, video_id, "不符合规则:分享小于500", "2003", log_data)
+                        Common.logger("ks").info(
+                            f"不符合规则:{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
+                        continue
                     if duration < 30 or duration > 720:
                         AliyunLogger.logging(channel_id, name, url_id, video_id, "不符合规则:时长不符合规则大于720秒/小于30秒", "2003", log_data)
-                        # Common.logger("ks").info(
-                        #     f"不符合规则:{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
+                        Common.logger("ks").info(
+                            f"不符合规则:{task_mark},用户主页id:{url_id},视频id{video_id} ,播放数:{view_count} ,分享数:{share_count},时长:{duration} ")
                         continue
                     AliyunLogger.logging(channel_id, name, url_id, video_id, "符合规则等待改造", "2004", log_data)
                     all_data = {"video_id": video_id, "cover": cover_url, "video_url": video_url, "rule": video_percent, "old_title": old_title}