wangkun 1 yıl önce
ebeveyn
işleme
c76c241d45

+ 1 - 0
README.MD

@@ -250,4 +250,5 @@ aliyun_python_sdk==2.2.0
 opencv-python~=4.8.0.74
 # pip3 install scikit-learn
 scikit-learn~=1.3.0
+# pip3 install beautifulsoup4
 ```

+ 4 - 0
common/publish.py

@@ -266,6 +266,10 @@ class Publish:
             return 'ZHIQINGZONGQUN'
         elif crawler == 'zhiqingtiantiankan':
             return 'ZHIQINGZONGQUN'
+        elif crawler == 'haitunzhufu':
+            return 'HAITUNZHUFU'
+        elif crawler == 'zhufuquanzi':
+            return 'ZHUFUQUANZI'
 
         elif crawler == 'kanyikan':
             return 'KANYIKAN'

+ 11 - 1
haitunzhufu/haitunzhufu_recommend/haitunzhufu_recommend2.py

@@ -3,6 +3,7 @@
 # @Time: 2023/9/13
 import json
 import os
+import random
 import re
 import shutil
 import sys
@@ -227,6 +228,15 @@ class HTZFRecommend:
             Common.logger(log_type, crawler).info('已抓取完一组视频,休眠5秒\n')
             time.sleep(5)
 
+    @classmethod
+    def get_our_uid(cls, log_type, crawler, env):
+        """Pick a random publishing uid registered for this crawler.
+
+        Queries ``crawler_user_v3`` for every row whose ``source`` equals
+        ``crawler`` and returns the ``uid`` of one row chosen at random.
+
+        :param log_type: forwarded to ``MysqlHelper.get_values``.
+        :param crawler: crawler name; matched against the ``source`` column.
+        :param env: forwarded to ``MysqlHelper.get_values``.
+        :return: the ``uid`` value of one randomly selected row.
+        :raises IndexError: if no row matches ``crawler``.
+        """
+        # NOTE(review): ``crawler`` is interpolated straight into the SQL text;
+        # this assumes it is a trusted, internally configured name -- confirm.
+        select_sql = f""" SELECT uid FROM crawler_user_v3 WHERE `source`="{crawler}"; """
+        rows = MysqlHelper.get_values(log_type, crawler, select_sql, env, action="")
+        uid_list = [row["uid"] for row in rows]
+        if not uid_list:
+            # random.choice() on an empty list raises a bare IndexError; keep
+            # the exception type but say which crawler has no users.
+            raise IndexError(f"no uid found in crawler_user_v3 for source {crawler!r}")
+        return random.choice(uid_list)
+
     @classmethod
     def download_publish(cls, log_type, crawler, video_dict, env):
         Common.download_method(log_type=log_type, crawler=crawler, text='video', title=video_dict['video_title'],
@@ -251,7 +261,7 @@ class HTZFRecommend:
         our_video_id = Publish.upload_and_publish(log_type=log_type,
                                                   crawler=crawler,
                                                   strategy="推荐榜爬虫策略",
-                                                  our_uid="recommend",
+                                                  our_uid=cls.get_our_uid(log_type, crawler, env),
                                                   env=env,
                                                   oss_endpoint="out")
         if env == 'dev':