Ver código fonte

小年糕账户数据源获取变更

zhangliang 1 mês atrás
pai
commit
dc393eb8ea
2 arquivos alterados com 9 adições e 5 exclusões
  1. 5 1
      services/async_mysql_service.py
  2. 4 4
      spiders/authorspider.py

+ 5 - 1
services/async_mysql_service.py

@@ -162,7 +162,11 @@ class AsyncMysqlService:
 
     async def get_xng_mid(self) -> int:
         #  order by `create_time` desc
-        sql = """select uid,link,nick_name from crawler_user_v3 where task_id=21"""
+        sql = """SELECT uid,id
+                FROM xng_uid
+                GROUP BY uid  
+                ORDER BY id DESC;
+              """
         result = await self.fetch_all(sql)
         return result if result else 0
 

+ 4 - 4
spiders/authorspider.py

@@ -41,7 +41,7 @@ class AuthorSpider(BaseSpider):
                 return
 
             user = self.user_list_from_db[self.current_user_index]
-            crawler_user_uid = user.get("link")
+            crawler_user_uid = user.get("uid")
             self.logger.info(
                 f"处理用户 uid={crawler_user_uid}(第{self.current_user_index + 1}个),"
                 f"当前cursor: {self.current_cursor or '0'}"
@@ -54,8 +54,8 @@ class AuthorSpider(BaseSpider):
             raw_data = await self.crawl_user_videos(request_body, crawler_user_uid)
 
             # 处理数据
-            if self.platform == "xiaoniangao":
-                self.user_list = [user]  # 特殊逻辑
+            # if self.platform == "xiaoniangao":
+            #     self.user_list = [user]  # 特殊逻辑
             pass_video = await self.process_data(raw_data)
             # 根据成功通过视频数大于0和下一页游标判断是否继续当前用户
             if pass_video > 0 and self.current_cursor:
@@ -77,7 +77,7 @@ class AuthorSpider(BaseSpider):
         """构建请求体"""
         virtual_data = {
             # "uid": "173309188", # 测试
-            "uid": str(user.get("link")),
+            "uid": str(user.get("uid")),
             "next_cursor": self.current_cursor
         }