Parcourir la source

outside article monitor

luojunhui il y a 2 mois
Parent
commit
c67df28911
1 fichier modifié avec 4 ajouts et 3 suppressions
  1. 4 3
      tasks/ai_tasks/category_generation_task.py

+ 4 - 3
tasks/ai_tasks/category_generation_task.py

@@ -410,8 +410,8 @@ class ArticlePoolCategoryGenerationTask(CategoryGenerationTask):
         """
         fetch_query = f"""
                select article_id, title from {self.const.ARTICLE_TABLE_NAME}
-               where category_status = %s and status = %s and score > %s
-               order by score desc limit 1000;
+               where category_status = %s and status = %s and score > %s and read_cnt >= 5000
+               order by score desc limit 100000;
            """
         fetch_result = self.db_client.fetch(
             query=fetch_query,
@@ -428,6 +428,7 @@ class ArticlePoolCategoryGenerationTask(CategoryGenerationTask):
                 crawler_meta_article
             where 
                 category = 'account_association' and title_sensitivity = 0 and platform = 'weixin'
+                
             order by score desc
         """
         article_list = self.db_client.fetch(query=fetch_query)
@@ -482,7 +483,7 @@ class ArticlePoolCategoryGenerationTask(CategoryGenerationTask):
 
         self.rollback_lock_tasks(self.const.ARTICLE_TABLE_NAME)
 
-        task_list = self.get_task_v2()
+        task_list = self.get_task_list()
         task_batch_list = yield_batch(data=task_list, batch_size=self.const.BATCH_SIZE)
 
         # #  dev