|
@@ -410,8 +410,8 @@ class ArticlePoolCategoryGenerationTask(CategoryGenerationTask):
|
|
|
"""
|
|
|
fetch_query = f"""
|
|
|
select article_id, title from {self.const.ARTICLE_TABLE_NAME}
|
|
|
- where category_status = %s and status = %s and score > %s
|
|
|
- order by score desc limit 1000;
|
|
|
+ where category_status = %s and status = %s and score > %s and read_cnt >= 5000
|
|
|
+ order by score desc limit 100000;
|
|
|
"""
|
|
|
fetch_result = self.db_client.fetch(
|
|
|
query=fetch_query,
|
|
@@ -428,6 +428,7 @@ class ArticlePoolCategoryGenerationTask(CategoryGenerationTask):
|
|
|
crawler_meta_article
|
|
|
where
|
|
|
category = 'account_association' and title_sensitivity = 0 and platform = 'weixin'
|
|
|
+
|
|
|
order by score desc
|
|
|
"""
|
|
|
article_list = self.db_client.fetch(query=fetch_query)
|
|
@@ -482,7 +483,7 @@ class ArticlePoolCategoryGenerationTask(CategoryGenerationTask):
|
|
|
|
|
|
self.rollback_lock_tasks(self.const.ARTICLE_TABLE_NAME)
|
|
|
|
|
|
- task_list = self.get_task_v2()
|
|
|
+ task_list = self.get_task_list()
|
|
|
task_batch_list = yield_batch(data=task_list, batch_size=self.const.BATCH_SIZE)
|
|
|
|
|
|
# # dev
|