| 
					
				 | 
			
			
				@@ -13,6 +13,7 @@ from applications import aiditApi, log, bot 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				 from config import apolloConfig 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				 apollo = apolloConfig() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+DAILY_CRAWLER_MAX_NUM = 1000 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				 class CategoryColdStartTask(object): 
			 | 
		
	
	
		
			
				| 
					
				 | 
			
			
				@@ -268,7 +269,7 @@ class CategoryColdStartTask(object): 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             }, 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             mention=False 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         ) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-        return filter_df[:1000] 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+        return filter_df[:DAILY_CRAWLER_MAX_NUM] 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				     def filter_toutiao_articles(self, articles_df, category): 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         """ 
			 | 
		
	
	
		
			
				| 
					
				 | 
			
			
				@@ -377,7 +378,7 @@ class CategoryColdStartTask(object): 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				         for category in category_list: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				             try: 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 # 已发布标题去重 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				-                self.published_articles_title_filter(category=category) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				+                self.published_articles_title_filter() 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				  
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 category_df = self.get_articles_from_meta_table(category=category, article_source=article_source) 
			 | 
		
	
		
			
				 | 
				 | 
			
			
				                 self.publish_filter_articles( 
			 |