Browse Source

冷启动,将抓取计划id存储到抓取计划表

luojunhui 7 months ago
parent
commit
d4ec85a9b6
1 changed file with 6 additions and 1 deletion
  1. 6 1
      coldStartTasks/publish/publishCategoryArticles.py

+ 6 - 1
coldStartTasks/publish/publishCategoryArticles.py

@@ -226,6 +226,7 @@ class CategoryColdStartTask(object):
             mention=False
         )
         if url_list:
+            # create_crawler_plan
             crawler_plan_response = aiditApi.auto_create_crawler_task(
                 plan_id=None,
                 plan_name="自动绑定-{}--{}--{}".format(category, datetime.date.today().__str__(), len(url_list)),
@@ -238,12 +239,14 @@ class CategoryColdStartTask(object):
                 message="成功创建抓取计划",
                 data=crawler_plan_response
             )
-            # auto bind to generate plan
+
+            # save to db
             create_timestamp = int(time.time()) * 1000
             crawler_plan_id = crawler_plan_response['data']['id']
             crawler_plan_name = crawler_plan_response['data']['name']
             self.insert_into_db(crawler_plan_id, crawler_plan_name, create_timestamp)
 
+            # auto bind to generate plan
             new_crawler_task_list = [
                 {
                     "contentType": 1,
@@ -266,6 +269,8 @@ class CategoryColdStartTask(object):
                 message="成功绑定到生成计划",
                 data=generate_plan_response
             )
+
+            # change article status
             article_id_list = filter_df['article_id'].values.tolist()
             self.change_article_status_while_publishing(article_id_list=article_id_list)