|
@@ -175,6 +175,7 @@ class ArticlePoolColdStart(ArticlePoolColdStartStrategy, ArticlePoolFilterStrate
|
|
|
article_dataframe = await self.get_article_from_meta_table(
|
|
article_dataframe = await self.get_article_from_meta_table(
|
|
|
platform, crawl_method, strategy, category
|
|
platform, crawl_method, strategy, category
|
|
|
)
|
|
)
|
|
|
|
|
+ print(article_dataframe)
|
|
|
|
|
|
|
|
await self.log_client.log(
|
|
await self.log_client.log(
|
|
|
contents={
|
|
contents={
|
|
@@ -228,6 +229,21 @@ class ArticlePoolColdStart(ArticlePoolColdStartStrategy, ArticlePoolFilterStrate
|
|
|
article_id_list=article_id_list
|
|
article_id_list=article_id_list
|
|
|
)
|
|
)
|
|
|
|
|
|
|
|
|
|
+ case "strategy_v3":
|
|
|
|
|
+ url_list = filter_article_df["link"].values.tolist()
|
|
|
|
|
+ print("url_list", url_list)
|
|
|
|
|
+ await self.create_crawler_plan_and_bind_to_produce_plan(
|
|
|
|
|
+ strategy, crawl_method, category, platform, url_list, plan_id
|
|
|
|
|
+ )
|
|
|
|
|
+ print("抓取计划创建成功")
|
|
|
|
|
+ # change article status
|
|
|
|
|
+ article_id_list = filter_article_df["article_id"].values.tolist()
|
|
|
|
|
+ await self.change_article_status_while_publishing(
|
|
|
|
|
+ article_id_list=article_id_list
|
|
|
|
|
+ )
|
|
|
|
|
+ print("文章状态修改成功")
|
|
|
|
|
+
|
|
|
|
|
+
|
|
|
async def deal(
|
|
async def deal(
|
|
|
self,
|
|
self,
|
|
|
platform: str,
|
|
platform: str,
|
|
@@ -388,5 +404,13 @@ class ArticlePoolColdStart(ArticlePoolColdStartStrategy, ArticlePoolFilterStrate
|
|
|
mention=False,
|
|
mention=False,
|
|
|
)
|
|
)
|
|
|
|
|
|
|
|
|
|
+ case "strategy_v3":
|
|
|
|
|
+ plan_id = "20250703081329508785665"
|
|
|
|
|
+ await self.create_cold_start_plan(
|
|
|
|
|
+ platform=platform,
|
|
|
|
|
+ strategy=strategy,
|
|
|
|
|
+ plan_id=plan_id,
|
|
|
|
|
+ )
|
|
|
|
|
+
|
|
|
case _:
|
|
case _:
|
|
|
raise Exception(f"error strategy {strategy}")
|
|
raise Exception(f"error strategy {strategy}")
|