Przeglądaj źródła

限流文章扫描删除策略迭代

luojunhui 3 tygodni temu
rodzic
commit
4aa453cac5
2 zmienionych plików z 346 dodań i 148 usunięć
  1. 295 105
      README.md
  2. 51 43
      dev/crontab_back.txt

+ 295 - 105
README.md

@@ -29,12 +29,28 @@ docker compose up -d
 │   │   │   └── rate_limiter.py
 │   │   ├── service
 │   │   │   ├── __init__.py
+│   │   │   ├── daily_rank_manager.py
 │   │   │   ├── gzh_cookie_manager.py
 │   │   │   ├── task_manager_service.py
 │   │   │   └── task_scheduler.py
 │   │   └── v1
-│   │       ├── __init__.py
-│   │       └── routes.py
+│   │       ├── endpoints
+│   │       │   ├── __init__.py
+│   │       │   ├── abtest.py
+│   │       │   ├── health.py
+│   │       │   ├── mcp.py
+│   │       │   ├── monitor.py
+│   │       │   ├── rank_log.py
+│   │       │   ├── tasks.py
+│   │       │   └── tokens.py
+│   │       ├── routes
+│   │       │   ├── __init__.py
+│   │       │   └── routes.py
+│   │       └── utils
+│   │           ├── __init__.py
+│   │           ├── _utils.py
+│   │           ├── deps.py
+│   │           └── schemas.py
 │   ├── core
 │   │   ├── bootstrap
 │   │   │   ├── __init__.py
@@ -53,6 +69,7 @@ docker compose up -d
 │   │   │       ├── deepseek.py
 │   │   │       ├── elasticsearch.py
 │   │   │       ├── mysql.py
+│   │   │       ├── read_rate_limited.py
 │   │   │       └── task_chinese_name.py
 │   │   ├── database
 │   │   │   ├── __init__.py
@@ -79,9 +96,20 @@ docker compose up -d
 │   │   ├── analysis_task
 │   │   │   ├── __init__.py
 │   │   │   ├── account_position_info.py
-│   │   │   └── crawler_detail.py
+│   │   │   ├── crawler_detail.py
+│   │   │   └── rate_limited_article_filter
+│   │   │       ├── __init__.py
+│   │   │       ├── _mapper.py
+│   │   │       ├── _utils.py
+│   │   │       └── entrance.py
 │   │   ├── cold_start_tasks
 │   │   │   ├── __init__.py
+│   │   │   ├── ad_platform_articles
+│   │   │   │   ├── __init__.py
+│   │   │   │   ├── _const.py
+│   │   │   │   ├── _mapper.py
+│   │   │   │   ├── _utils.py
+│   │   │   │   └── entrance.py
 │   │   │   ├── article_pool
 │   │   │   │   ├── __init__.py
 │   │   │   │   ├── article_pool_cold_start_const.py
@@ -104,21 +132,78 @@ docker compose up -d
 │   │   │   ├── article_detail_stat.py
 │   │   │   ├── recycle_daily_publish_articles.py
 │   │   │   ├── recycle_mini_program_detail.py
+│   │   │   ├── recycle_mini_program_info
+│   │   │   │   ├── __init__.py
+│   │   │   │   ├── _const.py
+│   │   │   │   ├── _mapper.py
+│   │   │   │   ├── _util.py
+│   │   │   │   └── entrance.py
 │   │   │   └── recycle_outside_account_articles.py
 │   │   ├── llm_tasks
 │   │   │   ├── __init__.py
+│   │   │   ├── aigc_decode_task
+│   │   │   │   ├── __init__.py
+│   │   │   │   ├── _const.py
+│   │   │   │   ├── _mapper.py
+│   │   │   │   ├── _utils.py
+│   │   │   │   ├── create_decode_tasks.py
+│   │   │   │   ├── extract_decode_task_detail.py
+│   │   │   │   └── fetch_decode_results.py
 │   │   │   ├── candidate_account_process.py
 │   │   │   ├── process_title.py
 │   │   │   └── prompts.py
-│   │   └── monitor_tasks
+│   │   ├── mcp
+│   │   │   ├── __init__.py
+│   │   │   ├── _const.py
+│   │   │   ├── _handler_map.py
+│   │   │   └── _mapper.py
+│   │   ├── monitor_tasks
+│   │   │   ├── __init__.py
+│   │   │   ├── ad_platform_accounts_monitor
+│   │   │   │   ├── __init__.py
+│   │   │   │   ├── _const.py
+│   │   │   │   ├── _mapper.py
+│   │   │   │   ├── _utils.py
+│   │   │   │   └── entrance.py
+│   │   │   ├── auto_reply_cards_monitor
+│   │   │   │   ├── __init__.py
+│   │   │   │   ├── _const.py
+│   │   │   │   ├── _mapper.py
+│   │   │   │   ├── _utils.py
+│   │   │   │   └── entrance.py
+│   │   │   ├── cooperate_accounts_monitor.py
+│   │   │   ├── fwh_group_publish_monitor.py
+│   │   │   ├── get_off_videos.py
+│   │   │   ├── gzh_article_monitor.py
+│   │   │   ├── kimi_balance.py
+│   │   │   ├── limited_account_analysis.py
+│   │   │   ├── rank_log_monitor
+│   │   │   │   ├── __init__.py
+│   │   │   │   ├── _const.py
+│   │   │   │   ├── _mapper.py
+│   │   │   │   ├── _utils.py
+│   │   │   │   └── entrance.py
+│   │   │   └── task_processing_monitor.py
+│   │   └── recommend
 │   │       ├── __init__.py
-│   │       ├── auto_reply_cards_monitor.py
-│   │       ├── cooperate_accounts_monitor.py
-│   │       ├── get_off_videos.py
-│   │       ├── gzh_article_monitor.py
-│   │       ├── kimi_balance.py
-│   │       ├── limited_account_analysis.py
-│   │       └── task_processing_monitor.py
+│   │       ├── i2i_recommend
+│   │       │   ├── __init__.py
+│   │       │   ├── _const.py
+│   │       │   ├── _mapper.py
+│   │       │   ├── _utils.py
+│   │       │   └── entrance.py
+│   │       └── offline_recommend
+│   │           ├── __init__.py
+│   │           ├── core.py
+│   │           ├── strategy
+│   │           │   ├── __init__.py
+│   │           │   ├── base.py
+│   │           │   ├── get_top_article.py
+│   │           │   └── i2i.py
+│   │           └── utils
+│   │               ├── __init__.py
+│   │               ├── produce_data.py
+│   │               └── recommend_apollo.py
 │   ├── infra
 │   │   ├── crawler
 │   │   │   ├── __init__.py
@@ -142,31 +227,58 @@ docker compose up -d
 │   │   │   ├── apollo.py
 │   │   │   ├── deepseek_official.py
 │   │   │   ├── elastic_search.py
-│   │   │   └── feishu.py
+│   │   │   ├── feishu.py
+│   │   │   └── odps_service.py
 │   │   ├── internal
 │   │   │   ├── __init__.py
 │   │   │   ├── aigc_system.py
 │   │   │   ├── long_articles.py
-│   │   │   └── piaoquan.py
-│   │   ├── shared
+│   │   │   ├── piaoquan.py
+│   │   │   └── piaoquan_decode_server.py
+│   │   ├── mapper
 │   │   │   ├── __init__.py
-│   │   │   ├── async_tasks.py
-│   │   │   ├── http_client.py
-│   │   │   └── tools.py
-│   │   └── utils
+│   │   │   ├── aigc_mapper.py
+│   │   │   ├── long_article_mapper.py
+│   │   │   ├── long_video_mapper.py
+│   │   │   └── piaoquan_crawler_mapper.py
+│   │   └── shared
 │   │       ├── __init__.py
-│   │       ├── get_cover.py
-│   │       └── response.py
-│   └── jobs
-│       ├── task_config.py
-│       ├── task_handler.py
-│       ├── task_mapper.py
-│       └── task_utils.py
+│   │       ├── async_tasks.py
+│   │       ├── http_client.py
+│   │       ├── image.py
+│   │       ├── oss.py
+│   │       ├── response.py
+│   │       └── tools.py
+│   ├── jobs
+│   │   ├── domains
+│   │   │   ├── __init__.py
+│   │   │   ├── algorithm.py
+│   │   │   ├── anaylsis.py
+│   │   │   ├── cold_start.py
+│   │   │   ├── crawler_tasks.py
+│   │   │   ├── data_recycle.py
+│   │   │   ├── llm_task.py
+│   │   │   ├── monitor_task.py
+│   │   │   └── recommend.py
+│   │   ├── task_config.py
+│   │   ├── task_handler.py
+│   │   ├── task_mapper.py
+│   │   └── task_utils.py
+│   └── schemas
+│       ├── __init__.py
+│       └── image.py
 ├── app_config.toml
+├── dev
+│   ├── crontab_back.txt
 ├── docker-compose.yaml
+├── docs
+│   ├── i2i_recommend_data_sync.md
+│   ├── rank_log_monitor_tech_plan.md
+│   └── rate_limited_article_filter_tech_plan.md
 ├── jenkins_bash.sh
 ├── requirements.txt
 └── task_app.py
+
 ```
 
 ### get code strategy
@@ -174,90 +286,168 @@ docker compose up -d
 tree -I "__pycache__|*.pyc"
 ```
 
-## 1. 数据任务
-#### daily发文数据回收
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "daily_publish_articles_recycle"}'
-```
-#### daily发文更新root_source_id
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_root_source_id"}'
-```
-#### 账号质量处理
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "candidate_account_quality_analysis"}'
-```
-## 2. 抓取任务
+## Crontab(生产调度)
 
-#### 今日头条账号内文章抓取
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "crawler_toutiao"}'
-```
-#### 今日头条推荐抓取文章
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "crawler_toutiao", "method": "recommend"}'
-```
-#### 今日头条搜索抓取账号
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "crawler_toutiao", "method": "search"}'
-```
-#### 抓取账号管理(微信)
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "crawler_account_manager", "platform": "weixin"}'
-```
-#### 抓取微信文章(抓账号模式)
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "crawler_gzh_articles", "account_method": "account_association", "crawl_mode": "account"}'
-```
-#### 抓取微信文章(搜索模式)
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "crawler_gzh_articles", "account_method": "search", "crawl_mode": "search"}'
-```
+以下为服务器上配置的定时任务(路径与主机以实际环境为准)。
 
-## 3. 冷启动发布任务
-#### 发布头条文章
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "article_pool_cold_start", "platform": "toutiao", "crawler_methods": ["toutiao_account_association"]}'
-```
-#### 发布公众号文章
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "article_pool_cold_start"}'
-```
+```cron
+0 9,15,21 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "auto_follow_account"}'
 
-## 4. 其他
-#### 校验kimi余额
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "check_kimi_balance"}'
-```
-#### 自动下架视频
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "get_off_videos"}'
-```
-#### 校验视频可见状态
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "check_publish_video_audit_status"}'
-```
-#### 外部服务号监测
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "outside_article_monitor"}'
-```
-#### 站内服务号发文监测
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "inner_article_monitor"}'
-```
-#### 标题重写
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "title_rewrite"}'
-```
-#### 为标题增加品类(文章池)
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "article_pool_category_generation", "limit": "1000"}'
-```
-#### 候选账号质量分析
-```aiignore
-curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "candidate_account_quality_analysis"}'
-```
+26 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "rate_limited_article_filter"}'
+
+30 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "get_follow_result"}'
+
+50 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "extract_reply_result"}'
+
+
+0 3 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "crawler_gzh_articles", "account_method": "1030-手动挑号", "crawl_mode": "account", "strategy": "V1"}'
+
+0 4 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "crawler_gzh_articles", "account_method": "cooperate_account", "crawl_mode": "account", "strategy": "V1"}'
+
+
+# 定时清理文件
+0 1 * * * find /root/luojunhui/LongArticlesJob/static -type f -name "*.mp4" -mtime +5 -delete
+# 每天 9 点, 18 点执行 gzh 视频抓取
+0 9,18 * * * bash /root/luojunhui/LongArticlesJob/sh/run_gzh_video_crawler.sh
+
+* * * * * bash /root/luojunhui/LongArticlesJob/sh/run_long_articles_job.sh
+
+# 外部服务号监测
+0 13 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "cooperate_accounts_monitor"}'
+
+30 * * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "cooperate_accounts_detail"}'
+
+# 每天凌晨 4点,下午 4 点各执行一次头条视频抓取
+0 4,16 * * * bash /root/luojunhui/LongArticlesJob/sh/run_toutiao_account_video_crawler.sh
+
+# 更新服务号数据
+0 10,17 * * * bash /root/luojunhui/LongArticlesJob/sh/run_fwh_data_manager.sh
+
+# 每15分钟执行一次今日头条推荐流抓取
+*/15 * * * * bash /root/luojunhui/LongArticlesJob/sh/run_toutiao_recommend.sh
+
+# 每10分钟执行一次从aigc系统获取发布文章
+*/10 * * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_article_info_from_aigc.sh
+
+# 每10分钟执行一次标题相似度计算任务
+*/10 * * * * bash /root/luojunhui/LongArticlesJob/sh/run_title_similarity_task.sh
+
+# 每小时执行一次标题改写
+0 * * * * bash /root/luojunhui/LongArticlesJob/sh/run_title_process_task.sh
+
+# 凌晨2点30执行更新小程序信息任务
+30 2 * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_minigram_info_daily.sh
+
+# 凌晨3:00,下午3:00执行视频号抓取任务
+0 3,15 * * * bash /root/luojunhui/LongArticlesJob/sh/run_sph_video_crawler.sh
+
+# 每天上午10点30执行文章退场 && 晋升任务
+30 10 * * * bash /root/luojunhui/LongArticlesJob/sh/run_article_title_exit_v1.sh
+
+# 晚上6点执行头条文章冷启动
+0 18 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "article_pool_cold_start", "platform": "toutiao", "crawler_methods": ["toutiao_account_association"]}'
+
+# 17:50执行公众号文章战冷启动
+30 17 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "article_pool_cold_start", "strategy": "strategy_v3"}'
+
+0 4 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "article_pool_cold_start", "strategy": "strategy_v1"}'
+
+# 早上执行sohu 抓取
+0 6 * * * bash /root/luojunhui/LongArticlesJob/sh/run_schedule_app.sh
+0 2 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "crawler_toutiao"}'
+
+#
+0 14 * * * bash /root/luojunhui/LongArticlesJob/sh/run_cold_start_publish.sh
+
+# 每日上午9点执行账号联想任务
+0 9 * * * bash /root/luojunhui/LongArticlesJob/sh/run_account_association.sh
+
+# 执行阅读率均值
+0 10 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_account_read_rate_avg"}'
+
+# 执行阅读均值
+40 10 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_account_read_avg"}'
+
+# 执行打开率均值
+50 10 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_account_open_rate_avg"}'
+
+
+# 每天11点执行文章联想任务
+0 11 * * * bash /root/luojunhui/LongArticlesJob/sh/run_article_association.sh
+
+# 每小时执行一次校验视频状态
+24 */4 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "check_publish_video_audit_status"}'
+
+
+# 每天凌晨4:30 15:30执行视频发布和审核流程
+0 1,8,19 * * * bash /root/luojunhui/LongArticlesJob/sh/run_video_publish_and_audit.sh
+
+
+30 8,15 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "daily_publish_articles_recycle"}'
+
+0 21 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "daily_publish_articles_recycle"}'
+
+10 22 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "daily_publish_articles_recycle"}'
+
+30 9,16,21 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_root_source_id"}'
+
+30 22 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_root_source_id"}'
+
+# 每天上午 9:30 点,下午 2 点,晚上 7 点执行下架视频任务
+0 9,15,19 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "get_off_videos"}'
+
+# 执行内部文章违规检测
+0 9,16,23 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "inner_article_monitor"}'
+
+# 每开始执行百度视频
+20 0,12 * * * bash /root/luojunhui/LongArticlesJob/sh/run_baidu_video_crawler.sh
+
+# check kimo balance hourly
+# 每4h校验一次kimi余额
+# 25 */4 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "check_kimi_balance"}'
+
+# 更新小程序信息
+0 3,4,5,6,7,8 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "mini_program_detail_process"}'
+
+
+# */8 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "extract_title_features", "batch_size": 50, "version": 2}'
+
+# 0 9,16 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "recycle_outside_account_articles"}'
+
+# 35 16 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_outside_account_article_root_source_id"}'
+
+# 执行限流文章分析
+40 10 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_limited_account_info"}'
+
+# 早上 11 点获取前日文章详情
+30 11 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "article_detail_stat"}'
+
+# 执行广告平台账号内容抓取
+0 3 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "ad_platform_accounts_crawler"}'
+
+# 执广告平台账号详情抓取
+32 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "ad_platform_article_detail"}'
+
+# 执行创建解构任务
+# 15 20 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "create_ad_platform_accounts_decode_task"}'
+
+# 定时获取解构结果
+30 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "fetch_decode_result"}'
+
+
+# 定时获取解构结果
+50 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "extract_decode_result"}'
+
+# 腾讯广告互相平台账号--发文至头条
+0 6 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "ad_platform_article_publish"}'
 
+# 排序日志更新
+0 14 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "rank_log_monitor"}'
 
+# I2I 排序日志更新
+0 5 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "i2i_recommend_data_sync"}'
 
 
+# 候选账号质量分析
+# 0 5,10,15,20 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "candidate_account_quality_analysis"}'
+```

+ 51 - 43
dev/crontab_back.txt

@@ -1,7 +1,16 @@
+0 9,15,21 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "auto_follow_account"}'
 
-0 3 * * * curl -X POST http://192.168.100.31:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "crawler_gzh_articles", "account_method": "1030-手动挑号", "crawl_mode": "account", "strategy": "V1"}'
+26 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "rate_limited_article_filter"}'
+
+30 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "get_follow_result"}'
+
+50 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "extract_reply_result"}'
+
+
+0 3 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "crawler_gzh_articles", "account_method": "1030-手动挑号", "crawl_mode": "account", "strategy": "V1"}'
+
+0 4 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "crawler_gzh_articles", "account_method": "cooperate_account", "crawl_mode": "account", "strategy": "V1"}'
 
-0 4 * * * curl -X POST http://192.168.100.31:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "crawler_gzh_articles", "account_method": "cooperate_account", "crawl_mode": "account", "strategy": "V1"}'
 
 # 定时清理文件
 0 1 * * * find /root/luojunhui/LongArticlesJob/static -type f -name "*.mp4" -mtime +5 -delete
@@ -11,13 +20,15 @@
 * * * * * bash /root/luojunhui/LongArticlesJob/sh/run_long_articles_job.sh
 
 # 外部服务号监测
-# 0 13 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "outside_article_monitor"}'
+0 13 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "cooperate_accounts_monitor"}'
+
+30 * * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "cooperate_accounts_detail"}'
 
 # 每天凌晨 4点,下午 4 点各执行一次头条视频抓取
 0 4,16 * * * bash /root/luojunhui/LongArticlesJob/sh/run_toutiao_account_video_crawler.sh
 
 # 更新服务号数据
-0 11,17 * * * bash /root/luojunhui/LongArticlesJob/sh/run_fwh_data_manager.sh
+0 10,17 * * * bash /root/luojunhui/LongArticlesJob/sh/run_fwh_data_manager.sh
 
 # 每15分钟执行一次今日头条推荐流抓取
 */15 * * * * bash /root/luojunhui/LongArticlesJob/sh/run_toutiao_recommend.sh
@@ -40,9 +51,6 @@
 # 每天上午10点30执行文章退场 && 晋升任务
 30 10 * * * bash /root/luojunhui/LongArticlesJob/sh/run_article_title_exit_v1.sh
 
-# 每天上午4点执行账号冷启动任务
-# 0 1 * * * bash /root/luojunhui/LongArticlesJob/sh/run_account_cold_start_daily.sh
-
 # 晚上6点执行头条文章冷启动
 0 18 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "article_pool_cold_start", "platform": "toutiao", "crawler_methods": ["toutiao_account_association"]}'
 
@@ -61,12 +69,6 @@
 # 每日上午9点执行账号联想任务
 0 9 * * * bash /root/luojunhui/LongArticlesJob/sh/run_account_association.sh
 
-# 每天 10 点执行前一天的阅读率均值代码
-# 0 10 * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_account_read_rate_avg.sh
-
-# 每天10点40执行阅读均值任务
-# 40 10 * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_account_avg_v3.sh
-
 # 执行阅读率均值
 0 10 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_account_read_rate_avg"}'
 
@@ -81,18 +83,12 @@
 0 11 * * * bash /root/luojunhui/LongArticlesJob/sh/run_article_association.sh
 
 # 每小时执行一次校验视频状态
-# 20 * * * * bash /root/luojunhui/LongArticlesJob/sh/run_check_video_status_hourly.sh
 24 */4 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "check_publish_video_audit_status"}'
 
 
 # 每天凌晨4:30 15:30执行视频发布和审核流程
 0 1,8,19 * * * bash /root/luojunhui/LongArticlesJob/sh/run_video_publish_and_audit.sh
 
-# 每天 上午8:30, 下午1:00, 晚上8:50执行
-
-# 30 8 * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_published_articles_daily.sh
-# 20 14 * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_published_articles_daily.sh
-# 50 20 * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_published_articles_daily.sh
 
 30 8,15 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "daily_publish_articles_recycle"}'
 
@@ -103,37 +99,19 @@
 30 9,16,21 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_root_source_id"}'
 
 30 22 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_root_source_id"}'
-# 每天上午9点,下午2点,晚上9点执行v2代码
-# 0 9,14,21 * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_published_articles_daily_v2.sh
-
 
 # 每天上午 9:30 点,下午 2 点,晚上 7 点执行下架视频任务
-
-# 30 9 * * * bash /root/luojunhui/LongArticlesJob/sh/run_get_off_videos_three_times_per_day.sh
-
-# 0 15 * * * bash /root/luojunhui/LongArticlesJob/sh/run_get_off_videos_three_times_per_day.sh
-
-# 0 19 * * * bash /root/luojunhui/LongArticlesJob/sh/run_get_off_videos_three_times_per_day.sh
-
 0 9,15,19 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "get_off_videos"}'
 
-# 每天早上9点,下午2:30, 晚上7:30
-
-# 0 10,16,20 * * * bash /root/luojunhui/LongArticlesJob/sh/published_articles_monitor.sh
-0 10,16,20 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "inner_article_monitor"}'
+# 执行内部文章违规检测
+0 9,16,23 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "inner_article_monitor"}'
 
 # 每开始执行百度视频
 20 0,12 * * * bash /root/luojunhui/LongArticlesJob/sh/run_baidu_video_crawler.sh
 
 # check kimo balance hourly
-
-# 30 * * * * bash /root/luojunhui/LongArticlesJob/sh/run_kimi_balance_monitor.sh
 # 每4h校验一次kimi余额
-25 */4 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "check_kimi_balance"}'
-
-# 0 11,23 * * * bash /root/luojunhui/LongArticlesJob/sh/run_account_explore.sh
-
-# 0 5,10,15,20 * * * bash /root/luojunhui/LongArticlesJob/sh/run_account_quality_analysis.sh
+# 25 */4 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "check_kimi_balance"}'
 
 # 更新小程序信息
 0 3,4,5,6,7,8 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "mini_program_detail_process"}'
@@ -141,11 +119,41 @@
 
 # */8 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "extract_title_features", "batch_size": 50, "version": 2}'
 
-0 9,16 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "recycle_outside_account_articles"}'
+# 0 9,16 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "recycle_outside_account_articles"}'
 
-35 16 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_outside_account_article_root_source_id"}'
+# 35 16 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_outside_account_article_root_source_id"}'
 
 # 执行限流文章分析
 40 10 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_limited_account_info"}'
+
+# 早上 11 点获取前日文章详情
+30 11 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "article_detail_stat"}'
+
+# 执行广告平台账号内容抓取
+0 3 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "ad_platform_accounts_crawler"}'
+
+# 执广告平台账号详情抓取
+32 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "ad_platform_article_detail"}'
+
+# 执行创建解构任务
+# 15 20 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "create_ad_platform_accounts_decode_task"}'
+
+# 定时获取解构结果
+30 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "fetch_decode_result"}'
+
+
+# 定时获取解构结果
+50 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "extract_decode_result"}'
+
+# 腾讯广告互相平台账号--发文至头条
+0 6 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "ad_platform_article_publish"}'
+
+# 排序日志更新
+0 14 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "rank_log_monitor"}'
+
+# I2I 排序日志更新
+0 5 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "i2i_recommend_data_sync"}'
+
+
 # 候选账号质量分析
-0 5,10,15,20 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "candidate_account_quality_analysis"}'
+# 0 5,10,15,20 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "candidate_account_quality_analysis"}'