crontab_back.txt 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179
  1. # 卡片解构-封面下载重试
  2. 40 * * * * curl -X POST http://192.168.205.85:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "re_extract"}'
  3. # 卡片解构 — 每小时 05 分创建任务
  4. 5 * * * * curl -X POST http://192.168.205.85:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "create_cards_decode_task"}'
  5. # 文章解构 — 每小时 15 分创建任务
  6. 15 * * * * curl -X POST http://192.168.205.85:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "create_inner_articles_decode_task"}'
  7. # 素材解构 — 每小时 25 分创建任务
  8. 25 * * * * curl -X POST http://192.168.205.85:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "create_material_decode_task"}'
  9. # 获取解构结果 — 每天 20:00、21:00、22:00 各执行一项
  10. 0 20 * * * curl -X POST http://192.168.205.85:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "fetch_cards_decode_result"}'
  11. 0 21 * * * curl -X POST http://192.168.205.85:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "fetch_decode_result"}'
  12. 0 22 * * * curl -X POST http://192.168.205.85:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "fetch_material_decode_result"}'
  13. # 创建增长头部视频数据生产
  14. 0 13 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "produce_decode_growth_head_videos"}'
  15. 0 9,15,21 * * * curl -X POST http://192.168.205.85:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "auto_follow_account"}'
  16. 26 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "rate_limited_article_filter"}'
  17. 30 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "get_follow_result"}'
  18. 50 * * * * curl -X POST http://192.168.205.85:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "extract_reply_result"}'
  19. 0 3 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "crawler_gzh_articles", "account_method": "1030-手动挑号", "crawl_mode": "account", "strategy": "V1"}'
  20. 0 4 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "crawler_gzh_articles", "account_method": "cooperate_account", "crawl_mode": "account", "strategy": "V1"}'
  21. # 定时清理文件
  22. 0 1 * * * find /root/luojunhui/LongArticlesJob/static -type f -name "*.mp4" -mtime +5 -delete
  23. # 每天 9 点, 18 点执行 gzh 视频抓取
  24. 0 9,18 * * * bash /root/luojunhui/LongArticlesJob/sh/run_gzh_video_crawler.sh
  25. * * * * * bash /root/luojunhui/LongArticlesJob/sh/run_long_articles_job.sh
  26. # 外部服务号监测
  27. 0 13 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "cooperate_accounts_monitor"}'
  28. 30 * * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "cooperate_accounts_detail"}'
  29. # 每天凌晨 4点,下午 4 点各执行一次头条视频抓取
  30. 0 4,16 * * * bash /root/luojunhui/LongArticlesJob/sh/run_toutiao_account_video_crawler.sh
  31. # 更新服务号数据
  32. 0 10,17 * * * bash /root/luojunhui/LongArticlesJob/sh/run_fwh_data_manager.sh
  33. # 每15分钟执行一次今日头条推荐流抓取
  34. */15 * * * * bash /root/luojunhui/LongArticlesJob/sh/run_toutiao_recommend.sh
  35. # 每10分钟执行一次从aigc系统获取发布文章
  36. */10 * * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_article_info_from_aigc.sh
  37. # 每10分钟执行一次标题相似度计算任务
  38. */10 * * * * bash /root/luojunhui/LongArticlesJob/sh/run_title_similarity_task.sh
  39. # 每小时执行一次标题改写
  40. 0 * * * * bash /root/luojunhui/LongArticlesJob/sh/run_title_process_task.sh
  41. # 凌晨2点30执行更新小程序信息任务
  42. 30 2 * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_minigram_info_daily.sh
  43. # 凌晨3:00,下午3:00执行视频号抓取任务
  44. 0 3,15 * * * bash /root/luojunhui/LongArticlesJob/sh/run_sph_video_crawler.sh
  45. # 每天上午10点30执行文章退场 && 晋升任务
  46. 30 10 * * * bash /root/luojunhui/LongArticlesJob/sh/run_article_title_exit_v1.sh
  47. # 晚上6点执行头条文章冷启动
  48. 0 18 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "article_pool_cold_start", "platform": "toutiao", "crawler_methods": ["toutiao_account_association"]}'
  49. # 17:30(strategy_v3)、凌晨 4:00(strategy_v1)执行公众号文章池冷启动
  50. 30 17 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "article_pool_cold_start", "strategy": "strategy_v3"}'
  51. 0 4 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "article_pool_cold_start", "strategy": "strategy_v1"}'
  52. # 早上执行sohu 抓取
  53. 0 6 * * * bash /root/luojunhui/LongArticlesJob/sh/run_schedule_app.sh
  54. 0 2 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "crawler_toutiao"}'
  55. # 每天 14:00 执行冷启动发布
  56. 0 14 * * * bash /root/luojunhui/LongArticlesJob/sh/run_cold_start_publish.sh
  57. # 每日上午9点执行账号联想任务
  58. 0 9 * * * bash /root/luojunhui/LongArticlesJob/sh/run_account_association.sh
  59. # 执行阅读率均值
  60. 0 10 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_account_read_rate_avg"}'
  61. # 执行阅读均值
  62. 40 10 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_account_read_avg"}'
  63. # 执行打开率均值
  64. 50 10 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_account_open_rate_avg"}'
  65. # 每天11点执行文章联想任务
  66. 0 11 * * * bash /root/luojunhui/LongArticlesJob/sh/run_article_association.sh
  67. # 每4小时(第24分)执行一次校验视频状态
  68. 24 */4 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "check_publish_video_audit_status"}'
  69. # 每天 1:00、8:00、19:00 执行视频发布和审核流程
  70. 0 1,8,19 * * * bash /root/luojunhui/LongArticlesJob/sh/run_video_publish_and_audit.sh
  71. 30 8,15 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "daily_publish_articles_recycle"}'
  72. 0 21 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "daily_publish_articles_recycle"}'
  73. 10 22 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "daily_publish_articles_recycle"}'
  74. 30 9,16,21 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_root_source_id"}'
  75. 30 22 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_root_source_id"}'
  76. # 每天 9:00、15:00、19:00 执行下架视频任务(当前已注释停用)
  77. # 0 9,15,19 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "get_off_videos"}'
  78. # 执行内部文章违规检测
  79. 0 9,16,23 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "inner_article_monitor"}'
  80. # 每天 0:20、12:20 执行百度视频抓取
  81. 20 0,12 * * * bash /root/luojunhui/LongArticlesJob/sh/run_baidu_video_crawler.sh
  82. # check kimi balance every 4 hours
  83. # 每4h校验一次kimi余额
  84. # 25 */4 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "check_kimi_balance"}'
  85. # 更新小程序信息
  86. 0 3,4,5,6,7,8 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "mini_program_detail_process"}'
  87. # */8 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "extract_title_features", "batch_size": 50, "version": 2}'
  88. # 0 9,16 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "recycle_outside_account_articles"}'
  89. # 35 16 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_outside_account_article_root_source_id"}'
  90. # 执行限流文章分析
  91. 40 10 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_limited_account_info"}'
  92. # 上午 11:30 获取前日文章详情
  93. 30 11 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "article_detail_stat"}'
  94. # 执行广告平台账号内容抓取
  95. 0 3 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "ad_platform_accounts_crawler"}'
  96. # 执行广告平台账号详情抓取
  97. 32 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "ad_platform_article_detail"}'
  98. # 执行创建解构任务
  99. # 15 20 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "create_ad_platform_accounts_decode_task"}'
  100. # 定时获取解构结果
  101. 30 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "fetch_decode_result"}'
  102. # 定时提取解构结果
  103. 50 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "extract_decode_result"}'
  104. # 腾讯广告互选平台账号--发文至头条
  105. 0 6 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "ad_platform_article_publish"}'
  106. # 排序日志更新
  107. 0 14 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "rank_log_monitor"}'
  108. # I2I 推荐数据同步
  109. 0 5 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "i2i_recommend_data_sync"}'
  110. # 候选账号质量分析
  111. # 0 5,10,15,20 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "candidate_account_quality_analysis"}'