Browse Source

提取标题品类信息

luojunhui 3 tháng trước cách đây
mục cha
commit
2cb309cda5
1 tập tin đã thay đổi với 124 bổ sung0 xóa
  1. 124 0
      dev/crontab_back.txt

+ 124 - 0
dev/crontab_back.txt

@@ -0,0 +1,124 @@
+# 定时清理文件
+0 1 * * * find /root/luojunhui/LongArticlesJob/static -type f -name "*.mp4" -mtime +5 -delete
+# 每天 9 点, 18 点执行 gzh 视频抓取
+0 9,18 * * * bash /root/luojunhui/LongArticlesJob/sh/run_gzh_video_crawler.sh
+
+* * * * * bash /root/luojunhui/LongArticlesJob/sh/run_long_articles_job.sh
+
+# 外部服务号监测
+# 0 13 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "outside_article_monitor"}'
+
+# 每天凌晨 4点,下午 4 点各执行一次头条视频抓取
+0 4,16 * * * bash /root/luojunhui/LongArticlesJob/sh/run_toutiao_account_video_crawler.sh
+
+# 更新服务号数据
+0 11,17 * * * bash /root/luojunhui/LongArticlesJob/sh/run_fwh_data_manager.sh
+
+# 每15分钟执行一次今日头条推荐流抓取
+*/15 * * * * bash /root/luojunhui/LongArticlesJob/sh/run_toutiao_recommend.sh
+
+# 每10分钟执行一次从aigc系统获取发布文章
+*/10 * * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_article_info_from_aigc.sh
+
+# 每10分钟执行一次标题相似度计算任务
+*/10 * * * * bash /root/luojunhui/LongArticlesJob/sh/run_title_similarity_task.sh
+
+# 每小时执行一次标题改写
+0 * * * * bash /root/luojunhui/LongArticlesJob/sh/run_title_process_task.sh
+
+# 凌晨2点30执行更新小程序信息任务
+30 2 * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_minigram_info_daily.sh
+
+# 凌晨3:00,下午3:00执行视频号抓取任务
+0 3,15 * * * bash /root/luojunhui/LongArticlesJob/sh/run_sph_video_crawler.sh
+
+# 每天上午10点30执行文章退场 && 晋升任务
+30 10 * * * bash /root/luojunhui/LongArticlesJob/sh/run_article_title_exit_v1.sh
+
+# 每天凌晨1点执行账号冷启动任务
+0 1 * * * bash /root/luojunhui/LongArticlesJob/sh/run_account_cold_start_daily.sh
+
+# 晚上6点执行头条文章冷启动
+0 18 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "article_pool_cold_start", "platform": "toutiao", "crawler_methods": ["toutiao_account_association"]}'
+
+# 17:30执行公众号文章池冷启动
+30 17 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "article_pool_cold_start", "strategy": "strategy_v2"}'
+
+# 早上执行sohu 抓取
+0 6 * * * bash /root/luojunhui/LongArticlesJob/sh/run_schedule_app.sh
+0 2 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "crawler_toutiao"}'
+
+# 每天下午2点执行 run_cold_start_publish.sh
+0 14 * * * bash /root/luojunhui/LongArticlesJob/sh/run_cold_start_publish.sh
+
+# 每日上午9点执行账号联想任务
+0 9 * * * bash /root/luojunhui/LongArticlesJob/sh/run_account_association.sh
+
+# 每天 10 点执行前一天的阅读率均值代码
+0 10 * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_account_read_rate_avg.sh
+
+# 每天10点40执行阅读均值任务
+40 10 * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_account_avg_v3.sh
+
+# 每天11点执行文章联想任务
+0 11 * * * bash /root/luojunhui/LongArticlesJob/sh/run_article_association.sh
+
+# 每4小时(第24分钟)校验一次发布视频的审核状态;原每小时执行的脚本已注释停用
+# 20 * * * * bash /root/luojunhui/LongArticlesJob/sh/run_check_video_status_hourly.sh
+24 */4 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "check_publish_video_audit_status"}'
+
+
+# 每天 1:00、8:00、19:00 执行视频发布和审核流程
+0 1,8,19 * * * bash /root/luojunhui/LongArticlesJob/sh/run_video_publish_and_audit.sh
+
+# 每天上午8:30、下午2:20、晚上8:50执行(以下三条脚本任务已注释停用)
+
+# 30 8 * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_published_articles_daily.sh
+# 20 14 * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_published_articles_daily.sh
+# 50 20 * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_published_articles_daily.sh
+
+0 8,15,21 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "daily_publish_articles_recycle"}'
+10 22 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "daily_publish_articles_recycle"}'
+30 9,16,21 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_root_source_id"}'
+
+30 22 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "update_root_source_id"}'
+# 每天上午9点,下午2点,晚上9点执行v2代码
+# 0 9,14,21 * * * bash /root/luojunhui/LongArticlesJob/sh/run_update_published_articles_daily_v2.sh
+
+
+# 每天上午 9 点、下午 3 点、晚上 7 点执行下架视频任务
+
+# 30 9 * * * bash /root/luojunhui/LongArticlesJob/sh/run_get_off_videos_three_times_per_day.sh
+
+# 0 15 * * * bash /root/luojunhui/LongArticlesJob/sh/run_get_off_videos_three_times_per_day.sh
+
+# 0 19 * * * bash /root/luojunhui/LongArticlesJob/sh/run_get_off_videos_three_times_per_day.sh
+
+0 9,15,19 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "get_off_videos"}'
+
+# 每天上午10点、下午4点、晚上8点执行内部文章监测
+
+# 0 10,16,20 * * * bash /root/luojunhui/LongArticlesJob/sh/published_articles_monitor.sh
+0 10,16,20 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "inner_article_monitor"}'
+
+# 每天 0:20、12:20 执行百度视频抓取
+20 0,12 * * * bash /root/luojunhui/LongArticlesJob/sh/run_baidu_video_crawler.sh
+
+# check kimi balance hourly
+
+# 30 * * * * bash /root/luojunhui/LongArticlesJob/sh/run_kimi_balance_monitor.sh
+# 每4h校验一次kimi余额
+25 */4 * * * curl -X POST http://127.0.0.1:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "check_kimi_balance"}'
+
+0 11,23 * * * bash /root/luojunhui/LongArticlesJob/sh/run_account_explore.sh
+
+# 0 5,10,15,20 * * * bash /root/luojunhui/LongArticlesJob/sh/run_account_quality_analysis.sh
+
+# 更新小程序信息
+13 3,4,5 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "mini_program_detail_process"}'
+
+
+# */8 * * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "extract_title_features", "batch_size": 10}'
+
+# 候选账号质量分析
+0 5,10,15,20 * * * curl -X POST http://192.168.142.66:6060/api/run_task -H "Content-Type: application/json" -d '{"task_name": "candidate_account_quality_analysis"}'