long_articles_job.py 2.7 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889
  1. from argparse import ArgumentParser
  2. from tasks.crawler_tasks.crawler_video.crawler_piaoquan_videos import (
  3. CrawlerPiaoQuanVideos,
  4. )
  5. from tasks.crawler_tasks.crawler_video.crawler_sohu_videos import CrawlerSohuHotVideos
  6. from tasks.crawler_tasks.crawler_video.crawler_sohu_videos import (
  7. CrawlerSohuRecommendVideos,
  8. )
  9. from tasks.crawler_tasks.crawler_video.crawler_sph_videos import (
  10. CrawlerChannelAccountVideos,
  11. )
  12. from tasks.data_tasks.fwh_data_recycle import FwhGroupPublishRecordManager
  13. from tasks.data_tasks.fwh_data_recycle import SaveFwhDataToDatabase
  14. from tasks.monitor_tasks.kimi_balance_monitor import check_kimi_balance
  15. from tasks.publish_tasks.top_article_generalize import (
  16. TopArticleGeneralizeFromArticlePool,
  17. )
  def run_piaoquan_video_crawler():
      """Create a CrawlerPiaoQuanVideos instance and call its deal() method."""
      CrawlerPiaoQuanVideos().deal()
  def run_sohu_video_crawler():
      """Run the Sohu video crawlers in sequence: hot videos first, then recommend videos."""
      # Each crawler is instantiated right before its deal() call, so the
      # second crawler is only created after the first one has finished.
      for crawler_cls in (CrawlerSohuHotVideos, CrawlerSohuRecommendVideos):
          crawler_cls().deal()
  def run_sph_video_crawler():
      """Create a CrawlerChannelAccountVideos instance and call its deal() method."""
      CrawlerChannelAccountVideos().deal()
  def run_fwh_data_manager():
      """
      Run the FWH data tasks in order.

      First calls deal() and then monitor() on one FwhGroupPublishRecordManager
      instance, then calls deal() on a SaveFwhDataToDatabase instance.
      """
      record_manager = FwhGroupPublishRecordManager()
      record_manager.deal()
      record_manager.monitor()

      # Step 2: save data to the database.
      SaveFwhDataToDatabase().deal()
  def run_top_article_generalize_from_article_pool():
      """Create a TopArticleGeneralizeFromArticlePool instance and call its deal() method."""
      TopArticleGeneralizeFromArticlePool().deal()
  41. def main():
  42. """
  43. run long_articles_job
  44. """
  45. parser = ArgumentParser()
  46. parser.add_argument("--task_name", help="which task you want to run")
  47. parser.add_argument("--run_date", help="task specify run date")
  48. args = parser.parse_args()
  49. task_name = args.task_name
  50. if task_name is None:
  51. print("task_name cannot be None")
  52. return
  53. else:
  54. match task_name:
  55. case "run_piaoquan_video_crawler":
  56. run_piaoquan_video_crawler()
  57. case "run_sohu_video_crawler":
  58. run_sohu_video_crawler()
  59. case "run_check_kimi_balance":
  60. check_kimi_balance()
  61. case "run_fwh_data_manager":
  62. run_fwh_data_manager()
  63. case "run_sph_video_crawler":
  64. run_sph_video_crawler()
  65. case "top_article_generalize":
  66. run_top_article_generalize_from_article_pool()
  67. case _:
  68. print("task_name cannot be None")
  if __name__ == "__main__":
      # Dispatch to the CLI only when this file is executed as a script,
      # not when it is imported as a module.
      main()