long_articles_job.py 2.7 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788
  1. from argparse import ArgumentParser
  2. from tasks.crawler_tasks.crawler_video.crawler_piaoquan_videos import (
  3. CrawlerPiaoQuanVideos,
  4. )
  5. from tasks.crawler_tasks.crawler_video.crawler_sohu_videos import CrawlerSohuHotVideos
  6. from tasks.crawler_tasks.crawler_video.crawler_sohu_videos import (
  7. CrawlerSohuRecommendVideos,
  8. )
  9. from tasks.crawler_tasks.crawler_video.crawler_sph_videos import (
  10. CrawlerChannelAccountVideos,
  11. )
  12. from tasks.data_tasks.fwh_data_recycle import FwhGroupPublishRecordManager
  13. from tasks.data_tasks.fwh_data_recycle import SaveFwhDataToDatabase
  14. from tasks.monitor_tasks.kimi_balance_monitor import check_kimi_balance
  15. from tasks.publish_tasks.top_article_generalize import (
  16. TopArticleGeneralizeFromArticlePool,
  17. )
  18. def run_piaoquan_video_crawler():
  19. crawler = CrawlerPiaoQuanVideos()
  20. crawler.deal()
  21. def run_sohu_video_crawler():
  22. # step1, crawl sohu hot videos
  23. crawler_sohu_hot_videos = CrawlerSohuHotVideos()
  24. crawler_sohu_hot_videos.deal()
  25. # step2, crawl sohu recommend videos
  26. crawler_sohu_recommend_videos = CrawlerSohuRecommendVideos()
  27. crawler_sohu_recommend_videos.deal()
  28. def run_sph_video_crawler():
  29. crawler_channel_account_videos = CrawlerChannelAccountVideos()
  30. crawler_channel_account_videos.deal()
  31. def run_fwh_data_manager():
  32. fwh_group_publish_record_manager = FwhGroupPublishRecordManager()
  33. fwh_group_publish_record_manager.deal()
  34. fwh_group_publish_record_manager.monitor()
  35. # 2. 保存数据到数据库
  36. save_fwh_data_to_database = SaveFwhDataToDatabase()
  37. save_fwh_data_to_database.deal()
  38. def run_top_article_generalize_from_article_pool():
  39. TopArticleGeneralizeFromArticlePool().deal()
  40. def main():
  41. """
  42. run long_articles_job
  43. """
  44. parser = ArgumentParser()
  45. parser.add_argument("--task_name", help="which task you want to run")
  46. parser.add_argument("--run_date", help="task specify run date")
  47. args = parser.parse_args()
  48. task_name = args.task_name
  49. if task_name is None:
  50. print("task_name cannot be None")
  51. return
  52. else:
  53. match task_name:
  54. case "run_piaoquan_video_crawler":
  55. run_piaoquan_video_crawler()
  56. case "run_sohu_video_crawler":
  57. run_sohu_video_crawler()
  58. case "run_check_kimi_balance":
  59. check_kimi_balance()
  60. case "run_fwh_data_manager":
  61. run_fwh_data_manager()
  62. case "run_sph_video_crawler":
  63. run_sph_video_crawler()
  64. case "top":
  65. run_top_article_generalize_from_article_pool()
  66. case _:
  67. print("task_name cannot be None")
  68. if __name__ == "__main__":
  69. main()