12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788 |
- from argparse import ArgumentParser
- from tasks.crawler_tasks.crawler_video.crawler_piaoquan_videos import (
- CrawlerPiaoQuanVideos,
- )
- from tasks.crawler_tasks.crawler_video.crawler_sohu_videos import CrawlerSohuHotVideos
- from tasks.crawler_tasks.crawler_video.crawler_sohu_videos import (
- CrawlerSohuRecommendVideos,
- )
- from tasks.crawler_tasks.crawler_video.crawler_sph_videos import (
- CrawlerChannelAccountVideos,
- )
- from tasks.data_tasks.fwh_data_recycle import FwhGroupPublishRecordManager
- from tasks.data_tasks.fwh_data_recycle import SaveFwhDataToDatabase
- from tasks.monitor_tasks.kimi_balance_monitor import check_kimi_balance
- from tasks.publish_tasks.top_article_generalize import (
- TopArticleGeneralizeFromArticlePool,
- )
def run_piaoquan_video_crawler():
    """Create a ``CrawlerPiaoQuanVideos`` instance and invoke its ``deal()``."""
    CrawlerPiaoQuanVideos().deal()
def run_sohu_video_crawler():
    """Run the two Sohu video crawlers one after the other.

    The hot-videos crawler is run first, then the recommend-videos crawler;
    each is instantiated and its ``deal()`` method is called.
    """
    # Step 1: crawl sohu hot videos.
    hot_crawler = CrawlerSohuHotVideos()
    hot_crawler.deal()

    # Step 2: crawl sohu recommend videos.
    recommend_crawler = CrawlerSohuRecommendVideos()
    recommend_crawler.deal()
def run_sph_video_crawler():
    """Create a ``CrawlerChannelAccountVideos`` instance and invoke its ``deal()``."""
    CrawlerChannelAccountVideos().deal()
def run_fwh_data_manager():
    """Run the fwh data pipeline in order.

    First the ``FwhGroupPublishRecordManager`` is created and its ``deal()``
    and ``monitor()`` methods are called; afterwards ``SaveFwhDataToDatabase``
    is created and its ``deal()`` method is called.
    """
    # 1. Process the group publish records, then run the monitor step.
    record_manager = FwhGroupPublishRecordManager()
    record_manager.deal()
    record_manager.monitor()

    # 2. Save the data to the database.
    SaveFwhDataToDatabase().deal()
def run_top_article_generalize_from_article_pool():
    """Create a ``TopArticleGeneralizeFromArticlePool`` and invoke its ``deal()``."""
    generalize_task = TopArticleGeneralizeFromArticlePool()
    generalize_task.deal()
- def main():
- """
- run long_articles_job
- """
- parser = ArgumentParser()
- parser.add_argument("--task_name", help="which task you want to run")
- parser.add_argument("--run_date", help="task specify run date")
- args = parser.parse_args()
- task_name = args.task_name
- if task_name is None:
- print("task_name cannot be None")
- return
- else:
- match task_name:
- case "run_piaoquan_video_crawler":
- run_piaoquan_video_crawler()
- case "run_sohu_video_crawler":
- run_sohu_video_crawler()
- case "run_check_kimi_balance":
- check_kimi_balance()
- case "run_fwh_data_manager":
- run_fwh_data_manager()
- case "run_sph_video_crawler":
- run_sph_video_crawler()
- case "top":
- run_top_article_generalize_from_article_pool()
- case _:
- print("task_name cannot be None")
# Run the CLI dispatcher only when this file is executed as a script.
if __name__ == "__main__":
    main()
|