|
@@ -1,7 +1,9 @@
|
|
|
|
|
+import time
|
|
|
from argparse import ArgumentParser
|
|
from argparse import ArgumentParser
|
|
|
|
|
|
|
|
from cold_start.crawler.baidu import BaiduVideoCrawler
|
|
from cold_start.crawler.baidu import BaiduVideoCrawler
|
|
|
from tasks.ai_tasks import run_title_similarity_task
|
|
from tasks.ai_tasks import run_title_similarity_task
|
|
|
|
|
+from tasks.safety_tasks import GetOffVideos
|
|
|
from tasks.crawler_tasks.crawler_video.crawler_piaoquan_videos import (
|
|
from tasks.crawler_tasks.crawler_video.crawler_piaoquan_videos import (
|
|
|
CrawlerPiaoQuanVideos,
|
|
CrawlerPiaoQuanVideos,
|
|
|
)
|
|
)
|
|
@@ -20,8 +22,12 @@ from tasks.crawler_tasks.crawler_video.crawler_gzh_videos import CrawlerGzhMetaV
|
|
|
from tasks.data_tasks.fwh_data_recycle import FwhGroupPublishRecordManager
|
|
from tasks.data_tasks.fwh_data_recycle import FwhGroupPublishRecordManager
|
|
|
from tasks.data_tasks.fwh_data_recycle import SaveFwhDataToDatabase
|
|
from tasks.data_tasks.fwh_data_recycle import SaveFwhDataToDatabase
|
|
|
from tasks.data_tasks.fwh_data_recycle import FwhGroupPublishMonitor
|
|
from tasks.data_tasks.fwh_data_recycle import FwhGroupPublishMonitor
|
|
|
|
|
+
|
|
|
from tasks.monitor_tasks.kimi_balance_monitor import check_kimi_balance
|
|
from tasks.monitor_tasks.kimi_balance_monitor import check_kimi_balance
|
|
|
-from tasks.monitor_tasks.outside_server_accounts_monitor import run_outside_server_accounts_monitor
|
|
|
|
|
|
|
+from tasks.monitor_tasks.outside_server_accounts_monitor import (
|
|
|
|
|
+ run_outside_server_accounts_monitor,
|
|
|
|
|
+)
|
|
|
|
|
+
|
|
|
from tasks.publish_tasks.top_article_generalize import (
|
|
from tasks.publish_tasks.top_article_generalize import (
|
|
|
TopArticleGeneralizeFromArticlePool,
|
|
TopArticleGeneralizeFromArticlePool,
|
|
|
)
|
|
)
|
|
@@ -83,6 +89,10 @@ def run_top_article_generalize_from_article_pool():
|
|
|
task.deal()
|
|
task.deal()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def run_get_off_videos():
    """Create a GetOffVideos instance (no arguments) and call its deal() method."""
    get_off_task = GetOffVideos()
    get_off_task.deal()
|
|
|
|
|
+
|
|
|
|
|
+
|
|
|
def main():
|
|
def main():
|
|
|
"""
|
|
"""
|
|
|
run long_articles_job
|
|
run long_articles_job
|
|
@@ -102,26 +112,40 @@ def main():
|
|
|
match task_name:
|
|
match task_name:
|
|
|
case "run_piaoquan_video_crawler":
|
|
case "run_piaoquan_video_crawler":
|
|
|
crawler.run_piaoquan_video_crawler()
|
|
crawler.run_piaoquan_video_crawler()
|
|
|
|
|
+
|
|
|
case "run_sohu_video_crawler":
|
|
case "run_sohu_video_crawler":
|
|
|
crawler.run_sohu_video_crawler()
|
|
crawler.run_sohu_video_crawler()
|
|
|
|
|
+
|
|
|
case "run_sph_video_crawler":
|
|
case "run_sph_video_crawler":
|
|
|
crawler.run_sph_video_crawler()
|
|
crawler.run_sph_video_crawler()
|
|
|
|
|
+
|
|
|
case "crawler_gzh_meta_videos":
|
|
case "crawler_gzh_meta_videos":
|
|
|
crawler.crawler_gzh_meta_videos()
|
|
crawler.crawler_gzh_meta_videos()
|
|
|
|
|
+
|
|
|
case "run_toutiao_video_crawler":
|
|
case "run_toutiao_video_crawler":
|
|
|
crawler.run_toutiao_video_crawler()
|
|
crawler.run_toutiao_video_crawler()
|
|
|
|
|
+
|
|
|
case "run_baidu_video_crawler":
|
|
case "run_baidu_video_crawler":
|
|
|
crawler.run_baidu_video_crawler()
|
|
crawler.run_baidu_video_crawler()
|
|
|
|
|
+
|
|
|
case "run_check_kimi_balance":
|
|
case "run_check_kimi_balance":
|
|
|
check_kimi_balance()
|
|
check_kimi_balance()
|
|
|
|
|
+
|
|
|
case "run_fwh_data_manager":
|
|
case "run_fwh_data_manager":
|
|
|
run_fwh_data_manager()
|
|
run_fwh_data_manager()
|
|
|
|
|
+
|
|
|
case "run_title_similarity_task":
|
|
case "run_title_similarity_task":
|
|
|
run_title_similarity_task()
|
|
run_title_similarity_task()
|
|
|
|
|
+
|
|
|
case "top_article_generalize":
|
|
case "top_article_generalize":
|
|
|
run_top_article_generalize_from_article_pool()
|
|
run_top_article_generalize_from_article_pool()
|
|
|
|
|
+
|
|
|
|
|
+ case "run_get_off_videos":
|
|
|
|
|
+ run_get_off_videos()
|
|
|
|
|
+
|
|
|
case "run_outside_server_accounts_monitor":
|
|
case "run_outside_server_accounts_monitor":
|
|
|
run_outside_server_accounts_monitor()
|
|
run_outside_server_accounts_monitor()
|
|
|
|
|
+
|
|
|
case _:
|
|
case _:
|
|
|
print("task_name cannot be None")
|
|
print("task_name cannot be None")
|
|
|
|
|
|