|
@@ -4,6 +4,8 @@
|
|
import os
|
|
import os
|
|
import sys
|
|
import sys
|
|
import time
|
|
import time
|
|
|
|
+from hashlib import md5
|
|
|
|
+
|
|
sys.path.append(os.getcwd())
|
|
sys.path.append(os.getcwd())
|
|
from common.common import Common
|
|
from common.common import Common
|
|
from common.scheduling_db import MysqlHelper, RedisHelper
|
|
from common.scheduling_db import MysqlHelper, RedisHelper
|
|
@@ -96,7 +98,37 @@ class SchedulingV3:
|
|
oss_endpoint = "out"
|
|
oss_endpoint = "out"
|
|
|
|
|
|
# 正式环境,调度任务
|
|
# 正式环境,调度任务
|
|
- Common.logger(log_type, crawler).info(f"开始调度任务:{task}\n")
|
|
|
|
|
|
+ Common.logger(log_type, crawler).info(f"开始调度任务")
|
|
|
|
+ # task_str = [
|
|
|
|
+ # ('task_id', str(task['id'])),
|
|
|
|
+ # ('task_name', str(task['task_name'])),
|
|
|
|
+ # ('source', str(task['source'])),
|
|
|
|
+ # ('start_time', str(task['start_time'])),
|
|
|
|
+ # ('interval', str(task['interval'])),
|
|
|
|
+ # ('mode', str(task['mode'])),
|
|
|
|
+ # ('duration_min', eval(task['rule'])['duration']['min']),
|
|
|
|
+ # ('duration_max', eval(task['rule'])['duration']['max']),
|
|
|
|
+ # ('play_cnt_min', eval(task['rule'])['playCnt']['min']),
|
|
|
|
+ # ('play_cnt_max', eval(task['rule'])['playCnt']['max']),
|
|
|
|
+ # ('publish_day_min', eval(task['rule'])['period']['min']),
|
|
|
|
+ # ('publish_day_max', eval(task['rule'])['period']['max']),
|
|
|
|
+ # ('fans_min', eval(task['rule'])['fans']['min']),
|
|
|
|
+ # ('fans_max', eval(task['rule'])['fans']['max']),
|
|
|
|
+ # ('videos_min', eval(task['rule'])['videos']['min']),
|
|
|
|
+ # ('videos_max', eval(task['rule'])['videos']['max']),
|
|
|
|
+ # ('video_like_min', eval(task['rule'])['like']['min']),
|
|
|
|
+ # ('video_like_max', eval(task['rule'])['like']['max']),
|
|
|
|
+ # ('video_width_min', eval(task['rule'])['videoWidth']['min']),
|
|
|
|
+ # ('video_width_max', eval(task['rule'])['videoWidth']['max']),
|
|
|
|
+ # ('video_height_min', eval(task['rule'])['videoHeight']['min']),
|
|
|
|
+ # ('video_height_max', eval(task['rule'])['videoHeight']['max']),
|
|
|
|
+ # ('spider_name', str(task['spider_name'])),
|
|
|
|
+ # ('machine', str(task['machine'])),
|
|
|
|
+ # ('status', str(task['status'])),
|
|
|
|
+ # ('create_time', str(task['create_time'])),
|
|
|
|
+ # ('update_time', str(task['update_time'])),
|
|
|
|
+ # ('operator', str(task['operator']))
|
|
|
|
+ # ]
|
|
task_str = [
|
|
task_str = [
|
|
('task_id', str(task['id'])),
|
|
('task_id', str(task['id'])),
|
|
('task_name', str(task['task_name'])),
|
|
('task_name', str(task['task_name'])),
|
|
@@ -104,22 +136,7 @@ class SchedulingV3:
|
|
('start_time', str(task['start_time'])),
|
|
('start_time', str(task['start_time'])),
|
|
('interval', str(task['interval'])),
|
|
('interval', str(task['interval'])),
|
|
('mode', str(task['mode'])),
|
|
('mode', str(task['mode'])),
|
|
- ('duration_min', eval(task['rule'])['duration']['min']),
|
|
|
|
- ('duration_max', eval(task['rule'])['duration']['max']),
|
|
|
|
- ('play_cnt_min', eval(task['rule'])['playCnt']['min']),
|
|
|
|
- ('play_cnt_max', eval(task['rule'])['playCnt']['max']),
|
|
|
|
- ('publish_day_min', eval(task['rule'])['period']['min']),
|
|
|
|
- ('publish_day_max', eval(task['rule'])['period']['max']),
|
|
|
|
- ('fans_min', eval(task['rule'])['fans']['min']),
|
|
|
|
- ('fans_max', eval(task['rule'])['fans']['max']),
|
|
|
|
- ('videos_min', eval(task['rule'])['videos']['min']),
|
|
|
|
- ('videos_max', eval(task['rule'])['videos']['max']),
|
|
|
|
- ('video_like_min', eval(task['rule'])['like']['min']),
|
|
|
|
- ('video_like_max', eval(task['rule'])['like']['max']),
|
|
|
|
- ('video_width_min', eval(task['rule'])['videoWidth']['min']),
|
|
|
|
- ('video_width_max', eval(task['rule'])['videoWidth']['max']),
|
|
|
|
- ('video_height_min', eval(task['rule'])['videoHeight']['min']),
|
|
|
|
- ('video_height_max', eval(task['rule'])['videoHeight']['max']),
|
|
|
|
|
|
+ ('rule', task['rule']),
|
|
('spider_name', str(task['spider_name'])),
|
|
('spider_name', str(task['spider_name'])),
|
|
('machine', str(task['machine'])),
|
|
('machine', str(task['machine'])),
|
|
('status', str(task['status'])),
|
|
('status', str(task['status'])),
|
|
@@ -127,17 +144,18 @@ class SchedulingV3:
|
|
('update_time', str(task['update_time'])),
|
|
('update_time', str(task['update_time'])),
|
|
('operator', str(task['operator']))
|
|
('operator', str(task['operator']))
|
|
]
|
|
]
|
|
- task_str = str(task_str).replace(' ', '')
|
|
|
|
- cmd = f"""sh scheduling/scheduling_main/scheduling_v3.sh {source}/{source}_main/{spider_name}.py --log_type="{mode}" --crawler="{source}" --task="{task_str}" --oss_endpoint="{oss_endpoint}" --env="{env}" >>{source}/logs/{source}-scheduling.log """
|
|
|
|
- Common.logger(log_type, crawler).info(f"cmd:{cmd}\n")
|
|
|
|
|
|
+ task_str = str(task_str).replace(' ', '').replace('"', "'").replace("\/", "").replace("/", "")
|
|
|
|
+ cmd = f"""sh scheduling/scheduling_v3/scheduling_v3.sh {source}/{source}_main/{spider_name}.py --log_type="{mode}" --crawler="{source}" --task="{task_str}" --oss_endpoint="{oss_endpoint}" --env="{env}" {source}/logs/{source}-{mode}-scheduling.log """
|
|
|
|
+ Common.logger(log_type, crawler).info(f"cmd:{cmd}")
|
|
os.system(cmd)
|
|
os.system(cmd)
|
|
|
|
+ Common.logger(log_type, crawler).info(f"调度任务结束")
|
|
|
|
|
|
|
|
|
|
if __name__ == "__main__":
|
|
if __name__ == "__main__":
|
|
# print(Scheduling.get_task("scheduling", "scheduling", "dev"))
|
|
# print(Scheduling.get_task("scheduling", "scheduling", "dev"))
|
|
# Scheduling.update_task("scheduling", "scheduling", 8, 1681833600000, 1, "dev")
|
|
# Scheduling.update_task("scheduling", "scheduling", 8, 1681833600000, 1, "dev")
|
|
- # Scheduling.write_redis("scheduling", "scheduling", "dev")
|
|
|
|
- # print(Scheduling.get_redis("scheduling", "scheduling", "dev"))
|
|
|
|
- SchedulingV3.scheduling_task("scheduling", "scheduling", "dev")
|
|
|
|
|
|
+ SchedulingV3.write_redis("scheduling", "scheduling", "dev")
|
|
|
|
+ # print(SchedulingV3.get_redis("scheduling", "scheduling", "dev"))
|
|
|
|
+ # SchedulingV3.scheduling_task("scheduling", "scheduling", "dev")
|
|
pass
|
|
pass
|
|
|
|
|