|
@@ -7,6 +7,7 @@ from threading import Timer
|
|
|
from utils import data_check, get_feature_data
|
|
|
from config import set_config
|
|
|
from log import Log
|
|
|
+import ODPSQueryUtil
|
|
|
config_ = set_config()
|
|
|
log_ = Log()
|
|
|
features = ['videoid', 'title', 'video_path']
|
|
@@ -29,7 +30,8 @@ def download_video_from_oss(video_id, video_path, download_folder):
|
|
|
auth = oss2.Auth(access_key_id=config_.OSS_CONFIG['accessKeyId'],
|
|
|
access_key_secret=config_.OSS_CONFIG['accessKeySecret'])
|
|
|
|
|
|
- bucket = oss2.Bucket(auth, endpoint=config_.OSS_CONFIG['endpoint'], bucket_name='art-pubbucket')
|
|
|
+ bucket = oss2.Bucket(
|
|
|
+ auth, endpoint=config_.OSS_CONFIG['endpoint'], bucket_name='art-pubbucket')
|
|
|
|
|
|
|
|
|
|
|
@@ -55,12 +57,14 @@ def download_video_from_oss(video_id, video_path, download_folder):
|
|
|
|
|
|
def download_videos(project, table, dt):
|
|
|
|
|
|
- feature_df = get_feature_data(project=project, table=table, dt=dt, features=features)
|
|
|
+ feature_df = get_feature_data(
|
|
|
+ project=project, table=table, dt=dt, features=features)
|
|
|
download_folder = 'videos'
|
|
|
video_id_list = feature_df['videoid'].to_list()
|
|
|
pool = multiprocessing.Pool(processes=6)
|
|
|
for video_id in video_id_list:
|
|
|
- video_path = feature_df[feature_df['videoid'] == video_id]['video_path'].values[0].strip()
|
|
|
+ video_path = feature_df[feature_df['videoid']
|
|
|
+ == video_id]['video_path'].values[0].strip()
|
|
|
video_path = video_path.replace(' ', '')
|
|
|
print(video_id, video_path)
|
|
|
pool.apply_async(
|
|
@@ -77,7 +81,8 @@ def timer_check():
|
|
|
table = config_.DAILY_VIDEO['table']
|
|
|
now_date = datetime.datetime.today()
|
|
|
print(f"now_date: {datetime.datetime.strftime(now_date, '%Y%m%d')}")
|
|
|
- dt = datetime.datetime.strftime(now_date-datetime.timedelta(days=1), '%Y%m%d')
|
|
|
+ dt = datetime.datetime.strftime(
|
|
|
+ now_date-datetime.timedelta(days=1), '%Y%m%d')
|
|
|
|
|
|
data_count = data_check(project=project, table=table, dt=dt)
|
|
|
if data_count > 0:
|
|
@@ -94,4 +99,38 @@ def timer_check():
|
|
|
|
|
|
|
|
|
if __name__ == '__main__':
|
|
|
- timer_check()
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+ auth = oss2.Auth(access_key_id=config_.OSS_CONFIG['accessKeyId'],
|
|
|
+ access_key_secret=config_.OSS_CONFIG['accessKeySecret'])
|
|
|
+
|
|
|
+ bucket = oss2.Bucket(
|
|
|
+ auth, endpoint=config_.OSS_CONFIG['endpoint'], bucket_name='art-pubbucket')
|
|
|
+
|
|
|
+
|
|
|
+
|
|
|
+ bucket.get_object_to_file(
|
|
|
+ 'longvideo/transcode/video/vpc/20221221/17608628PUf8nomrsSCIhllyT3.mp4', 'videos/17608628PUf8nomrsSCIhllyT3.mp4')
|