zhangbo 1 년 전
부모
커밋
6bafc9f171
1개의 파일이 변경되었으며, 8줄이 추가되고 8줄이 삭제되었습니다
  1. 8 8
      alg_recsys_recall_tags_videosv2.py

+ 8 - 8
alg_recsys_recall_tags_videosv2.py

@@ -4,7 +4,8 @@ from config import set_config
 from log import Log
 from utils import execute_sql_from_odps
 from db_helper import RedisHelper
-import datetime
+from datetime import datetime, timedelta
+
 from alg_recsys_recall_4h_region_trend import records_process_for_list
 config_, _ = set_config()
 log_ = Log()
@@ -123,17 +124,16 @@ OR      exploded_value = 'P0高风险' \
 def get_video_tags_v2():
     PROJECT = "loghubods"
     TABLE = "loghubods.automated_updates_category_labels_1"
+    now_date = datetime.today()
+    date = datetime.strftime(now_date, '%Y%m%d%H')
     try:
         sql = '''SELECT  videoid
         ,secondary_labels
 FROM    loghubods.automated_updates_category_labels_1
 WHERE   (
-            dt LIKE '2023%'
-            OR      dt LIKE '2024%'
-            OR      dt LIKE '2025%'
-            OR      dt LIKE '2026%'
+            dt LIKE '{}%'
 )
-'''
+'''.format(date)
         print("sql:" + sql)
         records = execute_sql_from_odps(project=PROJECT, sql=sql)
         video_tags_list = []
@@ -159,7 +159,7 @@ def process_and_store(row):
     # log_.info("video-tags写入数据key={},value={}".format(key, tags))
 
 def main():
-    log_.info("开始执行:" + datetime.datetime.now().strftime("%Y-%m-%d %H:%M:%S"))
+    log_.info("开始执行:" + datetime.now().strftime("%Y-%m-%d %H:%M:%S"))
     video_tags_list = get_video_tags()
     video_tags_list2 = get_video_tags_v2()
 
@@ -192,7 +192,7 @@ def main():
     log_.info("video的数据量:{}".format(len(result)))
     records_process_for_list(result, process_and_store, max_size=50, num_workers=8)
     log_.info("video的数据量:{}".format(len(result)))
-    log_.info("完成执行:" + datetime.datetime.now().strftime("%Y-%m-%d %H:%M:%S"))
+    log_.info("完成执行:" + datetime.now().strftime("%Y-%m-%d %H:%M:%S"))
 
 if __name__ == '__main__':
     main()