瀏覽代碼

generate label for mysql

罗俊辉 1 年之前
父節點
當前提交
b7704e14f5
共有 1 個文件被更改,包括 2 次插入和 2 次删除
  1. 2 2
      process_data.py

+ 2 - 2
process_data.py

@@ -242,10 +242,10 @@ class UserProcess(object):
         three_date_before = dt_time + datetime.timedelta(days=4)
         temp_time = three_date_before.strftime("%Y%m%d")
         if flag == "train":
-            sql = "select video_title, label, uid, channel, user_fans, user_view_30, user_share_30, user_return_30, user_rov, user_str, user_return_videos_30, user_return_videos_3, user_return_3, user_view_3, user_share_3, address from lightgbm_data where type = 'userupload' and daily_dt_str >= '20240305';"
+            sql = "select video_title, label, user_id, channel, user_fans, user_view_30, user_share_30, user_return_30, user_rov, user_str, user_return_videos_30, user_return_videos_3, user_return_3, user_view_3, user_share_3, address from lightgbm_data where type = 'userupload' and daily_dt_str >= '20240305';"
             des_path = "data/train_data/spider_train_{}".format(datetime.datetime.today().strftime("%Y%m%d"))
         elif flag == "predict":
-            sql = f"""select video_title, label, uid, channel, user_fans, user_view_30, user_share_30, user_return_30, user_rov, user_str, user_return_videos_30, user_return_videos_3, user_return_3, user_view_3, user_share_3, address from lightgbm_data where type = 'userupload' and daily_dt_str = '{temp_time}';"""
+            sql = f"""select video_title, label, user_id, channel, user_fans, user_view_30, user_share_30, user_return_30, user_rov, user_str, user_return_videos_30, user_return_videos_3, user_return_3, user_view_3, user_share_3, address from lightgbm_data where type = 'userupload' and daily_dt_str = '{temp_time}';"""
             des_path = "data/predict_data/predict_{}.json".format(dt_time.strftime("%Y%m%d"))
         else:
             return