Jelajahi Sumber

feat:补数据

zhaohaipeng 6 bulan lalu
induk
komit
9cd736a3ac
2 file diubah dengan 28 penambahan dan 2 penghapusan
  1. 2 0
      ad/01_ad_model_update.sh
  2. 26 2
      ad/25_ad_data_make.sh

+ 2 - 0
ad/01_ad_model_update.sh

@@ -31,6 +31,8 @@ MODEL_OSS_PATH=oss://art-recommend.oss-cn-hangzhou.aliyuncs.com/zhangbo/
 model_name=model_xgb_351_1000_v2
 # 本地保存HDFS模型路径文件,测试时修改为其他模型名,避免影响线上
 model_path_file=${model_local_home}/online_model_path.txt
+# 获取当前是星期几,1表示星期一
+current_day_of_week="$(date +"%u")"
 
 # 任务开始时间
 start_time=$(date +%s)

+ 26 - 2
ad/25_ad_data_make.sh

@@ -29,11 +29,35 @@ today_early_1="$(date -d '1 days ago' +%Y%m%d)"
 --master yarn --driver-memory 1G --executor-memory 2G --executor-cores 1 --num-executors 16 \
 ./target/spark-examples-1.0.0-SNAPSHOT-shaded.jar \
 tablePart:64 repartition:32 \
-beginStr:${today_early_1}00 endStr:${today_early_1}23 \
+beginStr:${today_early_1}00 endStr:${today_early_1}12 \
 savePath:${TRAIN_PATH} \
 table:${TABLE} \
 filterHours:00,01,02,03,04,05,06,07 \
-idDefaultValue:0.1
+idDefaultValue:0.1 &
+
+/opt/apps/SPARK2/spark-2.4.8-hadoop3.2-1.0.8/bin/spark-class2 org.apache.spark.deploy.SparkSubmit \
+--class com.aliyun.odps.spark.examples.makedata_ad.v20240718.makedata_ad_31_originData_20240718 \
+--master yarn --driver-memory 1G --executor-memory 2G --executor-cores 1 --num-executors 16 \
+./target/spark-examples-1.0.0-SNAPSHOT-shaded.jar \
+tablePart:64 repartition:32 \
+beginStr:${today_early_1}13 endStr:${today_early_1}18 \
+savePath:${TRAIN_PATH} \
+table:${TABLE} \
+filterHours:00,01,02,03,04,05,06,07 \
+idDefaultValue:0.1 &
+
+/opt/apps/SPARK2/spark-2.4.8-hadoop3.2-1.0.8/bin/spark-class2 org.apache.spark.deploy.SparkSubmit \
+--class com.aliyun.odps.spark.examples.makedata_ad.v20240718.makedata_ad_31_originData_20240718 \
+--master yarn --driver-memory 1G --executor-memory 2G --executor-cores 1 --num-executors 16 \
+./target/spark-examples-1.0.0-SNAPSHOT-shaded.jar \
+tablePart:64 repartition:32 \
+beginStr:${today_early_1}19 endStr:${today_early_1}23 \
+savePath:${TRAIN_PATH} \
+table:${TABLE} \
+filterHours:00,01,02,03,04,05,06,07 \
+idDefaultValue:0.1 &
+
+wait
 
 /opt/apps/SPARK2/spark-2.4.8-hadoop3.2-1.0.8/bin/spark-class2 org.apache.spark.deploy.SparkSubmit \
 --class com.aliyun.odps.spark.examples.makedata_ad.v20240718.makedata_ad_33_bucketData_20240718 \