Bläddra i källkod

feat:添加增量训练脚本

zhaohaipeng 9 månader sedan
förälder
incheckning
79c4224b59
1 ändrad fil med 6 tillägg och 5 borttagningar
  1. 6 5
      ad/20_ad_increment_model_train_predict_auc.sh

+ 6 - 5
ad/20_ad_increment_model_train_predict_auc.sh

@@ -2,12 +2,13 @@
 
 # 模型训练,预测,计算AUC脚本
 
-# set -x
+set -x
 
 begin_date=$1
 end_date=$2
 model_name=$3
-dim=$4
+train_dim=$4
+predict_dim=$5
 
 PROJECT_HOME=/root/zhaohp/recommend-emr-dataprocess
 HADOOP=/opt/apps/HADOOP-COMMON/hadoop-common-current/bin/hadoop
@@ -28,7 +29,7 @@ predict_auc() {
     predict_end_date=$(date -d "$end_date +1 day" +%Y%m%d)
     while [ "$predict_date" != "$predict_end_date" ]; do
 
-        $HADOOP fs -text ${HDFS_TRAIN_DATE_PATH}/${predict_date}/* | ${FM_PREDICT} -m ${MODEL_PATH}/${model_name}_${train_date}.txt -dim ${dim} -core 8 -out ${PREDICT_PATH}/${model_name}_${train_date}.txt
+        $HADOOP fs -text ${HDFS_TRAIN_DATE_PATH}/${predict_date}/* | ${FM_PREDICT} -m ${MODEL_PATH}/${model_name}_${train_date}.txt -dim ${predict_dim} -core 8 -out ${PREDICT_PATH}/${model_name}_${train_date}.txt
         auc=`cat ${PREDICT_PATH}/${model_name}_${train_date}.txt | /root/sunmingze/AUC/AUC`
 
         echo "模型训练日期: ${train_date}, 模型预测日期: ${predict_date}, AUC: ${auc}, 模型路径: ${MODEL_PATH}/${model_name}_${train_date}.txt"
@@ -48,10 +49,10 @@ main() {
         echo "==================== 开始训练 $train_date 模型 ===================="
 
         if [ "$train_date" == "$begin_date" ]; then
-            $HADOOP fs -text ${HDFS_TRAIN_DATE_PATH}/${train_date}/* | ${FM_TRAIN} -m ${MODEL_PATH}/${model_name}_${train_date}.txt -dim ${dim} -core 8
+            $HADOOP fs -text ${HDFS_TRAIN_DATE_PATH}/${train_date}/* | ${FM_TRAIN} -m ${MODEL_PATH}/${model_name}_${train_date}.txt -dim ${train_dim} -core 8
         else
             yesterday=$(date -d "$train_date -1 day" +%Y%m%d)
-            $HADOOP fs -text ${HDFS_TRAIN_DATE_PATH}/${train_date}/* | ${FM_TRAIN} -m ${MODEL_PATH}/${model_name}_${train_date}.txt -dim ${dim} -core 8 -im ${MODEL_PATH}/${model_name}_${yesterday}.txt
+            $HADOOP fs -text ${HDFS_TRAIN_DATE_PATH}/${train_date}/* | ${FM_TRAIN} -m ${MODEL_PATH}/${model_name}_${train_date}.txt -dim ${train_dim} -core 8 -im ${MODEL_PATH}/${model_name}_${yesterday}.txt
         fi
 
         predict_auc