Browse Source

i2i样本制作,第4步。连续值分桶

zhangbo 5 months ago
parent
commit
43cd828c0c

+ 3 - 0
src/main/scala/com/aliyun/odps/spark/examples/makedata_dssm/makedata_i2i_04_bucketFile_20241128.scala

@@ -58,6 +58,7 @@ object makedata_i2i_04_bucketFile_20241128 {
               case "vovd1_day7" => result += (("action:vovd1_day7", value))
               case "vovd1_day7" => result += (("action:vovd1_day7", value))
               case "vovd1_day21" => result += (("action:vovd1_day21", value))
               case "vovd1_day21" => result += (("action:vovd1_day21", value))
               case "vovd1_day336" => result += (("action:vovd1_day336", value))
               case "vovd1_day336" => result += (("action:vovd1_day336", value))
+              case _ =>
             }
             }
         }
         }
       })
       })
@@ -82,6 +83,7 @@ object makedata_i2i_04_bucketFile_20241128 {
               case "vovd1_day3" => result += (("cate1:vovd1_day3", value))
               case "vovd1_day3" => result += (("cate1:vovd1_day3", value))
               case "vovd1_day7" => result += (("cate1:vovd1_day7", value))
               case "vovd1_day7" => result += (("cate1:vovd1_day7", value))
               case "vovd1_day30" => result += (("cate1:vovd1_day30", value))
               case "vovd1_day30" => result += (("cate1:vovd1_day30", value))
+              case _ =>
             }
             }
         }
         }
       })
       })
@@ -106,6 +108,7 @@ object makedata_i2i_04_bucketFile_20241128 {
               case "vovd1_day3" => result += (("cate2:vovd1_day3", value))
               case "vovd1_day3" => result += (("cate2:vovd1_day3", value))
               case "vovd1_day7" => result += (("cate2:vovd1_day7", value))
               case "vovd1_day7" => result += (("cate2:vovd1_day7", value))
               case "vovd1_day30" => result += (("cate2:vovd1_day30", value))
               case "vovd1_day30" => result += (("cate2:vovd1_day30", value))
+              case _ =>
             }
             }
         }
         }
       })
       })

+ 2 - 3
src/main/scala/com/aliyun/odps/spark/examples/临时记录的脚本-I2I

@@ -48,7 +48,6 @@ nohup /opt/apps/SPARK2/spark-2.4.8-hadoop3.2-1.0.8/bin/spark-class2 org.apache.s
 --class com.aliyun.odps.spark.examples.makedata_dssm.makedata_i2i_04_bucketFile_20241128 \
 --class com.aliyun.odps.spark.examples.makedata_dssm.makedata_i2i_04_bucketFile_20241128 \
 --master yarn --driver-memory 16G --executor-memory 2G --executor-cores 1 --num-executors 32 \
 --master yarn --driver-memory 16G --executor-memory 2G --executor-cores 1 --num-executors 32 \
 ./target/spark-examples-1.0.0-SNAPSHOT-shaded.jar \
 ./target/spark-examples-1.0.0-SNAPSHOT-shaded.jar \
-readPath:/dw/recommend/model/52_dssm_i2i_joinfeature/20241128* \
+readPath:/dw/recommend/model/52_dssm_i2i_joinfeature/20241126* \
 savePath:/dw/recommend/model/54_dssm_i2i_bucketfile/ \
 savePath:/dw/recommend/model/54_dssm_i2i_bucketfile/ \
-readPath:/dw/recommend/model/53_dssm_i2i_onehot/20241128 \
-fileName:47_rate_v1  bucketNum:100 > p53.log 2>&1 &
+fileName:47_rate_v1  bucketNum:100 > p54.log 2>&1 &