Explorar el Código

feat:添加新的分桶任务

zhaohaipeng hace 1 mes
padre
commit
c7a26559cd

+ 10 - 1
recommend/23_str_train_data_make.sh

@@ -17,4 +17,13 @@ for dt in "${dts[@]}"; do
 
     echo "${dt} 负样本采样完成"
 
-done
+done
+
+
+/opt/apps/SPARK2/spark-2.4.8-hadoop3.2-1.0.8/bin/spark-class2 org.apache.spark.deploy.SparkSubmit \
+--class com.aliyun.odps.spark.examples.makedata_recsys.v20250218.makedata_recsys_43_str_data_bucket_20250218 \
+--master yarn --driver-memory 4G --executor-memory 8G --executor-cores 1 --num-executors 16 \
+./target/spark-examples-1.0.0-SNAPSHOT-shaded.jar \
+readPath:/dw/recommend/model/41_recsys_sample_data/ \
+savePath:/dw/recommend/model/43_recsys_str_data_bucket/ \
+beginStr:20250224 endStr:20250302 whatLabel:is_share fileName:20250218_bucket_322.txt

+ 1 - 1
src/main/scala/com/aliyun/odps/spark/examples/makedata_recsys/v20250218/makedata_recsys_43_bucketData_20250218.scala → src/main/scala/com/aliyun/odps/spark/examples/makedata_recsys/v20250218/makedata_recsys_43_str_data_bucket_20250218.scala

@@ -13,7 +13,7 @@ import scala.collection.mutable.ArrayBuffer
 
  */
 
-object makedata_recsys_43_bucketData_20250218 {
+object makedata_recsys_43_str_data_bucket_20250218 {
   def main(args: Array[String]): Unit = {
 
     // 1 读取参数