فهرست منبع

no bucket option

jch 2 ماه پیش
والد
کامیت
5befd4ffcb

+ 6 - 2
src/main/scala/com/aliyun/odps/spark/examples/makedata_recsys_r_rate/makedata_recsys_61_nor_sample_20241209.scala

@@ -24,6 +24,7 @@ object makedata_recsys_61_nor_sample_20241209 {
     val whatLabel = param.getOrElse("whatLabel", "total_return_uv_new")
     val whatApps = param.getOrElse("whatApps", "0,4,5,21,3,6").split(",").toSet
     val fuSampleRate = param.getOrElse("fuSampleRate", "-1.0").toDouble
+    val notUseBucket = param.getOrElse("notUseBucket", "0").toInt
     val featureNameFile = param.getOrElse("featureName", "20241209_recsys_nor_name.txt")
     val featureBucketFile = param.getOrElse("featureBucket", "20241209_recsys_nor_bucket.txt")
 
@@ -35,7 +36,7 @@ object makedata_recsys_61_nor_sample_20241209 {
 
     val loader = getClass.getClassLoader
     val featureNameSet = loadUseFeatureNames(loader, featureNameFile)
-    val featureBucketMap = loadUseFeatureBuckets(loader, featureBucketFile)
+    val featureBucketMap = loadUseFeatureBuckets(loader, notUseBucket, featureBucketFile)
     val bucketsMap_br = sc.broadcast(featureBucketMap)
 
     val dateRange = MyDateUtils.getDateRange(beginStr, endStr)
@@ -131,7 +132,10 @@ object makedata_recsys_61_nor_sample_20241209 {
       .toSet
   }
 
-  private def loadUseFeatureBuckets(loader: ClassLoader, nameFile: String): Map[String, (Double, Array[Double])] = {
+  private def loadUseFeatureBuckets(loader: ClassLoader, notUseBucket: Int, nameFile: String): Map[String, (Double, Array[Double])] = {
+    if (notUseBucket > 0) {
+      return Map[String, (Double, Array[Double])]()
+    }
     val buckets = loadFileData(loader, nameFile)
     println(buckets)
     buckets.split("\n")

+ 6 - 2
src/main/scala/com/aliyun/odps/spark/examples/makedata_recsys_r_rate/makedata_recsys_61_rov_sample_20241209.scala

@@ -28,6 +28,7 @@ object makedata_recsys_61_rov_sample_20241209 {
     val whatLabel = param.getOrElse("whatLabel", "is_return")
     val whatApps = param.getOrElse("whatApps", "0,4,5,21,3,6").split(",").toSet
     val fuSampleRate = param.getOrElse("fuSampleRate", "1.0").toDouble
+    val notUseBucket = param.getOrElse("notUseBucket", "0").toInt
     val featureNameFile = param.getOrElse("featureName", "20241209_recsys_rov_name.txt")
     val featureBucketFile = param.getOrElse("featureBucket", "20241209_recsys_rov_bucket.txt")
 
@@ -39,7 +40,7 @@ object makedata_recsys_61_rov_sample_20241209 {
 
     val loader = getClass.getClassLoader
     val featureNameSet = loadUseFeatureNames(loader, featureNameFile)
-    val featureBucketMap = loadUseFeatureBuckets(loader, featureBucketFile)
+    val featureBucketMap = loadUseFeatureBuckets(loader, notUseBucket, featureBucketFile)
     val bucketsMap_br = sc.broadcast(featureBucketMap)
 
     val dateRange = MyDateUtils.getDateRange(beginStr, endStr)
@@ -135,7 +136,10 @@ object makedata_recsys_61_rov_sample_20241209 {
       .toSet
   }
 
-  private def loadUseFeatureBuckets(loader: ClassLoader, nameFile: String): Map[String, (Double, Array[Double])] = {
+  private def loadUseFeatureBuckets(loader: ClassLoader, notUseBucket: Int, nameFile: String): Map[String, (Double, Array[Double])] = {
+    if (notUseBucket > 0) {
+      return Map[String, (Double, Array[Double])]()
+    }
     val buckets = loadFileData(loader, nameFile)
     println(buckets)
     buckets.split("\n")