|
@@ -66,13 +66,13 @@ object makedata_recsys_61_nor_sample_20241209 {
|
|
|
.map {
|
|
|
case (logKey, labelKey, features) =>
|
|
|
val label = JSON.parseObject(labelKey).getOrDefault(whatLabel, "0").toString.toDouble
|
|
|
- (label, features)
|
|
|
+ (logKey, label, features)
|
|
|
}
|
|
|
.mapPartitions(row => {
|
|
|
val result = new ArrayBuffer[String]()
|
|
|
val bucketsMap = bucketsMap_br.value
|
|
|
row.foreach {
|
|
|
- case (label, features) =>
|
|
|
+ case (logKey, label, features) =>
|
|
|
val featuresBucket = features.map {
|
|
|
case (name, score) =>
|
|
|
if (!featureNameSet.contains(name)) {
|
|
@@ -91,7 +91,7 @@ object makedata_recsys_61_nor_sample_20241209 {
|
|
|
}
|
|
|
}
|
|
|
}.filter(_.nonEmpty)
|
|
|
- result.add(label + "\t" + featuresBucket.mkString("\t"))
|
|
|
+ result.add(logKey + "\t" + label + "\t" + featuresBucket.mkString("\t"))
|
|
|
}
|
|
|
result.iterator
|
|
|
})
|