|
@@ -62,8 +62,8 @@ object train_01_xgb_ad_20240808{
|
|
|
println("zhangbo:train data size:" + trainData.count())
|
|
|
|
|
|
val fields = Array(
|
|
|
- DataTypes.createStructField("label", DataTypes.IntegerType, true),
|
|
|
- DataTypes.createStructField("logKey", DataTypes.IntegerType, true)
|
|
|
+ DataTypes.createStructField("label", DataTypes.IntegerType, true)
|
|
|
+// DataTypes.createStructField("logKey", DataTypes.IntegerType, true)
|
|
|
|
|
|
) ++ features.map(f => DataTypes.createStructField(f, DataTypes.DoubleType, true))
|
|
|
val schema = DataTypes.createStructType(fields)
|
|
@@ -138,11 +138,11 @@ object train_01_xgb_ad_20240808{
|
|
|
featureMap.put(kv_(0), kv_(1).toDouble)
|
|
|
}
|
|
|
})
|
|
|
- val v: Array[Any] = new Array[Any](features.length + 2)
|
|
|
+ val v: Array[Any] = new Array[Any](features.length + 1)
|
|
|
v(0) = label
|
|
|
- v(1) = cid
|
|
|
+// v(1) = cid
|
|
|
for (i <- 0 until features.length) {
|
|
|
- v(i + 2) = featureMap.getOrElse(r, 0.0D)
|
|
|
+ v(i + 1) = featureMap.getOrElse(r, 0.0D)
|
|
|
}
|
|
|
Row(v: _*)
|
|
|
})
|