|
@@ -62,7 +62,7 @@ object train_recsys_61_xgb_nor_20241209 {
|
|
println("recsys nor:train data size:" + trainData.count())
|
|
println("recsys nor:train data size:" + trainData.count())
|
|
|
|
|
|
val fields = Array(
|
|
val fields = Array(
|
|
- DataTypes.createStructField("label", DataTypes.IntegerType, true)
|
|
|
|
|
|
+ DataTypes.createStructField("label", DataTypes.DoubleType, true)
|
|
) ++ features.map(f => DataTypes.createStructField(f, DataTypes.DoubleType, true))
|
|
) ++ features.map(f => DataTypes.createStructField(f, DataTypes.DoubleType, true))
|
|
|
|
|
|
val schema = DataTypes.createStructType(fields)
|
|
val schema = DataTypes.createStructType(fields)
|
|
@@ -131,7 +131,7 @@ object train_recsys_61_xgb_nor_20241209 {
|
|
def createData(data: RDD[String], features: Array[String]): RDD[Row] = {
|
|
def createData(data: RDD[String], features: Array[String]): RDD[Row] = {
|
|
data.map(r => {
|
|
data.map(r => {
|
|
val line: Array[String] = StringUtils.split(r, '\t')
|
|
val line: Array[String] = StringUtils.split(r, '\t')
|
|
- val label: Int = NumberUtils.toInt(line(0))
|
|
|
|
|
|
+ val label: Double = NumberUtils.toDouble(line(0))
|
|
val map: util.Map[String, Double] = new util.HashMap[String, Double]
|
|
val map: util.Map[String, Double] = new util.HashMap[String, Double]
|
|
for (i <- 1 until line.length) {
|
|
for (i <- 1 until line.length) {
|
|
val fv: Array[String] = StringUtils.split(line(i), ':')
|
|
val fv: Array[String] = StringUtils.split(line(i), ':')
|