|
@@ -71,7 +71,7 @@ object train_recsys_61_xgb_rov_20241209 {
|
|
val schema = DataTypes.createStructType(fields)
|
|
val schema = DataTypes.createStructType(fields)
|
|
val trainDataSet: Dataset[Row] = spark.createDataFrame(trainData, schema)
|
|
val trainDataSet: Dataset[Row] = spark.createDataFrame(trainData, schema)
|
|
val vectorAssembler = new VectorAssembler().setInputCols(features).setOutputCol("features")
|
|
val vectorAssembler = new VectorAssembler().setInputCols(features).setOutputCol("features")
|
|
- val xgbInput = vectorAssembler.transform(trainDataSet).select("features", "label").persist()
|
|
|
|
|
|
+ val xgbInput = vectorAssembler.transform(trainDataSet).select("features", "label")
|
|
// val xgbParam = Map("eta" -> 0.01f,
|
|
// val xgbParam = Map("eta" -> 0.01f,
|
|
// "max_depth" -> 5,
|
|
// "max_depth" -> 5,
|
|
// "objective" -> "binary:logistic",
|
|
// "objective" -> "binary:logistic",
|