|
@@ -46,10 +46,10 @@ object makedata_recsys_61_bucket_20241209 {
|
|
|
val bucketNum = param.getOrElse("bucketNum", "200").toInt
|
|
|
|
|
|
val data = sc.textFile(readPath)
|
|
|
- println("问题数据数量:" + data.filter(r => r.split("\t").length != 3).count())
|
|
|
+ println("问题数据数量:" + data.filter(r => r.split("\t").length < 3).count())
|
|
|
val data1 = data.map(r => {
|
|
|
val rList = r.split("\t")
|
|
|
- val jsons = JSON.parseObject(rList(2))
|
|
|
+ val jsons = JSON.parseObject(rList(rList.length - 1))
|
|
|
val doubles = scala.collection.mutable.Map[String, Double]()
|
|
|
jsons.foreach(r => {
|
|
|
doubles.put(r._1, jsons.getDoubleValue(r._1))
|