|
@@ -32,6 +32,7 @@ object makedata_i2i_02_joinFeatureData_20241128 {
|
|
|
val project = param.getOrElse("project", "loghubods")
|
|
|
val repartition = param.getOrElse("repartition", "100").toInt
|
|
|
val filterHours = param.getOrElse("filterHours", "25").split(",").toSet
|
|
|
+ val ifDebug = param.getOrElse("ifDebug", "false").toBoolean
|
|
|
// 2 读取odps+表信息
|
|
|
val odpsOps = env.getODPS(sc)
|
|
|
// 3 循环执行数据生产
|
|
@@ -133,11 +134,16 @@ object makedata_i2i_02_joinFeatureData_20241128 {
|
|
|
val feature_left_cate2 = category1.getOrElse(cate2_left, "{}")
|
|
|
val feature_right_cate1 = category2.getOrElse(cate1_right, "{}")
|
|
|
val feature_right_cate2 = category2.getOrElse(cate2_right, "{}")
|
|
|
- (logKey, label, vid_left, vid_right, feature_left, feature_right, feature_left_action, feature_right_action,
|
|
|
+ result.add(
|
|
|
+ (logKey, label, vid_left, vid_right, feature_left, feature_right, feature_left_action, feature_right_action,
|
|
|
feature_left_cate1, feature_right_cate1, feature_left_cate2, feature_right_cate2)
|
|
|
+ )
|
|
|
}
|
|
|
result.iterator
|
|
|
})
|
|
|
+ if (ifDebug){
|
|
|
+ println("数据量:" + sampleData1.count())
|
|
|
+ }
|
|
|
val hdfsPath = savePath + "/" + savePartition
|
|
|
if (hdfsPath.nonEmpty && hdfsPath.startsWith("/dw/recommend/model/")) {
|
|
|
println("删除路径并开始数据写入:" + hdfsPath)
|