|
@@ -152,7 +152,7 @@ object makedata_recsys_83_originData_20250317 {
|
|
})
|
|
})
|
|
|
|
|
|
// 2.4 加载样本数据
|
|
// 2.4 加载样本数据
|
|
- val pageSet = Set("详情后沉浸页", "回流后沉浸页&内页feed", "首页feed")
|
|
|
|
|
|
+ val pageSet = Set("详情后沉浸页", "回流后沉浸页&内页feed", "首页feed", "详情页")
|
|
val odpsData = DataUtils.getODPSData(sc, project, table, partition, tablePart)
|
|
val odpsData = DataUtils.getODPSData(sc, project, table, partition, tablePart)
|
|
.filter(record => {
|
|
.filter(record => {
|
|
val page = getStringValue(record, "page")
|
|
val page = getStringValue(record, "page")
|
|
@@ -161,9 +161,15 @@ object makedata_recsys_83_originData_20250317 {
|
|
|
|
|
|
// 2.5 样本重采样
|
|
// 2.5 样本重采样
|
|
val filterColumns = Set("allfeaturemap", "metafeaturemap")
|
|
val filterColumns = Set("allfeaturemap", "metafeaturemap")
|
|
|
|
+ val onlineKeys = Set("head_video")
|
|
val resampleData = DataUtils.resampleWithoutInterception(whatLabel, fuSampleRate, odpsData)
|
|
val resampleData = DataUtils.resampleWithoutInterception(whatLabel, fuSampleRate, odpsData)
|
|
.map(record => {
|
|
.map(record => {
|
|
- ConvertUtils.record2Map(record, filterColumns)
|
|
|
|
|
|
+ val map = ConvertUtils.record2Map(record, filterColumns, onlineKeys)
|
|
|
|
+ val page = map.getOrElse("page", "")
|
|
|
|
+ if (page.equals("详情页") && map.containsKey("head_video")) {
|
|
|
|
+ map.put("v2_feature", map.get("head_video"))
|
|
|
|
+ }
|
|
|
|
+ map
|
|
})
|
|
})
|
|
|
|
|
|
// 2.6 join video stat
|
|
// 2.6 join video stat
|