jch 2 днів тому
батько
коміт
ad06245851

+ 2 - 1
src/main/scala/com/aliyun/odps/spark/examples/makedata_recsys_r_rate/makedata_recsys_83_originData_20250317.scala

@@ -154,9 +154,10 @@ object makedata_recsys_83_originData_20250317 {
       val odpsData = DataUtils.getODPSData(sc, project, table, partition, tablePart)
 
       // 2.5 样本重采样
+      val filterColumns = Set("allfeaturemap", "metafeaturemap")
       val resampleData = DataUtils.resampleWithoutInterception(whatLabel, fuSampleRate, odpsData)
         .map(record => {
-          ConvertUtils.record2Map(record)
+          ConvertUtils.record2Map(record, filterColumns)
         })
 
       // 2.6 join video stat

+ 4 - 1
src/main/scala/com/aliyun/odps/spark/examples/myUtils/ConvertUtils.java

@@ -68,13 +68,16 @@ public class ConvertUtils {
         return colMap;
     }
 
-    public static Map<String, String> record2Map(Record record) {
+    public static Map<String, String> record2Map(Record record, Set<String> filterColumns) {
         Map<String, String> map = new HashMap<>();
         if (null != record) {
             Column[] columns = record.getColumns();
             if (null != columns) {
                 for (Column column : columns) {
                     String name = column.getName();
+                    if (filterColumns.contains(name)) {
+                        continue;
+                    }
                     if (!record.isNull(name)) {
                         map.put(name, record.getString(name));
                     }