فهرست منبع

Update makedata_ad_33_bucketDataFromOriginToHive_20250228: Remove useless feature ctitle_vtitle_similarity

StrayWarrior 6 روز پیش
والد
کامیت
9459bc2e9c

+ 0 - 3
src/main/scala/com/aliyun/odps/spark/examples/makedata_ad/v20240718/makedata_ad_33_bucketDataFromOriginToHive_20250228.scala

@@ -484,8 +484,6 @@ object makedata_ad_33_bucketDataFromOriginToHive_20250228 {
 
               if (d3.nonEmpty) {
                 val vTitle = d3.getString("title")
-                val score = Similarity.conceptSimilarity(title, vTitle)
-                featureMap.put("ctitle_vtitle_similarity", score);
                 featureMap.put("cate1", d3.getOrDefault("merge_first_level_cate", ""))
                 featureMap.put("cate2", d3.getOrDefault("merge_second_level_cate", ""))
                 featureMap.put("title_split", d3.getOrDefault("title_split", ""))
@@ -528,7 +526,6 @@ object makedata_ad_33_bucketDataFromOriginToHive_20250228 {
                 用户对这个cid的ctr ctcvr cvr
 
             视频
-              title与cid的 sim-score-1/-2 无数据
               vid//cid下的 3h 6h 12h 1d 3d 7d 、 ctr ctcvr cvr ecpm conver --> 30个
               vid//cid下的 1d 3d 7d 14d、 ctr ctcvr ecpm 的rank值 倒数 --> 12个