浏览代码

增加用户-广告交叉特征

xueyiming 2 周之前
父节点
当前提交
d5cce413fe
共有 1 个文件被更改,包括 6 次插入和 4 次删除
  1. 6 4
      widedeep_v12_9.py

+ 6 - 4
widedeep_v12_9.py

@@ -7,7 +7,9 @@
 # Distributed under terms of the MIT license.
 # Distributed under terms of the MIT license.
 
 
 """
 """
-删除容易导致偏差的viewall特征
+1.删除容易导致偏差的viewall特征
+2.删除分桶不均匀的cpa特征
+3.减少dense特征
 """
 """
 
 
 
 
@@ -25,10 +27,10 @@ def read_features(filename, excludes=None):
                 features.remove(x)
                 features.remove(x)
     return features
     return features
 
 
-exclude_features = ['viewall',]
+exclude_features = ['viewall', 'cpa']
 
 
-dense_features = read_features("features_top300.config", exclude_features)
-top_dense_features = read_features('features_top100.config', exclude_features)
+dense_features = read_features("features_top300.config", exclude_features)[:150]
+top_dense_features = read_features('features_top50.config', exclude_features)
 
 
 sparse_features = [
 sparse_features = [
     "cid", "adid", "adverid",
     "cid", "adid", "adverid",