Browse Source

增加用户-广告交叉特征

xueyiming 2 weeks ago
parent
commit
d5cce413fe
1 changed file with 6 additions and 4 deletions
  1. widedeep_v12_9.py (+6 -4)

+ 6 - 4
widedeep_v12_9.py

@@ -7,7 +7,9 @@
 # Distributed under terms of the MIT license.
 
 """
-删除容易导致偏差的viewall特征
+1.删除容易导致偏差的viewall特征
+2.删除分桶不均匀的cpa特征
+3.减少dense特征
 """
 
 
@@ -25,10 +27,10 @@ def read_features(filename, excludes=None):
                 features.remove(x)
     return features
 
-exclude_features = ['viewall',]
+exclude_features = ['viewall', 'cpa']
 
-dense_features = read_features("features_top300.config", exclude_features)
-top_dense_features = read_features('features_top100.config', exclude_features)
+dense_features = read_features("features_top300.config", exclude_features)[:150]
+top_dense_features = read_features('features_top50.config', exclude_features)
 
 sparse_features = [
     "cid", "adid", "adverid",