# ad_xgboost_predict.py

  1. import os
  2. import pandas as pd
  3. import xgboost as xgb
  4. from xgboost.sklearn import XGBClassifier
  5. # 1. 模型加载
  6. model = XGBClassifier()
  7. booster = xgb.Booster()
  8. booster.load_model('./data/ad_xgb.model')
  9. model._Booster = booster
  10. # 2. 预测:ad_status = 0, 不出广告
  11. df_0 = pd.read_csv('./data/predict_data/predict_data_0.csv')
  12. columns_0 = df_0.columns.values.tolist()
  13. y_pred_proba_0 = model.predict_proba(df_0[columns_0[2:]])
  14. df_0['y_0'] = y_pred_proba_0
  15. # 3. 预测:ad_status = 1, 不出广告
  16. df_1 = pd.read_csv('./data/predict_data/predict_data_1.csv')
  17. columns_1 = df_1.columns.values.tolist()
  18. y_pred_proba_1 = model.predict_proba(df_1[columns_1[2:]])
  19. df_0['y_1'] = y_pred_proba_1
  20. # 4. merge 结果
  21. res_df = pd.merge(df_0, df_1, how='left', on=['apptype', 'mid', 'videoid'])
  22. print(res_df.head())
  23. res_df['res_predict'] = res_df['y_0'] - res_df['y_1']