test_4.sql 47 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632
  1. -- =====================================================================
  2. -- 曝光回流链路 CUBE 聚合表 (基于 wide 宽表, 增加用户/品类维度 + 模型预估指标)
  3. -- 维度: user_type × hh_bucket × head_merge_leve2 × vid_merge_leve2 × vid_id (CUBE)
  4. -- 参考: de.sql + dwd_recsys_alg_exposure_agg_20260209
  5. -- =====================================================================
  6. -- -- DROP TABLE IF EXISTS loghubods.dwd_recsys_alg_exposure_agg_wide_20260209;
  7. -- CREATE TABLE IF NOT EXISTS loghubods.dwd_recsys_alg_exposure_agg_wide_20260209 (
  8. -- -- ==================== 维度列 ====================
  9. -- dt STRING COMMENT '日期'
  10. -- ,user_type STRING COMMENT '用户拉活量分层(R0&新用户/R1-50/R_180_330等,汇总为SUM)'
  11. -- ,hh_bucket STRING COMMENT '小时段(00-03/04-07/.../20-23,汇总为SUM)'
  12. -- ,head_merge_leve2 STRING COMMENT '进入内容品类(headvideoid品类,汇总为SUM)'
  13. -- ,vid_merge_leve2 STRING COMMENT '推荐内容品类(vid品类,TOP10曝光+其他,汇总为SUM)'
  14. -- ,vid_id STRING COMMENT '内容id(品类曝光TOP1+其他,汇总为SUM)'
  15. -- -- ==================== 基础流量 ====================
  16. -- ,exposure_cnt BIGINT COMMENT '曝光次数'
  17. -- ,exposure_uv BIGINT COMMENT '曝光人数(mid去重)'
  18. -- ,vid_cnt BIGINT COMMENT '视频个数(vid去重)'
  19. -- ,exposure_per_user DOUBLE COMMENT '人均曝光次数 = 曝光次数/曝光人数'
  20. -- -- ==================== 分享 & 回流漏斗 ====================
  21. -- ,share_exposure_cnt BIGINT COMMENT '产生分享的曝光数'
  22. -- ,share_cnt BIGINT COMMENT '分享总次数'
  23. -- ,return_exposure_cnt BIGINT COMMENT '产生回流的曝光数(含自身) = SUM(is_return_n)'
  24. -- ,return_exposure_cnt_noself BIGINT COMMENT '产生回流的曝光数(非自身) = SUM(is_return_noself)'
  25. -- ,return_uv BIGINT COMMENT '回流人数(含自身) = SUM(return_n_uv)'
  26. -- ,return_uv_noself BIGINT COMMENT '回流人数(非自身) = SUM(return_n_uv_noself)'
  27. -- ,share_rate DOUBLE COMMENT '分享率 = share_exposure_cnt/exposure_cnt'
  28. -- ,return_rate DOUBLE COMMENT '回流率(含自身) = return_exposure_cnt/exposure_cnt'
  29. -- ,return_rate_noself DOUBLE COMMENT '回流率(非自身) = return_exposure_cnt_noself/exposure_cnt'
  30. -- ,share_return_rate DOUBLE COMMENT '分享→回流转化率(非自身) = return_exposure_cnt_noself/share_exposure_cnt'
  31. -- -- ==================== 模型预估: STR (曝光→非自身回流概率) ====================
  32. -- ,str_real DOUBLE COMMENT '= return_rate_noself, 模型label'
  33. -- ,str_pred DOUBLE COMMENT 'STR预估 = SUM(str_pred)/exposure_cnt'
  34. -- ,str_copc DOUBLE COMMENT 'STR copc = str_real/str_pred'
  35. -- ,str_mae DOUBLE COMMENT 'STR MAE = AVG(|str_pred - str_real|)'
  36. -- ,str_var DOUBLE COMMENT 'STR VAR = VARIANCE(str_pred - str_real)'
  37. -- -- ==================== 模型预估: ROSN (条件回流UV, 非自身) ====================
  38. -- ,rosn_real DOUBLE COMMENT '= return_uv_noself/return_exposure_cnt_noself, 模型label'
  39. -- ,rosn_pred DOUBLE COMMENT 'ROSN预估 = SUM(rosn_pred WHERE is_return_noself=1)/SUM(is_return_noself)'
  40. -- ,rosn_copc DOUBLE COMMENT 'ROSN copc = rosn_real/rosn_pred'
  41. -- ,rosn_pred_origin DOUBLE COMMENT 'ROSN原始预估均值 = AVG(rosn_pred_origin)'
  42. -- ,rosn_mae DOUBLE COMMENT 'ROSN MAE = AVG(|rosn_pred - rosn_real|) WHERE is_return_noself=1'
  43. -- ,rosn_var DOUBLE COMMENT 'ROSN VAR = VARIANCE(rosn_pred - rosn_real) WHERE is_return_noself=1'
  44. -- -- ==================== 模型预估: ROVN (STR×ROSN) ====================
  45. -- ,rovn_real DOUBLE COMMENT '= return_uv_noself/exposure_cnt, 模型label'
  46. -- ,rovn_pred DOUBLE COMMENT 'rovn预估 = AVG(str_pred*rosn_pred)'
  47. -- ,rovn_copc DOUBLE COMMENT 'rovn copc = rovn_real/rovn_pred'
  48. -- ,rovn_mae DOUBLE COMMENT 'rovn MAE = AVG(|rovn_pred - rovn_real|)'
  49. -- ,rovn_var DOUBLE COMMENT 'rovn VAR = VARIANCE(rovn_pred - rovn_real)'
  50. -- ,sortscore_avg DOUBLE COMMENT 'sortscore均值'
  51. -- -- ==================== B链 (分享→点击) ====================
  52. -- ,bn_uv BIGINT COMMENT 'B链全量: 回流去重人数'
  53. -- ,bn_pv BIGINT COMMENT 'B链全量: 回流点击次数'
  54. -- ,bn_exp BIGINT COMMENT 'B链全量: 回流session曝光数'
  55. -- ,bn_ror DOUBLE COMMENT 'bn_uv/exposure_uv'
  56. -- ,bn_rov DOUBLE COMMENT 'bn_uv/exposure_cnt'
  57. -- ,b1_uv BIGINT COMMENT 'B链depth=1: 回流去重人数'
  58. -- ,b1_pv BIGINT COMMENT 'B链depth=1: 回流点击次数'
  59. -- ,b1_exp BIGINT COMMENT 'B链depth=1: 回流session曝光数'
  60. -- ,b1_ror DOUBLE COMMENT 'b1_uv/exposure_uv'
  61. -- ,b1_rov DOUBLE COMMENT 'b1_uv/exposure_cnt'
  62. -- ,b2_uv BIGINT COMMENT 'B链depth=2: 回流去重人数'
  63. -- ,b2_pv BIGINT COMMENT 'B链depth=2: 回流点击次数'
  64. -- ,b2_exp BIGINT COMMENT 'B链depth=2: 回流session曝光数'
  65. -- ,b2_ror DOUBLE COMMENT 'b2_uv/b1_uv'
  66. -- ,b2_rov DOUBLE COMMENT 'b2_uv/b1_exp'
  67. -- ,b3_uv BIGINT COMMENT 'B链depth=3: 回流去重人数'
  68. -- ,b3_pv BIGINT COMMENT 'B链depth=3: 回流点击次数'
  69. -- ,b3_exp BIGINT COMMENT 'B链depth=3: 回流session曝光数'
  70. -- ,b3_ror DOUBLE COMMENT 'b3_uv/b2_uv'
  71. -- ,b3_rov DOUBLE COMMENT 'b3_uv/b2_exp'
  72. -- -- ==================== C链 (全量depth, 按hop) ====================
  73. -- ,cn_1_uv BIGINT COMMENT 'C链hop1: 回流去重人数'
  74. -- ,cn_1_pv BIGINT COMMENT 'C链hop1: 回流点击次数'
  75. -- ,cn_1_exp BIGINT COMMENT 'C链hop1: 回流session曝光数'
  76. -- ,cn_1_ror DOUBLE COMMENT 'cn_1_uv/bn_uv'
  77. -- ,cn_1_rov DOUBLE COMMENT 'cn_1_uv/bn_exp'
  78. -- ,cn_2_uv BIGINT COMMENT 'C链hop2: 回流去重人数'
  79. -- ,cn_2_pv BIGINT COMMENT 'C链hop2: 回流点击次数'
  80. -- ,cn_2_exp BIGINT COMMENT 'C链hop2: 回流session曝光数'
  81. -- ,cn_2_ror DOUBLE COMMENT 'cn_2_uv/cn_1_uv'
  82. -- ,cn_2_rov DOUBLE COMMENT 'cn_2_uv/cn_1_exp'
  83. -- ,cn_3_uv BIGINT COMMENT 'C链hop3: 回流去重人数'
  84. -- ,cn_3_pv BIGINT COMMENT 'C链hop3: 回流点击次数'
  85. -- ,cn_3_exp BIGINT COMMENT 'C链hop3: 回流session曝光数'
  86. -- ,cn_3_ror DOUBLE COMMENT 'cn_3_uv/cn_2_uv'
  87. -- ,cn_3_rov DOUBLE COMMENT 'cn_3_uv/cn_2_exp'
  88. -- ,cn_total_uv BIGINT COMMENT 'C链合计UV'
  89. -- ,cn_total_ror DOUBLE COMMENT 'cn_total_uv/bn_uv'
  90. -- ,cn_total_rov DOUBLE COMMENT 'cn_total_uv/bn_exp'
  91. -- -- C链 depth拆分 hop1
  92. -- ,c1_1_uv BIGINT COMMENT 'C链d1-hop1: 回流去重人数'
  93. -- ,c1_1_pv BIGINT COMMENT 'C链d1-hop1: 回流点击次数'
  94. -- ,c1_1_exp BIGINT COMMENT 'C链d1-hop1: 回流session曝光数'
  95. -- ,c1_1_ror DOUBLE COMMENT 'c1_1_uv/bn_uv'
  96. -- ,c1_1_rov DOUBLE COMMENT 'c1_1_uv/bn_exp'
  97. -- ,c2_1_uv BIGINT COMMENT 'C链d2-hop1: 回流去重人数'
  98. -- ,c2_1_pv BIGINT COMMENT 'C链d2-hop1: 回流点击次数'
  99. -- ,c2_1_exp BIGINT COMMENT 'C链d2-hop1: 回流session曝光数'
  100. -- ,c2_1_ror DOUBLE COMMENT 'c2_1_uv/c1_1_uv'
  101. -- ,c2_1_rov DOUBLE COMMENT 'c2_1_uv/c1_1_exp'
  102. -- ,c3_1_uv BIGINT COMMENT 'C链d3-hop1: 回流去重人数'
  103. -- ,c3_1_pv BIGINT COMMENT 'C链d3-hop1: 回流点击次数'
  104. -- ,c3_1_exp BIGINT COMMENT 'C链d3-hop1: 回流session曝光数'
  105. -- ,c3_1_ror DOUBLE COMMENT 'c3_1_uv/c2_1_uv'
  106. -- ,c3_1_rov DOUBLE COMMENT 'c3_1_uv/c2_1_exp'
  107. -- -- C链 depth拆分 hop2
  108. -- ,c1_2_uv BIGINT COMMENT 'C链d1-hop2: 回流去重人数'
  109. -- ,c1_2_pv BIGINT COMMENT 'C链d1-hop2: 回流点击次数'
  110. -- ,c1_2_exp BIGINT COMMENT 'C链d1-hop2: 回流session曝光数'
  111. -- ,c1_2_ror DOUBLE COMMENT 'c1_2_uv/cn_1_uv'
  112. -- ,c1_2_rov DOUBLE COMMENT 'c1_2_uv/cn_1_exp'
  113. -- ,c2_2_uv BIGINT COMMENT 'C链d2-hop2: 回流去重人数'
  114. -- ,c2_2_pv BIGINT COMMENT 'C链d2-hop2: 回流点击次数'
  115. -- ,c2_2_exp BIGINT COMMENT 'C链d2-hop2: 回流session曝光数'
  116. -- ,c2_2_ror DOUBLE COMMENT 'c2_2_uv/c1_2_uv'
  117. -- ,c2_2_rov DOUBLE COMMENT 'c2_2_uv/c1_2_exp'
  118. -- ,c3_2_uv BIGINT COMMENT 'C链d3-hop2: 回流去重人数'
  119. -- ,c3_2_pv BIGINT COMMENT 'C链d3-hop2: 回流点击次数'
  120. -- ,c3_2_exp BIGINT COMMENT 'C链d3-hop2: 回流session曝光数'
  121. -- ,c3_2_ror DOUBLE COMMENT 'c3_2_uv/c2_2_uv'
  122. -- ,c3_2_rov DOUBLE COMMENT 'c3_2_uv/c2_2_exp'
  123. -- -- C链 depth拆分 hop3
  124. -- ,c1_3_uv BIGINT COMMENT 'C链d1-hop3: 回流去重人数'
  125. -- ,c1_3_pv BIGINT COMMENT 'C链d1-hop3: 回流点击次数'
  126. -- ,c1_3_exp BIGINT COMMENT 'C链d1-hop3: 回流session曝光数'
  127. -- ,c1_3_ror DOUBLE COMMENT 'c1_3_uv/cn_2_uv'
  128. -- ,c1_3_rov DOUBLE COMMENT 'c1_3_uv/cn_2_exp'
  129. -- ,c2_3_uv BIGINT COMMENT 'C链d2-hop3: 回流去重人数'
  130. -- ,c2_3_pv BIGINT COMMENT 'C链d2-hop3: 回流点击次数'
  131. -- ,c2_3_exp BIGINT COMMENT 'C链d2-hop3: 回流session曝光数'
  132. -- ,c2_3_ror DOUBLE COMMENT 'c2_3_uv/c1_3_uv'
  133. -- ,c2_3_rov DOUBLE COMMENT 'c2_3_uv/c1_3_exp'
  134. -- ,c3_3_uv BIGINT COMMENT 'C链d3-hop3: 回流去重人数'
  135. -- ,c3_3_pv BIGINT COMMENT 'C链d3-hop3: 回流点击次数'
  136. -- ,c3_3_exp BIGINT COMMENT 'C链d3-hop3: 回流session曝光数'
  137. -- ,c3_3_ror DOUBLE COMMENT 'c3_3_uv/c2_3_uv'
  138. -- ,c3_3_rov DOUBLE COMMENT 'c3_3_uv/c2_3_exp'
  139. -- -- ==================== D链 (session内后续曝光传播) ====================
  140. -- ,d0 BIGINT COMMENT 'D链初始成本: session内后续曝光数'
  141. -- ,dn_1_uv BIGINT COMMENT 'D链hop1: 回流去重人数'
  142. -- ,dn_1_pv BIGINT COMMENT 'D链hop1: 回流点击次数'
  143. -- ,dn_1_exp BIGINT COMMENT 'D链hop1: 回流session曝光数'
  144. -- ,dn_1_ror DOUBLE COMMENT 'dn_1_uv/exposure_uv'
  145. -- ,dn_1_rov DOUBLE COMMENT 'dn_1_uv/d0'
  146. -- ,dn_2_uv BIGINT COMMENT 'D链hop2: 回流去重人数'
  147. -- ,dn_2_pv BIGINT COMMENT 'D链hop2: 回流点击次数'
  148. -- ,dn_2_exp BIGINT COMMENT 'D链hop2: 回流session曝光数'
  149. -- ,dn_2_ror DOUBLE COMMENT 'dn_2_uv/dn_1_uv'
  150. -- ,dn_2_rov DOUBLE COMMENT 'dn_2_uv/dn_1_exp'
  151. -- ,dn_3_uv BIGINT COMMENT 'D链hop3: 回流去重人数'
  152. -- ,dn_3_pv BIGINT COMMENT 'D链hop3: 回流点击次数'
  153. -- ,dn_3_exp BIGINT COMMENT 'D链hop3: 回流session曝光数'
  154. -- ,dn_3_ror DOUBLE COMMENT 'dn_3_uv/dn_2_uv'
  155. -- ,dn_3_rov DOUBLE COMMENT 'dn_3_uv/dn_2_exp'
  156. -- ,dn_total_uv BIGINT COMMENT 'D链合计UV'
  157. -- ,dn_total_ror DOUBLE COMMENT 'dn_total_uv/exposure_uv'
  158. -- ,dn_total_rov DOUBLE COMMENT 'dn_total_uv/d0'
  159. -- -- D链 depth拆分 hop1
  160. -- ,d1_1_uv BIGINT COMMENT 'D链d1-hop1: 回流去重人数'
  161. -- ,d1_1_pv BIGINT COMMENT 'D链d1-hop1: 回流点击次数'
  162. -- ,d1_1_exp BIGINT COMMENT 'D链d1-hop1: 回流session曝光数'
  163. -- ,d1_1_ror DOUBLE COMMENT 'd1_1_uv/exposure_uv'
  164. -- ,d1_1_rov DOUBLE COMMENT 'd1_1_uv/d0'
  165. -- ,d2_1_uv BIGINT COMMENT 'D链d2-hop1: 回流去重人数'
  166. -- ,d2_1_pv BIGINT COMMENT 'D链d2-hop1: 回流点击次数'
  167. -- ,d2_1_exp BIGINT COMMENT 'D链d2-hop1: 回流session曝光数'
  168. -- ,d2_1_ror DOUBLE COMMENT 'd2_1_uv/d1_1_uv'
  169. -- ,d2_1_rov DOUBLE COMMENT 'd2_1_uv/d1_1_exp'
  170. -- ,d3_1_uv BIGINT COMMENT 'D链d3-hop1: 回流去重人数'
  171. -- ,d3_1_pv BIGINT COMMENT 'D链d3-hop1: 回流点击次数'
  172. -- ,d3_1_exp BIGINT COMMENT 'D链d3-hop1: 回流session曝光数'
  173. -- ,d3_1_ror DOUBLE COMMENT 'd3_1_uv/d2_1_uv'
  174. -- ,d3_1_rov DOUBLE COMMENT 'd3_1_uv/d2_1_exp'
  175. -- -- D链 depth拆分 hop2
  176. -- ,d1_2_uv BIGINT COMMENT 'D链d1-hop2: 回流去重人数'
  177. -- ,d1_2_pv BIGINT COMMENT 'D链d1-hop2: 回流点击次数'
  178. -- ,d1_2_exp BIGINT COMMENT 'D链d1-hop2: 回流session曝光数'
  179. -- ,d1_2_ror DOUBLE COMMENT 'd1_2_uv/dn_1_uv'
  180. -- ,d1_2_rov DOUBLE COMMENT 'd1_2_uv/dn_1_exp'
  181. -- ,d2_2_uv BIGINT COMMENT 'D链d2-hop2: 回流去重人数'
  182. -- ,d2_2_pv BIGINT COMMENT 'D链d2-hop2: 回流点击次数'
  183. -- ,d2_2_exp BIGINT COMMENT 'D链d2-hop2: 回流session曝光数'
  184. -- ,d2_2_ror DOUBLE COMMENT 'd2_2_uv/d1_2_uv'
  185. -- ,d2_2_rov DOUBLE COMMENT 'd2_2_uv/d1_2_exp'
  186. -- ,d3_2_uv BIGINT COMMENT 'D链d3-hop2: 回流去重人数'
  187. -- ,d3_2_pv BIGINT COMMENT 'D链d3-hop2: 回流点击次数'
  188. -- ,d3_2_exp BIGINT COMMENT 'D链d3-hop2: 回流session曝光数'
  189. -- ,d3_2_ror DOUBLE COMMENT 'd3_2_uv/d2_2_uv'
  190. -- ,d3_2_rov DOUBLE COMMENT 'd3_2_uv/d2_2_exp'
  191. -- -- D链 depth拆分 hop3
  192. -- ,d1_3_uv BIGINT COMMENT 'D链d1-hop3: 回流去重人数'
  193. -- ,d1_3_pv BIGINT COMMENT 'D链d1-hop3: 回流点击次数'
  194. -- ,d1_3_exp BIGINT COMMENT 'D链d1-hop3: 回流session曝光数'
  195. -- ,d1_3_ror DOUBLE COMMENT 'd1_3_uv/dn_2_uv'
  196. -- ,d1_3_rov DOUBLE COMMENT 'd1_3_uv/dn_2_exp'
  197. -- ,d2_3_uv BIGINT COMMENT 'D链d2-hop3: 回流去重人数'
  198. -- ,d2_3_pv BIGINT COMMENT 'D链d2-hop3: 回流点击次数'
  199. -- ,d2_3_exp BIGINT COMMENT 'D链d2-hop3: 回流session曝光数'
  200. -- ,d2_3_ror DOUBLE COMMENT 'd2_3_uv/d1_3_uv'
  201. -- ,d2_3_rov DOUBLE COMMENT 'd2_3_uv/d1_3_exp'
  202. -- ,d3_3_uv BIGINT COMMENT 'D链d3-hop3: 回流去重人数'
  203. -- ,d3_3_pv BIGINT COMMENT 'D链d3-hop3: 回流点击次数'
  204. -- ,d3_3_exp BIGINT COMMENT 'D链d3-hop3: 回流session曝光数'
  205. -- ,d3_3_ror DOUBLE COMMENT 'd3_3_uv/d2_3_uv'
  206. -- ,d3_3_rov DOUBLE COMMENT 'd3_3_uv/d2_3_exp'
  207. -- -- ==================== 全链路 ====================
  208. -- ,all_return_n_uv BIGINT COMMENT '全链路拉回UV = B + C + D'
  209. -- ,all_rovn DOUBLE COMMENT 'all_return_n_uv/exposure_cnt'
  210. -- ,all_ror DOUBLE COMMENT 'all_return_n_uv/exposure_uv'
  211. -- ,all_rov DOUBLE COMMENT 'all_return_n_uv/exposure_cnt'
  212. -- )
  213. -- COMMENT '曝光回流链路CUBE聚合-宽表版 (5维度: 用户分层/小时段/进入品类TOP1/推荐品类TOP10/内容idTOP1)'
  214. -- ;
  215. -- -- =====================================================================
  216. -- -- INSERT: 从 wide 宽表聚合, CUBE 全维度组合
  217. -- -- =====================================================================
  218. -- -- SELECT * FROM loghubods.dwd_recsys_alg_exposure_agg_wide_20260209 WHERE dt = '${dt}' ORDER BY exposure_cnt DESC LIMIT 100;
  219. -- INSERT OVERWRITE TABLE loghubods.dwd_recsys_alg_exposure_agg_wide_20260209
  220. WITH
  221. -- 用户拉活量分层
  222. t_user_type AS (
  223. SELECT DISTINCT type, openid
  224. FROM loghubods.mid_share_return_people_1year
  225. WHERE dt = TO_CHAR(DATEADD(TO_DATE('${dt}','YYYYMMDD'),-1,'dd'),'YYYYMMDD')
  226. AND type IS NOT NULL
  227. AND type != 'S_ALL'
  228. AND type NOT REGEXP 'R50'
  229. )
  230. -- 模型预估分数
  231. ,t_score AS (
  232. SELECT apptype
  233. ,videoid
  234. ,recommendtraceid
  235. ,scoresmap
  236. ,sortscore
  237. FROM (
  238. SELECT apptype
  239. ,videoid
  240. ,recommendtraceid
  241. ,scoresmap
  242. ,sortscore
  243. ,ROW_NUMBER() OVER (PARTITION BY apptype,videoid,recommendtraceid) AS rn
  244. FROM loghubods.statistics_log_hour
  245. WHERE dt LIKE '${dt}%'
  246. AND scoresmap IS NOT NULL
  247. )
  248. WHERE rn = 1
  249. )
  250. -- TOP1 进入内容品类(场): 按回流人数取 TOP1
  251. ,t_top_head_cate AS (
  252. SELECT vt.merge_leve2
  253. FROM loghubods.dwd_recsys_alg_exposure_base_20260209 base
  254. JOIN loghubods.video_merge_tag vt ON base.headvideoid = vt.videoid
  255. WHERE base.dt = '${dt}'
  256. AND vt.merge_leve2 IS NOT NULL
  257. GROUP BY vt.merge_leve2
  258. ORDER BY SUM(CAST(is_return_noself AS BIGINT)) DESC
  259. LIMIT 1
  260. )
  261. -- TOP10 推荐内容品类(货): 按曝光次数取 TOP10
  262. ,t_top_vid_cate AS (
  263. SELECT vt.merge_leve2
  264. FROM loghubods.dwd_recsys_alg_exposure_base_20260209 base
  265. JOIN loghubods.video_merge_tag vt ON base.vid = vt.videoid
  266. WHERE base.dt = '${dt}'
  267. AND vt.merge_leve2 IS NOT NULL
  268. GROUP BY vt.merge_leve2
  269. ORDER BY COUNT(1) DESC
  270. LIMIT 10
  271. )
  272. -- TOP1 内容id(货): 每品类按曝光次数取 TOP1 (曝光>10w)
  273. ,t_top_vid AS (
  274. SELECT merge_leve2, vid
  275. FROM (
  276. SELECT vt.merge_leve2
  277. ,base.vid
  278. ,COUNT(1) AS exp_cnt
  279. ,ROW_NUMBER() OVER (PARTITION BY vt.merge_leve2 ORDER BY COUNT(1) DESC) AS rk
  280. FROM loghubods.dwd_recsys_alg_exposure_base_20260209 base
  281. JOIN loghubods.video_merge_tag vt ON base.vid = vt.videoid
  282. WHERE base.dt = '${dt}'
  283. AND vt.merge_leve2 IS NOT NULL
  284. GROUP BY vt.merge_leve2, base.vid
  285. HAVING exp_cnt > 100000
  286. )
  287. WHERE rk <= 1
  288. )
  289. -- 宽表
  290. ,t_wide AS (
  291. SELECT base.*
  292. ,CASE WHEN e.type IS NULL OR e.type = 'R_0' THEN 'R0&新用户'
  293. WHEN e.type IN ('R_1','R_2_10','R_10_50') THEN 'R1-50'
  294. WHEN e.type IN ('R_50_100','R_100_180','R_180_330') THEN 'R_180_330'
  295. ELSE e.type
  296. END AS user_type
  297. ,CASE WHEN th.merge_leve2 IS NOT NULL THEN vt_head.merge_leve2 ELSE '其他' END AS head_merge_leve2
  298. ,CASE WHEN tv.merge_leve2 IS NOT NULL THEN vt_vid.merge_leve2 ELSE '其他' END AS vid_merge_leve2
  299. ,CASE WHEN ti.vid IS NOT NULL THEN base.vid ELSE '其他' END AS vid_id
  300. ,CAST(GET_JSON_OBJECT(e1.scoresmap,'$.fmRov') AS DOUBLE) AS str_pred
  301. ,1.22*POW(CAST(GET_JSON_OBJECT(e1.scoresmap,'$.NorXGBScore') AS DOUBLE),1.15) AS rosn_pred
  302. ,CAST(GET_JSON_OBJECT(e1.scoresmap,'$.hasReturnRovScore') AS DOUBLE) AS rosn_pred_origin
  303. ,e1.sortscore
  304. ,CASE
  305. WHEN CAST(hh AS INT) BETWEEN 0 AND 3 THEN '00-03'
  306. WHEN CAST(hh AS INT) BETWEEN 4 AND 7 THEN '04-07'
  307. WHEN CAST(hh AS INT) BETWEEN 8 AND 11 THEN '08-11'
  308. WHEN CAST(hh AS INT) BETWEEN 12 AND 15 THEN '12-15'
  309. WHEN CAST(hh AS INT) BETWEEN 16 AND 19 THEN '16-19'
  310. WHEN CAST(hh AS INT) BETWEEN 20 AND 23 THEN '20-23'
  311. ELSE '-'
  312. END AS hh_bucket
  313. FROM loghubods.dwd_recsys_alg_exposure_base_20260209 base
  314. LEFT JOIN t_user_type e
  315. ON SUBSTRING_INDEX(base.mid,'weixin_openid_',-1) = e.openid
  316. LEFT JOIN loghubods.video_merge_tag vt_head
  317. ON base.headvideoid = vt_head.videoid
  318. LEFT JOIN loghubods.video_merge_tag vt_vid
  319. ON base.vid = vt_vid.videoid
  320. LEFT JOIN t_score e1
  321. ON base.apptype = e1.apptype
  322. AND base.vid = e1.videoid
  323. AND base.recomtraceid = e1.recommendtraceid
  324. LEFT JOIN t_top_head_cate th
  325. ON vt_head.merge_leve2 = th.merge_leve2
  326. LEFT JOIN t_top_vid_cate tv
  327. ON vt_vid.merge_leve2 = tv.merge_leve2
  328. LEFT JOIN t_top_vid ti
  329. ON base.vid = ti.vid
  330. WHERE base.dt = '${dt}'
  331. )
  332. SELECT
  333. -- ==================== 维度列 ====================
  334. '${dt}' AS dt
  335. ,CASE WHEN GROUPING(user_type) = 1 THEN 'SUM' ELSE NVL(user_type, 'SUM') END AS user_type
  336. ,CASE WHEN GROUPING(hh_bucket) = 1 THEN 'SUM' ELSE NVL(hh_bucket, 'SUM') END AS hh_bucket
  337. ,CASE WHEN GROUPING(head_merge_leve2) = 1 THEN 'SUM' ELSE NVL(head_merge_leve2, 'SUM') END AS head_merge_leve2
  338. ,CASE WHEN GROUPING(vid_merge_leve2) = 1 THEN 'SUM' ELSE NVL(vid_merge_leve2, 'SUM') END AS vid_merge_leve2
  339. ,CASE WHEN GROUPING(vid_id) = 1 THEN 'SUM' ELSE NVL(vid_id, 'SUM') END AS vid_id
  340. -- ==================== 基础流量 ====================
  341. ,COUNT(1) AS exposure_cnt
  342. ,COUNT(DISTINCT mid) AS exposure_uv
  343. ,COUNT(DISTINCT vid) AS vid_cnt
  344. ,ROUND(COUNT(1) / COUNT(DISTINCT mid), 4) AS exposure_per_user
  345. -- ==================== 分享 & 回流漏斗 ====================
  346. ,SUM(CAST(is_share AS BIGINT)) AS share_exposure_cnt
  347. ,SUM(CAST(share_cnt AS BIGINT)) AS share_cnt
  348. ,SUM(CAST(is_return_n AS BIGINT)) AS return_exposure_cnt
  349. ,SUM(CAST(is_return_noself AS BIGINT)) AS return_exposure_cnt_noself
  350. ,SUM(CAST(return_n_uv AS BIGINT)) AS return_uv
  351. ,SUM(CAST(return_n_uv_noself AS BIGINT)) AS return_uv_noself
  352. ,ROUND(COALESCE(SUM(CAST(is_share AS BIGINT)) / NULLIF(CAST(COUNT(1) AS DOUBLE), 0), 0), 6) AS share_rate
  353. ,ROUND(COALESCE(SUM(CAST(is_return_n AS BIGINT)) / NULLIF(CAST(COUNT(1) AS DOUBLE), 0), 0), 6) AS return_rate
  354. ,ROUND(COALESCE(SUM(CAST(is_return_noself AS BIGINT)) / NULLIF(CAST(COUNT(1) AS DOUBLE), 0), 0), 6) AS return_rate_noself
  355. ,ROUND(COALESCE(SUM(CAST(is_return_noself AS BIGINT)) / NULLIF(CAST(SUM(CAST(is_share AS BIGINT)) AS DOUBLE), 0), 0), 6) AS share_return_rate
  356. -- ==================== 模型预估: STR (曝光→非自身回流概率) ====================
  357. ,ROUND(COALESCE(SUM(CAST(is_return_noself AS BIGINT)) / NULLIF(COUNT(1), 0), 0), 6) AS str_real
  358. ,ROUND(COALESCE(SUM(str_pred) / NULLIF(COUNT(1), 0), 0), 6) AS str_pred
  359. ,ROUND(
  360. (SUM(CAST(is_return_noself AS BIGINT)) / NULLIF(COUNT(1), 0))
  361. / NULLIF(SUM(str_pred) / NULLIF(COUNT(1), 0), 0)
  362. , 4) AS str_copc
  363. ,ROUND(AVG(ABS(str_pred - CAST(is_return_noself AS BIGINT))), 6) AS str_mae
  364. ,ROUND(VARIANCE(str_pred - CAST(is_return_noself AS BIGINT)), 6) AS str_var
  365. -- ==================== 模型预估: ROSN (条件回流UV, 非自身) ====================
  366. ,ROUND(COALESCE(
  367. SUM(CAST(return_n_uv_noself AS BIGINT)) / NULLIF(SUM(CAST(is_return_noself AS BIGINT)), 0)
  368. , 0), 6) AS rosn_real
  369. ,ROUND(COALESCE(SUM(CASE WHEN CAST(is_return_noself AS BIGINT) = 1 THEN rosn_pred END) / NULLIF(SUM(CAST(is_return_noself AS BIGINT)), 0), 0), 6) AS rosn_pred
  370. ,ROUND(
  371. (SUM(CAST(return_n_uv_noself AS BIGINT)) / NULLIF(SUM(CAST(is_return_noself AS BIGINT)), 0))
  372. / NULLIF(SUM(CASE WHEN CAST(is_return_noself AS BIGINT) = 1 THEN rosn_pred END) / NULLIF(SUM(CAST(is_return_noself AS BIGINT)), 0), 0)
  373. , 4) AS rosn_copc
  374. ,ROUND(AVG(rosn_pred_origin), 6) AS rosn_pred_origin
  375. ,ROUND(AVG(
  376. CASE WHEN CAST(is_return_noself AS BIGINT) = 1
  377. THEN ABS(rosn_pred - CAST(return_n_uv_noself AS BIGINT))
  378. END
  379. ), 6) AS rosn_mae
  380. ,ROUND(VARIANCE(
  381. CASE WHEN CAST(is_return_noself AS BIGINT) = 1
  382. THEN rosn_pred - CAST(return_n_uv_noself AS BIGINT)
  383. END
  384. ), 6) AS rosn_var
  385. -- ==================== 模型预估: ROVN (STR×ROSN) ====================
  386. ,ROUND(COALESCE(SUM(CAST(return_n_uv_noself AS BIGINT)) / NULLIF(COUNT(1), 0), 0), 6) AS rovn_real
  387. ,ROUND(AVG(str_pred * rosn_pred), 6) AS rovn_pred
  388. ,ROUND(
  389. (SUM(CAST(return_n_uv_noself AS BIGINT)) / NULLIF(COUNT(1), 0))
  390. / NULLIF(AVG(str_pred * rosn_pred), 0)
  391. , 4) AS rovn_copc
  392. ,ROUND(AVG(ABS(str_pred * rosn_pred - CAST(return_n_uv_noself AS BIGINT))), 6) AS rovn_mae
  393. ,ROUND(VARIANCE(str_pred * rosn_pred - CAST(return_n_uv_noself AS BIGINT)), 6) AS rovn_var
  394. ,ROUND(AVG(CAST(sortscore AS DOUBLE)), 6) AS sortscore_avg
  395. -- ==================== B链 ====================
  396. ,SUM(CAST(bn_uv AS BIGINT)) AS bn_uv
  397. ,SUM(CAST(bn_pv AS BIGINT)) AS bn_pv
  398. ,SUM(CAST(bn_exp AS BIGINT)) AS bn_exp
  399. ,ROUND(COALESCE(SUM(CAST(bn_uv AS BIGINT)) / NULLIF(CAST(COUNT(DISTINCT mid) AS DOUBLE), 0), 0), 6) AS bn_ror
  400. ,ROUND(COALESCE(SUM(CAST(bn_uv AS BIGINT)) / NULLIF(CAST(COUNT(1) AS DOUBLE), 0), 0), 6) AS bn_rov
  401. ,SUM(CAST(b1_uv AS BIGINT)) AS b1_uv
  402. ,SUM(CAST(b1_pv AS BIGINT)) AS b1_pv
  403. ,SUM(CAST(b1_exp AS BIGINT)) AS b1_exp
  404. ,ROUND(COALESCE(SUM(CAST(b1_uv AS BIGINT)) / NULLIF(CAST(COUNT(DISTINCT mid) AS DOUBLE), 0), 0), 6) AS b1_ror
  405. ,ROUND(COALESCE(SUM(CAST(b1_uv AS BIGINT)) / NULLIF(CAST(COUNT(1) AS DOUBLE), 0), 0), 6) AS b1_rov
  406. ,SUM(CAST(b2_uv AS BIGINT)) AS b2_uv
  407. ,SUM(CAST(b2_pv AS BIGINT)) AS b2_pv
  408. ,SUM(CAST(b2_exp AS BIGINT)) AS b2_exp
  409. ,ROUND(COALESCE(SUM(CAST(b2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(b1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS b2_ror
  410. ,ROUND(COALESCE(SUM(CAST(b2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(b1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS b2_rov
  411. ,SUM(CAST(b3_uv AS BIGINT)) AS b3_uv
  412. ,SUM(CAST(b3_pv AS BIGINT)) AS b3_pv
  413. ,SUM(CAST(b3_exp AS BIGINT)) AS b3_exp
  414. ,ROUND(COALESCE(SUM(CAST(b3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(b2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS b3_ror
  415. ,ROUND(COALESCE(SUM(CAST(b3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(b2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS b3_rov
  416. -- ==================== C链 (全量depth, 按hop) ====================
  417. ,SUM(CAST(cn_1_uv AS BIGINT)) AS cn_1_uv
  418. ,SUM(CAST(cn_1_pv AS BIGINT)) AS cn_1_pv
  419. ,SUM(CAST(cn_1_exp AS BIGINT)) AS cn_1_exp
  420. ,ROUND(COALESCE(SUM(CAST(cn_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(bn_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS cn_1_ror
  421. ,ROUND(COALESCE(SUM(CAST(cn_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(bn_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS cn_1_rov
  422. ,SUM(CAST(cn_2_uv AS BIGINT)) AS cn_2_uv
  423. ,SUM(CAST(cn_2_pv AS BIGINT)) AS cn_2_pv
  424. ,SUM(CAST(cn_2_exp AS BIGINT)) AS cn_2_exp
  425. ,ROUND(COALESCE(SUM(CAST(cn_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(cn_1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS cn_2_ror
  426. ,ROUND(COALESCE(SUM(CAST(cn_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(cn_1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS cn_2_rov
  427. ,SUM(CAST(cn_3_uv AS BIGINT)) AS cn_3_uv
  428. ,SUM(CAST(cn_3_pv AS BIGINT)) AS cn_3_pv
  429. ,SUM(CAST(cn_3_exp AS BIGINT)) AS cn_3_exp
  430. ,ROUND(COALESCE(SUM(CAST(cn_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(cn_2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS cn_3_ror
  431. ,ROUND(COALESCE(SUM(CAST(cn_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(cn_2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS cn_3_rov
  432. ,SUM(CAST(cn_1_uv AS BIGINT)) + SUM(CAST(cn_2_uv AS BIGINT)) + SUM(CAST(cn_3_uv AS BIGINT)) AS cn_total_uv
  433. ,ROUND(COALESCE(
  434. (SUM(CAST(cn_1_uv AS BIGINT)) + SUM(CAST(cn_2_uv AS BIGINT)) + SUM(CAST(cn_3_uv AS BIGINT)))
  435. / NULLIF(CAST(SUM(CAST(bn_uv AS BIGINT)) AS DOUBLE), 0)
  436. , 0), 6) AS cn_total_ror
  437. ,ROUND(COALESCE(
  438. (SUM(CAST(cn_1_uv AS BIGINT)) + SUM(CAST(cn_2_uv AS BIGINT)) + SUM(CAST(cn_3_uv AS BIGINT)))
  439. / NULLIF(CAST(SUM(CAST(bn_exp AS BIGINT)) AS DOUBLE), 0)
  440. , 0), 6) AS cn_total_rov
  441. -- ==================== C链 (按depth拆分) ====================
  442. -- hop1
  443. ,SUM(CAST(c1_1_uv AS BIGINT)) AS c1_1_uv
  444. ,SUM(CAST(c1_1_pv AS BIGINT)) AS c1_1_pv
  445. ,SUM(CAST(c1_1_exp AS BIGINT)) AS c1_1_exp
  446. ,ROUND(COALESCE(SUM(CAST(c1_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(bn_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c1_1_ror
  447. ,ROUND(COALESCE(SUM(CAST(c1_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(bn_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c1_1_rov
  448. ,SUM(CAST(c2_1_uv AS BIGINT)) AS c2_1_uv
  449. ,SUM(CAST(c2_1_pv AS BIGINT)) AS c2_1_pv
  450. ,SUM(CAST(c2_1_exp AS BIGINT)) AS c2_1_exp
  451. ,ROUND(COALESCE(SUM(CAST(c2_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c1_1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c2_1_ror
  452. ,ROUND(COALESCE(SUM(CAST(c2_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c1_1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c2_1_rov
  453. ,SUM(CAST(c3_1_uv AS BIGINT)) AS c3_1_uv
  454. ,SUM(CAST(c3_1_pv AS BIGINT)) AS c3_1_pv
  455. ,SUM(CAST(c3_1_exp AS BIGINT)) AS c3_1_exp
  456. ,ROUND(COALESCE(SUM(CAST(c3_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c2_1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c3_1_ror
  457. ,ROUND(COALESCE(SUM(CAST(c3_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c2_1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c3_1_rov
  458. -- hop2
  459. ,SUM(CAST(c1_2_uv AS BIGINT)) AS c1_2_uv
  460. ,SUM(CAST(c1_2_pv AS BIGINT)) AS c1_2_pv
  461. ,SUM(CAST(c1_2_exp AS BIGINT)) AS c1_2_exp
  462. ,ROUND(COALESCE(SUM(CAST(c1_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(cn_1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c1_2_ror
  463. ,ROUND(COALESCE(SUM(CAST(c1_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(cn_1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c1_2_rov
  464. ,SUM(CAST(c2_2_uv AS BIGINT)) AS c2_2_uv
  465. ,SUM(CAST(c2_2_pv AS BIGINT)) AS c2_2_pv
  466. ,SUM(CAST(c2_2_exp AS BIGINT)) AS c2_2_exp
  467. ,ROUND(COALESCE(SUM(CAST(c2_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c1_2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c2_2_ror
  468. ,ROUND(COALESCE(SUM(CAST(c2_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c1_2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c2_2_rov
  469. ,SUM(CAST(c3_2_uv AS BIGINT)) AS c3_2_uv
  470. ,SUM(CAST(c3_2_pv AS BIGINT)) AS c3_2_pv
  471. ,SUM(CAST(c3_2_exp AS BIGINT)) AS c3_2_exp
  472. ,ROUND(COALESCE(SUM(CAST(c3_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c2_2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c3_2_ror
  473. ,ROUND(COALESCE(SUM(CAST(c3_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c2_2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c3_2_rov
  474. -- hop3
  475. ,SUM(CAST(c1_3_uv AS BIGINT)) AS c1_3_uv
  476. ,SUM(CAST(c1_3_pv AS BIGINT)) AS c1_3_pv
  477. ,SUM(CAST(c1_3_exp AS BIGINT)) AS c1_3_exp
  478. ,ROUND(COALESCE(SUM(CAST(c1_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(cn_2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c1_3_ror
  479. ,ROUND(COALESCE(SUM(CAST(c1_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(cn_2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c1_3_rov
  480. ,SUM(CAST(c2_3_uv AS BIGINT)) AS c2_3_uv
  481. ,SUM(CAST(c2_3_pv AS BIGINT)) AS c2_3_pv
  482. ,SUM(CAST(c2_3_exp AS BIGINT)) AS c2_3_exp
  483. ,ROUND(COALESCE(SUM(CAST(c2_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c1_3_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c2_3_ror
  484. ,ROUND(COALESCE(SUM(CAST(c2_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c1_3_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c2_3_rov
  485. ,SUM(CAST(c3_3_uv AS BIGINT)) AS c3_3_uv
  486. ,SUM(CAST(c3_3_pv AS BIGINT)) AS c3_3_pv
  487. ,SUM(CAST(c3_3_exp AS BIGINT)) AS c3_3_exp
  488. ,ROUND(COALESCE(SUM(CAST(c3_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c2_3_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c3_3_ror
  489. ,ROUND(COALESCE(SUM(CAST(c3_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c2_3_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c3_3_rov
  490. -- ==================== D链 (全量depth, 按hop) ====================
  491. ,SUM(CAST(d0 AS BIGINT)) AS d0
  492. ,SUM(CAST(dn_1_uv AS BIGINT)) AS dn_1_uv
  493. ,SUM(CAST(dn_1_pv AS BIGINT)) AS dn_1_pv
  494. ,SUM(CAST(dn_1_exp AS BIGINT)) AS dn_1_exp
  495. ,ROUND(COALESCE(SUM(CAST(dn_1_uv AS BIGINT)) / NULLIF(CAST(COUNT(DISTINCT mid) AS DOUBLE), 0), 0), 6) AS dn_1_ror
  496. ,ROUND(COALESCE(SUM(CAST(dn_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d0 AS BIGINT)) AS DOUBLE), 0), 0), 6) AS dn_1_rov
  497. ,SUM(CAST(dn_2_uv AS BIGINT)) AS dn_2_uv
  498. ,SUM(CAST(dn_2_pv AS BIGINT)) AS dn_2_pv
  499. ,SUM(CAST(dn_2_exp AS BIGINT)) AS dn_2_exp
  500. ,ROUND(COALESCE(SUM(CAST(dn_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(dn_1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS dn_2_ror
  501. ,ROUND(COALESCE(SUM(CAST(dn_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(dn_1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS dn_2_rov
  502. ,SUM(CAST(dn_3_uv AS BIGINT)) AS dn_3_uv
  503. ,SUM(CAST(dn_3_pv AS BIGINT)) AS dn_3_pv
  504. ,SUM(CAST(dn_3_exp AS BIGINT)) AS dn_3_exp
  505. ,ROUND(COALESCE(SUM(CAST(dn_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(dn_2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS dn_3_ror
  506. ,ROUND(COALESCE(SUM(CAST(dn_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(dn_2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS dn_3_rov
  507. ,SUM(CAST(dn_1_uv AS BIGINT)) + SUM(CAST(dn_2_uv AS BIGINT)) + SUM(CAST(dn_3_uv AS BIGINT)) AS dn_total_uv
  508. ,ROUND(COALESCE(
  509. (SUM(CAST(dn_1_uv AS BIGINT)) + SUM(CAST(dn_2_uv AS BIGINT)) + SUM(CAST(dn_3_uv AS BIGINT)))
  510. / NULLIF(CAST(COUNT(DISTINCT mid) AS DOUBLE), 0)
  511. , 0), 6) AS dn_total_ror
  512. ,ROUND(COALESCE(
  513. (SUM(CAST(dn_1_uv AS BIGINT)) + SUM(CAST(dn_2_uv AS BIGINT)) + SUM(CAST(dn_3_uv AS BIGINT)))
  514. / NULLIF(CAST(SUM(CAST(d0 AS BIGINT)) AS DOUBLE), 0)
  515. , 0), 6) AS dn_total_rov
  516. -- ==================== D链 (按depth拆分) ====================
  517. -- hop1
  518. ,SUM(CAST(d1_1_uv AS BIGINT)) AS d1_1_uv
  519. ,SUM(CAST(d1_1_pv AS BIGINT)) AS d1_1_pv
  520. ,SUM(CAST(d1_1_exp AS BIGINT)) AS d1_1_exp
  521. ,ROUND(COALESCE(SUM(CAST(d1_1_uv AS BIGINT)) / NULLIF(CAST(COUNT(DISTINCT mid) AS DOUBLE), 0), 0), 6) AS d1_1_ror
  522. ,ROUND(COALESCE(SUM(CAST(d1_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d0 AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d1_1_rov
  523. ,SUM(CAST(d2_1_uv AS BIGINT)) AS d2_1_uv
  524. ,SUM(CAST(d2_1_pv AS BIGINT)) AS d2_1_pv
  525. ,SUM(CAST(d2_1_exp AS BIGINT)) AS d2_1_exp
  526. ,ROUND(COALESCE(SUM(CAST(d2_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d1_1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d2_1_ror
  527. ,ROUND(COALESCE(SUM(CAST(d2_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d1_1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d2_1_rov
  528. ,SUM(CAST(d3_1_uv AS BIGINT)) AS d3_1_uv
  529. ,SUM(CAST(d3_1_pv AS BIGINT)) AS d3_1_pv
  530. ,SUM(CAST(d3_1_exp AS BIGINT)) AS d3_1_exp
  531. ,ROUND(COALESCE(SUM(CAST(d3_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d2_1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d3_1_ror
  532. ,ROUND(COALESCE(SUM(CAST(d3_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d2_1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d3_1_rov
  533. -- hop2
  534. ,SUM(CAST(d1_2_uv AS BIGINT)) AS d1_2_uv
  535. ,SUM(CAST(d1_2_pv AS BIGINT)) AS d1_2_pv
  536. ,SUM(CAST(d1_2_exp AS BIGINT)) AS d1_2_exp
  537. ,ROUND(COALESCE(SUM(CAST(d1_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(dn_1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d1_2_ror
  538. ,ROUND(COALESCE(SUM(CAST(d1_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(dn_1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d1_2_rov
  539. ,SUM(CAST(d2_2_uv AS BIGINT)) AS d2_2_uv
  540. ,SUM(CAST(d2_2_pv AS BIGINT)) AS d2_2_pv
  541. ,SUM(CAST(d2_2_exp AS BIGINT)) AS d2_2_exp
  542. ,ROUND(COALESCE(SUM(CAST(d2_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d1_2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d2_2_ror
  543. ,ROUND(COALESCE(SUM(CAST(d2_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d1_2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d2_2_rov
  544. ,SUM(CAST(d3_2_uv AS BIGINT)) AS d3_2_uv
  545. ,SUM(CAST(d3_2_pv AS BIGINT)) AS d3_2_pv
  546. ,SUM(CAST(d3_2_exp AS BIGINT)) AS d3_2_exp
  547. ,ROUND(COALESCE(SUM(CAST(d3_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d2_2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d3_2_ror
  548. ,ROUND(COALESCE(SUM(CAST(d3_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d2_2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d3_2_rov
  549. -- hop3
  550. ,SUM(CAST(d1_3_uv AS BIGINT)) AS d1_3_uv
  551. ,SUM(CAST(d1_3_pv AS BIGINT)) AS d1_3_pv
  552. ,SUM(CAST(d1_3_exp AS BIGINT)) AS d1_3_exp
  553. ,ROUND(COALESCE(SUM(CAST(d1_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(dn_2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d1_3_ror
  554. ,ROUND(COALESCE(SUM(CAST(d1_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(dn_2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d1_3_rov
  555. ,SUM(CAST(d2_3_uv AS BIGINT)) AS d2_3_uv
  556. ,SUM(CAST(d2_3_pv AS BIGINT)) AS d2_3_pv
  557. ,SUM(CAST(d2_3_exp AS BIGINT)) AS d2_3_exp
  558. ,ROUND(COALESCE(SUM(CAST(d2_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d1_3_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d2_3_ror
  559. ,ROUND(COALESCE(SUM(CAST(d2_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d1_3_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d2_3_rov
  560. ,SUM(CAST(d3_3_uv AS BIGINT)) AS d3_3_uv
  561. ,SUM(CAST(d3_3_pv AS BIGINT)) AS d3_3_pv
  562. ,SUM(CAST(d3_3_exp AS BIGINT)) AS d3_3_exp
  563. ,ROUND(COALESCE(SUM(CAST(d3_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d2_3_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d3_3_ror
  564. ,ROUND(COALESCE(SUM(CAST(d3_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d2_3_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d3_3_rov
  565. -- ==================== 全链路 ====================
  566. ,SUM(CAST(return_n_uv_noself AS BIGINT))
  567. + SUM(CAST(cn_1_uv AS BIGINT)) + SUM(CAST(cn_2_uv AS BIGINT)) + SUM(CAST(cn_3_uv AS BIGINT))
  568. + SUM(CAST(dn_1_uv AS BIGINT)) + SUM(CAST(dn_2_uv AS BIGINT)) + SUM(CAST(dn_3_uv AS BIGINT))
  569. AS all_return_n_uv
  570. ,ROUND(COALESCE(
  571. ( SUM(CAST(return_n_uv_noself AS BIGINT))
  572. + SUM(CAST(cn_1_uv AS BIGINT)) + SUM(CAST(cn_2_uv AS BIGINT)) + SUM(CAST(cn_3_uv AS BIGINT))
  573. + SUM(CAST(dn_1_uv AS BIGINT)) + SUM(CAST(dn_2_uv AS BIGINT)) + SUM(CAST(dn_3_uv AS BIGINT))
  574. ) / NULLIF(COUNT(1), 0)
  575. , 0), 6) AS all_rovn
  576. ,ROUND(COALESCE(
  577. ( SUM(CAST(return_n_uv_noself AS BIGINT))
  578. + SUM(CAST(cn_1_uv AS BIGINT)) + SUM(CAST(cn_2_uv AS BIGINT)) + SUM(CAST(cn_3_uv AS BIGINT))
  579. + SUM(CAST(dn_1_uv AS BIGINT)) + SUM(CAST(dn_2_uv AS BIGINT)) + SUM(CAST(dn_3_uv AS BIGINT))
  580. ) / NULLIF(CAST(COUNT(1) AS DOUBLE), 0)
  581. , 0), 6) AS all_rov
  582. ,ROUND(COALESCE(
  583. ( SUM(CAST(return_n_uv_noself AS BIGINT))
  584. + SUM(CAST(cn_1_uv AS BIGINT)) + SUM(CAST(cn_2_uv AS BIGINT)) + SUM(CAST(cn_3_uv AS BIGINT))
  585. + SUM(CAST(dn_1_uv AS BIGINT)) + SUM(CAST(dn_2_uv AS BIGINT)) + SUM(CAST(dn_3_uv AS BIGINT))
  586. ) / NULLIF(CAST(COUNT(DISTINCT mid) AS DOUBLE), 0)
  587. , 0), 6) AS all_ror
  588. -- =====================================================================
  589. -- FROM + GROUP BY CUBE
  590. -- =====================================================================
  591. FROM t_wide
  592. GROUP BY CUBE(
  593. user_type
  594. ,hh_bucket
  595. ,head_merge_leve2
  596. ,vid_merge_leve2
  597. ,vid_id
  598. )
  599. ORDER BY exposure_cnt DESC
  600. ;