| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601 |
- -- =====================================================================
- -- 曝光回流链路 CUBE 聚合表 (基于 wide 宽表, 增加用户/品类维度 + 模型预估指标)
- -- 维度: user_type × hh_bucket × head_merge_leve2 × vid_merge_leve2 × vid_id (CUBE)
- -- 参考: de.sql + dwd_recsys_alg_exposure_agg_20260209
- -- =====================================================================
- -- -- DROP TABLE IF EXISTS loghubods.dwd_recsys_alg_exposure_agg_wide_20260209;
- -- CREATE TABLE IF NOT EXISTS loghubods.dwd_recsys_alg_exposure_agg_wide_20260209 (
- -- -- ==================== 维度列 ====================
- -- dt STRING COMMENT '日期'
- -- ,user_type STRING COMMENT '用户拉活量分层(R0&新用户/R1-50/R_180_330等,汇总为SUM)'
- -- ,hh_bucket STRING COMMENT '小时段(00-03/04-07/.../20-23,汇总为SUM)'
- -- ,head_merge_leve2 STRING COMMENT '进入内容品类(headvideoid品类,汇总为SUM)'
- -- ,vid_merge_leve2 STRING COMMENT '推荐内容品类(vid品类,TOP10曝光+其他,汇总为SUM)'
- -- ,vid_id STRING COMMENT '内容id(品类曝光TOP1+其他,汇总为SUM)'
- -- -- ==================== 基础流量 ====================
- -- ,exposure_cnt BIGINT COMMENT '曝光次数'
- -- ,exposure_uv BIGINT COMMENT '曝光人数(mid去重)'
- -- ,vid_cnt BIGINT COMMENT '视频个数(vid去重)'
- -- ,exposure_per_user DOUBLE COMMENT '人均曝光次数 = 曝光次数/曝光人数'
- -- -- ==================== 分享 ====================
- -- ,share_exposure_cnt BIGINT COMMENT '产生分享的曝光数'
- -- ,share_cnt BIGINT COMMENT '分享总次数'
- -- -- ==================== STR 指标 ====================
- -- ,str_real DOUBLE COMMENT 'STR实际 = is_return_noself/曝光次数'
- -- ,str_pred DOUBLE COMMENT 'STR预估 = SUM(str_pred)/曝光次数'
- -- ,str_copc DOUBLE COMMENT 'STR copc = str_real/str_pred'
- -- ,str_mae DOUBLE COMMENT 'STR MAE = AVG(ABS(str_pred - is_return_noself))'
- -- ,str_var DOUBLE COMMENT 'STR VAR = VARIANCE(str_pred - is_return_noself)'
- -- -- ==================== ROSN 指标 ====================
- -- ,rosn_real DOUBLE COMMENT 'ROSN实际 = return_n_uv_noself/is_return_noself'
- -- ,rosn_pred DOUBLE COMMENT 'ROSN预估 = SUM(rosn_pred)/is_return_noself'
- -- ,rosn_copc DOUBLE COMMENT 'ROSN copc = rosn_real/rosn_pred'
- -- ,rosn_pred_origin DOUBLE COMMENT 'ROSN原始预估均值 = AVG(rosn_pred_origin)'
- -- ,rosn_mae DOUBLE COMMENT 'ROSN MAE = AVG(ABS(rosn_pred - return_n_uv_noself)) WHERE is_return_noself=1'
- -- ,rosn_var DOUBLE COMMENT 'ROSN VAR = VARIANCE(rosn_pred - return_n_uv_noself) WHERE is_return_noself=1'
- -- -- ==================== ROVN 指标 ====================
- -- ,rovn DOUBLE COMMENT 'rovn实际 = return_n_uv_noself/曝光次数'
- -- ,rovn_pred DOUBLE COMMENT 'rovn预估 = AVG(str_pred*rosn_pred)'
- -- ,rovn_copc DOUBLE COMMENT 'rovn copc = rovn/rovn_pred'
- -- ,rovn_mae DOUBLE COMMENT 'rovn MAE = AVG(ABS(str_pred*rosn_pred - return_n_uv_noself/曝光次数))'
- -- ,rovn_var DOUBLE COMMENT 'rovn VAR = VARIANCE(str_pred*rosn_pred - return_n_uv_noself/曝光次数)'
- -- ,sortscore_avg DOUBLE COMMENT 'sortscore均值'
- -- -- ==================== B链 (分享→点击) ====================
- -- ,bn_exp BIGINT COMMENT 'B链全量: 回流session曝光数'
- -- ,bn_pv BIGINT COMMENT 'B链全量: 回流点击次数'
- -- ,bn_uv BIGINT COMMENT 'B链全量: 回流去重人数'
- -- ,b1_exp BIGINT COMMENT 'B链depth=1: 回流session曝光数'
- -- ,b1_pv BIGINT COMMENT 'B链depth=1: 回流点击次数'
- -- ,b1_uv BIGINT COMMENT 'B链depth=1: 回流去重人数'
- -- ,b2_exp BIGINT COMMENT 'B链depth=2: 回流session曝光数'
- -- ,b2_pv BIGINT COMMENT 'B链depth=2: 回流点击次数'
- -- ,b2_uv BIGINT COMMENT 'B链depth=2: 回流去重人数'
- -- ,b3_exp BIGINT COMMENT 'B链depth=3: 回流session曝光数'
- -- ,b3_pv BIGINT COMMENT 'B链depth=3: 回流点击次数'
- -- ,b3_uv BIGINT COMMENT 'B链depth=3: 回流去重人数'
- -- ,bn_rov DOUBLE COMMENT 'B链全量: rov = bn_uv/曝光次数'
- -- ,bn_ror DOUBLE COMMENT 'B链全量: ror = bn_uv/曝光人数'
- -- ,b1_rov DOUBLE COMMENT 'B链depth=1: rov = b1_uv/曝光次数'
- -- ,b1_ror DOUBLE COMMENT 'B链depth=1: ror = b1_uv/曝光人数'
- -- ,b2_rov DOUBLE COMMENT 'B链depth=2: rov = b2_uv/b1曝光数'
- -- ,b2_ror DOUBLE COMMENT 'B链depth=2: ror = b2_uv/b1人数'
- -- ,b3_rov DOUBLE COMMENT 'B链depth=3: rov = b3_uv/b2曝光数'
- -- ,b3_ror DOUBLE COMMENT 'B链depth=3: ror = b3_uv/b2人数'
- -- -- ==================== C链 (全量depth, 按hop) ====================
- -- ,cn_1_exp BIGINT COMMENT 'C链hop1: 回流session曝光数'
- -- ,cn_1_pv BIGINT COMMENT 'C链hop1: 回流点击次数'
- -- ,cn_1_uv BIGINT COMMENT 'C链hop1: 回流去重人数'
- -- ,cn_2_exp BIGINT COMMENT 'C链hop2: 回流session曝光数'
- -- ,cn_2_pv BIGINT COMMENT 'C链hop2: 回流点击次数'
- -- ,cn_2_uv BIGINT COMMENT 'C链hop2: 回流去重人数'
- -- ,cn_3_exp BIGINT COMMENT 'C链hop3: 回流session曝光数'
- -- ,cn_3_pv BIGINT COMMENT 'C链hop3: 回流点击次数'
- -- ,cn_3_uv BIGINT COMMENT 'C链hop3: 回流去重人数'
- -- ,cn_total_uv BIGINT COMMENT 'C链合计UV'
- -- ,cn_1_rov DOUBLE COMMENT 'C链hop1: rov = cn_1_uv/bn曝光数'
- -- ,cn_1_ror DOUBLE COMMENT 'C链hop1: ror = cn_1_uv/bn人数'
- -- ,cn_2_rov DOUBLE COMMENT 'C链hop2: rov = cn_2_uv/cn_1曝光数'
- -- ,cn_2_ror DOUBLE COMMENT 'C链hop2: ror = cn_2_uv/cn_1人数'
- -- ,cn_3_rov DOUBLE COMMENT 'C链hop3: rov = cn_3_uv/cn_2曝光数'
- -- ,cn_3_ror DOUBLE COMMENT 'C链hop3: ror = cn_3_uv/cn_2人数'
- -- ,cn_total_rov DOUBLE COMMENT 'C链合计: rov = cn_total_uv/bn曝光数'
- -- ,cn_total_ror DOUBLE COMMENT 'C链合计: ror = cn_total_uv/bn人数'
- -- ,c1_1_exp BIGINT COMMENT 'C链depth1-hop1: 回流session曝光数'
- -- ,c1_1_pv BIGINT COMMENT 'C链depth1-hop1: 回流点击次数'
- -- ,c1_1_uv BIGINT COMMENT 'C链depth1-hop1: 回流去重人数'
- -- ,c1_2_exp BIGINT COMMENT 'C链depth1-hop2: 回流session曝光数'
- -- ,c1_2_pv BIGINT COMMENT 'C链depth1-hop2: 回流点击次数'
- -- ,c1_2_uv BIGINT COMMENT 'C链depth1-hop2: 回流去重人数'
- -- ,c1_3_exp BIGINT COMMENT 'C链depth1-hop3: 回流session曝光数'
- -- ,c1_3_pv BIGINT COMMENT 'C链depth1-hop3: 回流点击次数'
- -- ,c1_3_uv BIGINT COMMENT 'C链depth1-hop3: 回流去重人数'
- -- ,c2_1_exp BIGINT COMMENT 'C链depth2-hop1: 回流session曝光数'
- -- ,c2_1_pv BIGINT COMMENT 'C链depth2-hop1: 回流点击次数'
- -- ,c2_1_uv BIGINT COMMENT 'C链depth2-hop1: 回流去重人数'
- -- ,c2_2_exp BIGINT COMMENT 'C链depth2-hop2: 回流session曝光数'
- -- ,c2_2_pv BIGINT COMMENT 'C链depth2-hop2: 回流点击次数'
- -- ,c2_2_uv BIGINT COMMENT 'C链depth2-hop2: 回流去重人数'
- -- ,c2_3_exp BIGINT COMMENT 'C链depth2-hop3: 回流session曝光数'
- -- ,c2_3_pv BIGINT COMMENT 'C链depth2-hop3: 回流点击次数'
- -- ,c2_3_uv BIGINT COMMENT 'C链depth2-hop3: 回流去重人数'
- -- ,c3_1_exp BIGINT COMMENT 'C链depth3-hop1: 回流session曝光数'
- -- ,c3_1_pv BIGINT COMMENT 'C链depth3-hop1: 回流点击次数'
- -- ,c3_1_uv BIGINT COMMENT 'C链depth3-hop1: 回流去重人数'
- -- ,c3_2_exp BIGINT COMMENT 'C链depth3-hop2: 回流session曝光数'
- -- ,c3_2_pv BIGINT COMMENT 'C链depth3-hop2: 回流点击次数'
- -- ,c3_2_uv BIGINT COMMENT 'C链depth3-hop2: 回流去重人数'
- -- ,c3_3_exp BIGINT COMMENT 'C链depth3-hop3: 回流session曝光数'
- -- ,c3_3_pv BIGINT COMMENT 'C链depth3-hop3: 回流点击次数'
- -- ,c3_3_uv BIGINT COMMENT 'C链depth3-hop3: 回流去重人数'
- -- ,c1_1_rov DOUBLE COMMENT 'C链d1-hop1: rov = c1_1_uv/bn曝光数'
- -- ,c1_1_ror DOUBLE COMMENT 'C链d1-hop1: ror = c1_1_uv/bn人数'
- -- ,c2_1_rov DOUBLE COMMENT 'C链d2-hop1: rov = c2_1_uv/c1_1曝光数'
- -- ,c2_1_ror DOUBLE COMMENT 'C链d2-hop1: ror = c2_1_uv/c1_1人数'
- -- ,c3_1_rov DOUBLE COMMENT 'C链d3-hop1: rov = c3_1_uv/c2_1曝光数'
- -- ,c3_1_ror DOUBLE COMMENT 'C链d3-hop1: ror = c3_1_uv/c2_1人数'
- -- ,c1_2_rov DOUBLE COMMENT 'C链d1-hop2: rov = c1_2_uv/cn_1曝光数'
- -- ,c1_2_ror DOUBLE COMMENT 'C链d1-hop2: ror = c1_2_uv/cn_1人数'
- -- ,c2_2_rov DOUBLE COMMENT 'C链d2-hop2: rov = c2_2_uv/c1_2曝光数'
- -- ,c2_2_ror DOUBLE COMMENT 'C链d2-hop2: ror = c2_2_uv/c1_2人数'
- -- ,c3_2_rov DOUBLE COMMENT 'C链d3-hop2: rov = c3_2_uv/c2_2曝光数'
- -- ,c3_2_ror DOUBLE COMMENT 'C链d3-hop2: ror = c3_2_uv/c2_2人数'
- -- ,c1_3_rov DOUBLE COMMENT 'C链d1-hop3: rov = c1_3_uv/cn_2曝光数'
- -- ,c1_3_ror DOUBLE COMMENT 'C链d1-hop3: ror = c1_3_uv/cn_2人数'
- -- ,c2_3_rov DOUBLE COMMENT 'C链d2-hop3: rov = c2_3_uv/c1_3曝光数'
- -- ,c2_3_ror DOUBLE COMMENT 'C链d2-hop3: ror = c2_3_uv/c1_3人数'
- -- ,c3_3_rov DOUBLE COMMENT 'C链d3-hop3: rov = c3_3_uv/c2_3曝光数'
- -- ,c3_3_ror DOUBLE COMMENT 'C链d3-hop3: ror = c3_3_uv/c2_3人数'
- -- -- ==================== D链 (session内后续曝光传播) ====================
- -- ,d0 BIGINT COMMENT 'D链初始成本: session内后续曝光数'
- -- ,dn_1_exp BIGINT COMMENT 'D链hop1: 回流session曝光数'
- -- ,dn_1_pv BIGINT COMMENT 'D链hop1: 回流点击次数'
- -- ,dn_1_uv BIGINT COMMENT 'D链hop1: 回流去重人数'
- -- ,dn_2_exp BIGINT COMMENT 'D链hop2: 回流session曝光数'
- -- ,dn_2_pv BIGINT COMMENT 'D链hop2: 回流点击次数'
- -- ,dn_2_uv BIGINT COMMENT 'D链hop2: 回流去重人数'
- -- ,dn_3_exp BIGINT COMMENT 'D链hop3: 回流session曝光数'
- -- ,dn_3_pv BIGINT COMMENT 'D链hop3: 回流点击次数'
- -- ,dn_3_uv BIGINT COMMENT 'D链hop3: 回流去重人数'
- -- ,dn_total_uv BIGINT COMMENT 'D链合计UV'
- -- ,dn_1_rov DOUBLE COMMENT 'D链hop1: rov = dn_1_uv/d0初始曝光数'
- -- ,dn_1_ror DOUBLE COMMENT 'D链hop1: ror = dn_1_uv/曝光人数'
- -- ,dn_2_rov DOUBLE COMMENT 'D链hop2: rov = dn_2_uv/dn_1曝光数'
- -- ,dn_2_ror DOUBLE COMMENT 'D链hop2: ror = dn_2_uv/dn_1人数'
- -- ,dn_3_rov DOUBLE COMMENT 'D链hop3: rov = dn_3_uv/dn_2曝光数'
- -- ,dn_3_ror DOUBLE COMMENT 'D链hop3: ror = dn_3_uv/dn_2人数'
- -- ,dn_total_rov DOUBLE COMMENT 'D链合计: rov = dn_total_uv/d0初始曝光数'
- -- ,dn_total_ror DOUBLE COMMENT 'D链合计: ror = dn_total_uv/曝光人数'
- -- ,d1_1_exp BIGINT COMMENT 'D链depth1-hop1: 回流session曝光数'
- -- ,d1_1_pv BIGINT COMMENT 'D链depth1-hop1: 回流点击次数'
- -- ,d1_1_uv BIGINT COMMENT 'D链depth1-hop1: 回流去重人数'
- -- ,d1_2_exp BIGINT COMMENT 'D链depth1-hop2: 回流session曝光数'
- -- ,d1_2_pv BIGINT COMMENT 'D链depth1-hop2: 回流点击次数'
- -- ,d1_2_uv BIGINT COMMENT 'D链depth1-hop2: 回流去重人数'
- -- ,d1_3_exp BIGINT COMMENT 'D链depth1-hop3: 回流session曝光数'
- -- ,d1_3_pv BIGINT COMMENT 'D链depth1-hop3: 回流点击次数'
- -- ,d1_3_uv BIGINT COMMENT 'D链depth1-hop3: 回流去重人数'
- -- ,d2_1_exp BIGINT COMMENT 'D链depth2-hop1: 回流session曝光数'
- -- ,d2_1_pv BIGINT COMMENT 'D链depth2-hop1: 回流点击次数'
- -- ,d2_1_uv BIGINT COMMENT 'D链depth2-hop1: 回流去重人数'
- -- ,d2_2_exp BIGINT COMMENT 'D链depth2-hop2: 回流session曝光数'
- -- ,d2_2_pv BIGINT COMMENT 'D链depth2-hop2: 回流点击次数'
- -- ,d2_2_uv BIGINT COMMENT 'D链depth2-hop2: 回流去重人数'
- -- ,d2_3_exp BIGINT COMMENT 'D链depth2-hop3: 回流session曝光数'
- -- ,d2_3_pv BIGINT COMMENT 'D链depth2-hop3: 回流点击次数'
- -- ,d2_3_uv BIGINT COMMENT 'D链depth2-hop3: 回流去重人数'
- -- ,d3_1_exp BIGINT COMMENT 'D链depth3-hop1: 回流session曝光数'
- -- ,d3_1_pv BIGINT COMMENT 'D链depth3-hop1: 回流点击次数'
- -- ,d3_1_uv BIGINT COMMENT 'D链depth3-hop1: 回流去重人数'
- -- ,d3_2_exp BIGINT COMMENT 'D链depth3-hop2: 回流session曝光数'
- -- ,d3_2_pv BIGINT COMMENT 'D链depth3-hop2: 回流点击次数'
- -- ,d3_2_uv BIGINT COMMENT 'D链depth3-hop2: 回流去重人数'
- -- ,d3_3_exp BIGINT COMMENT 'D链depth3-hop3: 回流session曝光数'
- -- ,d3_3_pv BIGINT COMMENT 'D链depth3-hop3: 回流点击次数'
- -- ,d3_3_uv BIGINT COMMENT 'D链depth3-hop3: 回流去重人数'
- -- ,d1_1_rov DOUBLE COMMENT 'D链d1-hop1: rov = d1_1_uv/d0初始曝光数'
- -- ,d1_1_ror DOUBLE COMMENT 'D链d1-hop1: ror = d1_1_uv/曝光人数'
- -- ,d2_1_rov DOUBLE COMMENT 'D链d2-hop1: rov = d2_1_uv/d1_1曝光数'
- -- ,d2_1_ror DOUBLE COMMENT 'D链d2-hop1: ror = d2_1_uv/d1_1人数'
- -- ,d3_1_rov DOUBLE COMMENT 'D链d3-hop1: rov = d3_1_uv/d2_1曝光数'
- -- ,d3_1_ror DOUBLE COMMENT 'D链d3-hop1: ror = d3_1_uv/d2_1人数'
- -- ,d1_2_rov DOUBLE COMMENT 'D链d1-hop2: rov = d1_2_uv/dn_1曝光数'
- -- ,d1_2_ror DOUBLE COMMENT 'D链d1-hop2: ror = d1_2_uv/dn_1人数'
- -- ,d2_2_rov DOUBLE COMMENT 'D链d2-hop2: rov = d2_2_uv/d1_2曝光数'
- -- ,d2_2_ror DOUBLE COMMENT 'D链d2-hop2: ror = d2_2_uv/d1_2人数'
- -- ,d3_2_rov DOUBLE COMMENT 'D链d3-hop2: rov = d3_2_uv/d2_2曝光数'
- -- ,d3_2_ror DOUBLE COMMENT 'D链d3-hop2: ror = d3_2_uv/d2_2人数'
- -- ,d1_3_rov DOUBLE COMMENT 'D链d1-hop3: rov = d1_3_uv/dn_2曝光数'
- -- ,d1_3_ror DOUBLE COMMENT 'D链d1-hop3: ror = d1_3_uv/dn_2人数'
- -- ,d2_3_rov DOUBLE COMMENT 'D链d2-hop3: rov = d2_3_uv/d1_3曝光数'
- -- ,d2_3_ror DOUBLE COMMENT 'D链d2-hop3: ror = d2_3_uv/d1_3人数'
- -- ,d3_3_rov DOUBLE COMMENT 'D链d3-hop3: rov = d3_3_uv/d2_3曝光数'
- -- ,d3_3_ror DOUBLE COMMENT 'D链d3-hop3: ror = d3_3_uv/d2_3人数'
- -- -- ==================== 全链路 ====================
- -- ,all_return_n_uv BIGINT COMMENT '全链路拉回UV = B + C + D'
- -- ,all_rovn DOUBLE COMMENT '全链路拉回率 = all_return_n_uv/曝光次数'
- -- ,all_rov DOUBLE COMMENT '全链路: rov = all_return_n_uv/曝光次数'
- -- ,all_ror DOUBLE COMMENT '全链路: ror = all_return_n_uv/曝光人数'
- -- )
- -- COMMENT '曝光回流链路CUBE聚合-宽表版 (5维度: 用户分层/小时段/进入品类TOP1/推荐品类TOP10/内容idTOP1)'
- -- ;
- WITH
- -- 用户拉活量分层
- t_user_type AS (
- SELECT DISTINCT type, openid
- FROM loghubods.mid_share_return_people_1year
- WHERE dt = TO_CHAR(DATEADD(TO_DATE('${dt}','YYYYMMDD'),-1,'dd'),'YYYYMMDD')
- AND type IS NOT NULL
- AND type != 'S_ALL'
- AND type NOT REGEXP 'R50'
- )
- -- 模型预估分数
- ,t_score AS (
- SELECT apptype
- ,videoid
- ,recommendtraceid
- ,scoresmap
- ,sortscore
- FROM (
- SELECT apptype
- ,videoid
- ,recommendtraceid
- ,scoresmap
- ,sortscore
- ,ROW_NUMBER() OVER (PARTITION BY apptype,videoid,recommendtraceid) AS rn
- FROM loghubods.statistics_log_hour
- WHERE dt LIKE '${dt}%'
- AND scoresmap IS NOT NULL
- )
- WHERE rn = 1
- )
- -- TOP1 进入内容品类(场): 按回流人数取 TOP1
- ,t_top_head_cate AS (
- SELECT vt.merge_leve2
- FROM loghubods.dwd_recsys_alg_exposure_base_20260209 base
- JOIN loghubods.video_merge_tag vt ON base.headvideoid = vt.videoid
- WHERE base.dt = '${dt}'
- AND vt.merge_leve2 IS NOT NULL
- GROUP BY vt.merge_leve2
- ORDER BY SUM(CAST(is_return_noself AS BIGINT)) DESC
- LIMIT 1
- )
- -- TOP10 推荐内容品类(货): 按曝光次数取 TOP10
- ,t_top_vid_cate AS (
- SELECT vt.merge_leve2
- FROM loghubods.dwd_recsys_alg_exposure_base_20260209 base
- JOIN loghubods.video_merge_tag vt ON base.vid = vt.videoid
- WHERE base.dt = '${dt}'
- AND vt.merge_leve2 IS NOT NULL
- GROUP BY vt.merge_leve2
- ORDER BY COUNT(1) DESC
- LIMIT 10
- )
- -- TOP1 内容id(货): 每品类按曝光次数取 TOP1 (曝光>10w)
- ,t_top_vid AS (
- SELECT merge_leve2, vid
- FROM (
- SELECT vt.merge_leve2
- ,base.vid
- ,COUNT(1) AS exp_cnt
- ,ROW_NUMBER() OVER (PARTITION BY vt.merge_leve2 ORDER BY COUNT(1) DESC) AS rk
- FROM loghubods.dwd_recsys_alg_exposure_base_20260209 base
- JOIN loghubods.video_merge_tag vt ON base.vid = vt.videoid
- WHERE base.dt = '${dt}'
- AND vt.merge_leve2 IS NOT NULL
- GROUP BY vt.merge_leve2, base.vid
- HAVING exp_cnt > 100000
- )
- WHERE rk <= 1
- )
- -- 宽表
- ,t_wide AS (
- SELECT base.*
- ,CASE WHEN e.type IS NULL OR e.type = 'R_0' THEN 'R0&新用户'
- WHEN e.type IN ('R_1','R_2_10','R_10_50') THEN 'R1-50'
- WHEN e.type IN ('R_50_100','R_100_180','R_180_330') THEN 'R_180_330'
- ELSE e.type
- END AS user_type
- ,CASE WHEN th.merge_leve2 IS NOT NULL THEN vt_head.merge_leve2 ELSE '其他' END AS head_merge_leve2
- ,CASE WHEN tv.merge_leve2 IS NOT NULL THEN vt_vid.merge_leve2 ELSE '其他' END AS vid_merge_leve2
- ,CASE WHEN ti.vid IS NOT NULL THEN base.vid ELSE '其他' END AS vid_id
- ,CAST(GET_JSON_OBJECT(e1.scoresmap,'$.fmRov') AS DOUBLE) AS str_pred
- ,1.22*POW(CAST(GET_JSON_OBJECT(e1.scoresmap,'$.NorXGBScore') AS DOUBLE),1.15) AS rosn_pred
- ,CAST(GET_JSON_OBJECT(e1.scoresmap,'$.hasReturnRovScore') AS DOUBLE) AS rosn_pred_origin
- ,e1.sortscore
- ,CASE
- WHEN CAST(hh AS INT) BETWEEN 0 AND 3 THEN '00-03'
- WHEN CAST(hh AS INT) BETWEEN 4 AND 7 THEN '04-07'
- WHEN CAST(hh AS INT) BETWEEN 8 AND 11 THEN '08-11'
- WHEN CAST(hh AS INT) BETWEEN 12 AND 15 THEN '12-15'
- WHEN CAST(hh AS INT) BETWEEN 16 AND 19 THEN '16-19'
- WHEN CAST(hh AS INT) BETWEEN 20 AND 23 THEN '20-23'
- ELSE '-'
- END AS hh_bucket
- FROM loghubods.dwd_recsys_alg_exposure_base_20260209 base
- LEFT JOIN t_user_type e
- ON SUBSTRING_INDEX(base.mid,'weixin_openid_',-1) = e.openid
- LEFT JOIN loghubods.video_merge_tag vt_head
- ON base.headvideoid = vt_head.videoid
- LEFT JOIN loghubods.video_merge_tag vt_vid
- ON base.vid = vt_vid.videoid
- LEFT JOIN t_score e1
- ON base.apptype = e1.apptype
- AND base.vid = e1.videoid
- AND base.recomtraceid = e1.recommendtraceid
- LEFT JOIN t_top_head_cate th
- ON vt_head.merge_leve2 = th.merge_leve2
- LEFT JOIN t_top_vid_cate tv
- ON vt_vid.merge_leve2 = tv.merge_leve2
- LEFT JOIN t_top_vid ti
- ON base.vid = ti.vid
- WHERE base.dt = '${dt}'
- )
- SELECT
- -- ==================== 维度列 ====================
- '${dt}' AS dt
- ,CASE WHEN GROUPING(user_type) = 1 THEN 'SUM' ELSE NVL(user_type, 'SUM') END AS user_type
- ,CASE WHEN GROUPING(hh_bucket) = 1 THEN 'SUM' ELSE NVL(hh_bucket, 'SUM') END AS hh_bucket
- ,CASE WHEN GROUPING(head_merge_leve2) = 1 THEN 'SUM' ELSE NVL(head_merge_leve2, 'SUM') END AS head_merge_leve2
- ,CASE WHEN GROUPING(vid_merge_leve2) = 1 THEN 'SUM' ELSE NVL(vid_merge_leve2, 'SUM') END AS vid_merge_leve2
- ,CASE WHEN GROUPING(vid_id) = 1 THEN 'SUM' ELSE NVL(vid_id, 'SUM') END AS vid_id
- -- ==================== 基础流量 ====================
- ,COUNT(1) AS exposure_cnt
- ,COUNT(DISTINCT mid) AS exposure_uv
- ,COUNT(DISTINCT vid) AS vid_cnt
- ,ROUND(COUNT(1) / COUNT(DISTINCT mid), 4) AS exposure_per_user
- -- ==================== 分享 ====================
- ,SUM(CAST(is_share AS BIGINT)) AS share_exposure_cnt
- ,SUM(CAST(share_cnt AS BIGINT)) AS share_cnt
- -- ==================== STR 指标 ====================
- ,ROUND(COALESCE(SUM(CAST(is_return_noself AS BIGINT)) / NULLIF(COUNT(1), 0), 0), 6) AS str_real
- ,ROUND(COALESCE(SUM(str_pred) / NULLIF(COUNT(1), 0), 0), 6) AS str_pred
- ,ROUND(
- (SUM(CAST(is_return_noself AS BIGINT)) / NULLIF(COUNT(1), 0))
- / NULLIF(SUM(str_pred) / NULLIF(COUNT(1), 0), 0)
- , 4) AS str_copc
- ,ROUND(AVG(ABS(str_pred - CAST(is_return_noself AS BIGINT))), 6) AS str_mae
- ,ROUND(VARIANCE(str_pred - CAST(is_return_noself AS BIGINT)), 6) AS str_var
- -- ==================== ROSN 指标 ====================
- ,ROUND(COALESCE(
- SUM(CAST(return_n_uv_noself AS BIGINT)) / NULLIF(SUM(CAST(is_return_noself AS BIGINT)), 0)
- , 0), 6) AS rosn_real
- ,ROUND(COALESCE(SUM(rosn_pred) / NULLIF(SUM(CAST(is_return_noself AS BIGINT)), 0), 0), 6) AS rosn_pred
- ,ROUND(
- (SUM(CAST(return_n_uv_noself AS BIGINT)) / NULLIF(SUM(CAST(is_return_noself AS BIGINT)), 0))
- / NULLIF(SUM(rosn_pred) / NULLIF(SUM(CAST(is_return_noself AS BIGINT)), 0), 0)
- , 4) AS rosn_copc
- ,ROUND(AVG(rosn_pred_origin), 6) AS rosn_pred_origin
- ,ROUND(AVG(
- CASE WHEN CAST(is_return_noself AS BIGINT) = 1
- THEN ABS(rosn_pred - CAST(return_n_uv_noself AS BIGINT))
- END
- ), 6) AS rosn_mae
- ,ROUND(VARIANCE(
- CASE WHEN CAST(is_return_noself AS BIGINT) = 1
- THEN rosn_pred - CAST(return_n_uv_noself AS BIGINT)
- END
- ), 6) AS rosn_var
- -- ==================== ROVN 指标 ====================
- ,ROUND(COALESCE(SUM(CAST(return_n_uv_noself AS BIGINT)) / NULLIF(COUNT(1), 0), 0), 6) AS rovn
- ,ROUND(AVG(str_pred * rosn_pred), 6) AS rovn_pred
- ,ROUND(
- (SUM(CAST(return_n_uv_noself AS BIGINT)) / NULLIF(COUNT(1), 0))
- / NULLIF(AVG(str_pred * rosn_pred), 0)
- , 4) AS rovn_copc
- ,ROUND(AVG(ABS(str_pred * rosn_pred - CAST(return_n_uv_noself AS BIGINT))), 6) AS rovn_mae
- ,ROUND(VARIANCE(str_pred * rosn_pred - CAST(return_n_uv_noself AS BIGINT)), 6) AS rovn_var
- ,ROUND(AVG(CAST(sortscore AS DOUBLE)), 6) AS sortscore_avg
- -- ==================== B链 ====================
- ,SUM(CAST(bn_exp AS BIGINT)) AS bn_exp
- ,SUM(CAST(bn_pv AS BIGINT)) AS bn_pv
- ,SUM(CAST(bn_uv AS BIGINT)) AS bn_uv
- ,SUM(CAST(b1_exp AS BIGINT)) AS b1_exp
- ,SUM(CAST(b1_pv AS BIGINT)) AS b1_pv
- ,SUM(CAST(b1_uv AS BIGINT)) AS b1_uv
- ,SUM(CAST(b2_exp AS BIGINT)) AS b2_exp
- ,SUM(CAST(b2_pv AS BIGINT)) AS b2_pv
- ,SUM(CAST(b2_uv AS BIGINT)) AS b2_uv
- ,SUM(CAST(b3_exp AS BIGINT)) AS b3_exp
- ,SUM(CAST(b3_pv AS BIGINT)) AS b3_pv
- ,SUM(CAST(b3_uv AS BIGINT)) AS b3_uv
- ,ROUND(COALESCE(SUM(CAST(bn_uv AS BIGINT)) / NULLIF(CAST(COUNT(1) AS DOUBLE), 0), 0), 6) AS bn_rov
- ,ROUND(COALESCE(SUM(CAST(bn_uv AS BIGINT)) / NULLIF(CAST(COUNT(DISTINCT mid) AS DOUBLE), 0), 0), 6) AS bn_ror
- ,ROUND(COALESCE(SUM(CAST(b1_uv AS BIGINT)) / NULLIF(CAST(COUNT(1) AS DOUBLE), 0), 0), 6) AS b1_rov
- ,ROUND(COALESCE(SUM(CAST(b1_uv AS BIGINT)) / NULLIF(CAST(COUNT(DISTINCT mid) AS DOUBLE), 0), 0), 6) AS b1_ror
- ,ROUND(COALESCE(SUM(CAST(b2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(b1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS b2_rov
- ,ROUND(COALESCE(SUM(CAST(b2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(b1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS b2_ror
- ,ROUND(COALESCE(SUM(CAST(b3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(b2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS b3_rov
- ,ROUND(COALESCE(SUM(CAST(b3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(b2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS b3_ror
- -- ==================== C链 (全量depth, 按hop) ====================
- ,SUM(CAST(cn_1_exp AS BIGINT)) AS cn_1_exp
- ,SUM(CAST(cn_1_pv AS BIGINT)) AS cn_1_pv
- ,SUM(CAST(cn_1_uv AS BIGINT)) AS cn_1_uv
- ,SUM(CAST(cn_2_exp AS BIGINT)) AS cn_2_exp
- ,SUM(CAST(cn_2_pv AS BIGINT)) AS cn_2_pv
- ,SUM(CAST(cn_2_uv AS BIGINT)) AS cn_2_uv
- ,SUM(CAST(cn_3_exp AS BIGINT)) AS cn_3_exp
- ,SUM(CAST(cn_3_pv AS BIGINT)) AS cn_3_pv
- ,SUM(CAST(cn_3_uv AS BIGINT)) AS cn_3_uv
- ,SUM(CAST(cn_1_uv AS BIGINT)) + SUM(CAST(cn_2_uv AS BIGINT)) + SUM(CAST(cn_3_uv AS BIGINT)) AS cn_total_uv
- ,ROUND(COALESCE(SUM(CAST(cn_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(bn_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS cn_1_rov
- ,ROUND(COALESCE(SUM(CAST(cn_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(bn_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS cn_1_ror
- ,ROUND(COALESCE(SUM(CAST(cn_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(cn_1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS cn_2_rov
- ,ROUND(COALESCE(SUM(CAST(cn_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(cn_1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS cn_2_ror
- ,ROUND(COALESCE(SUM(CAST(cn_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(cn_2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS cn_3_rov
- ,ROUND(COALESCE(SUM(CAST(cn_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(cn_2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS cn_3_ror
- ,ROUND(COALESCE(
- (SUM(CAST(cn_1_uv AS BIGINT)) + SUM(CAST(cn_2_uv AS BIGINT)) + SUM(CAST(cn_3_uv AS BIGINT)))
- / NULLIF(CAST(SUM(CAST(bn_exp AS BIGINT)) AS DOUBLE), 0)
- , 0), 6) AS cn_total_rov
- ,ROUND(COALESCE(
- (SUM(CAST(cn_1_uv AS BIGINT)) + SUM(CAST(cn_2_uv AS BIGINT)) + SUM(CAST(cn_3_uv AS BIGINT)))
- / NULLIF(CAST(SUM(CAST(bn_uv AS BIGINT)) AS DOUBLE), 0)
- , 0), 6) AS cn_total_ror
- -- ==================== C链 (按depth拆分) ====================
- ,SUM(CAST(c1_1_exp AS BIGINT)) AS c1_1_exp
- ,SUM(CAST(c1_1_pv AS BIGINT)) AS c1_1_pv
- ,SUM(CAST(c1_1_uv AS BIGINT)) AS c1_1_uv
- ,SUM(CAST(c1_2_exp AS BIGINT)) AS c1_2_exp
- ,SUM(CAST(c1_2_pv AS BIGINT)) AS c1_2_pv
- ,SUM(CAST(c1_2_uv AS BIGINT)) AS c1_2_uv
- ,SUM(CAST(c1_3_exp AS BIGINT)) AS c1_3_exp
- ,SUM(CAST(c1_3_pv AS BIGINT)) AS c1_3_pv
- ,SUM(CAST(c1_3_uv AS BIGINT)) AS c1_3_uv
- ,SUM(CAST(c2_1_exp AS BIGINT)) AS c2_1_exp
- ,SUM(CAST(c2_1_pv AS BIGINT)) AS c2_1_pv
- ,SUM(CAST(c2_1_uv AS BIGINT)) AS c2_1_uv
- ,SUM(CAST(c2_2_exp AS BIGINT)) AS c2_2_exp
- ,SUM(CAST(c2_2_pv AS BIGINT)) AS c2_2_pv
- ,SUM(CAST(c2_2_uv AS BIGINT)) AS c2_2_uv
- ,SUM(CAST(c2_3_exp AS BIGINT)) AS c2_3_exp
- ,SUM(CAST(c2_3_pv AS BIGINT)) AS c2_3_pv
- ,SUM(CAST(c2_3_uv AS BIGINT)) AS c2_3_uv
- ,SUM(CAST(c3_1_exp AS BIGINT)) AS c3_1_exp
- ,SUM(CAST(c3_1_pv AS BIGINT)) AS c3_1_pv
- ,SUM(CAST(c3_1_uv AS BIGINT)) AS c3_1_uv
- ,SUM(CAST(c3_2_exp AS BIGINT)) AS c3_2_exp
- ,SUM(CAST(c3_2_pv AS BIGINT)) AS c3_2_pv
- ,SUM(CAST(c3_2_uv AS BIGINT)) AS c3_2_uv
- ,SUM(CAST(c3_3_exp AS BIGINT)) AS c3_3_exp
- ,SUM(CAST(c3_3_pv AS BIGINT)) AS c3_3_pv
- ,SUM(CAST(c3_3_uv AS BIGINT)) AS c3_3_uv
- -- C链depth拆分 hop1 rov/ror
- ,ROUND(COALESCE(SUM(CAST(c1_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(bn_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c1_1_rov
- ,ROUND(COALESCE(SUM(CAST(c1_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(bn_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c1_1_ror
- ,ROUND(COALESCE(SUM(CAST(c2_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c1_1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c2_1_rov
- ,ROUND(COALESCE(SUM(CAST(c2_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c1_1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c2_1_ror
- ,ROUND(COALESCE(SUM(CAST(c3_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c2_1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c3_1_rov
- ,ROUND(COALESCE(SUM(CAST(c3_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c2_1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c3_1_ror
- -- C链depth拆分 hop2 rov/ror
- ,ROUND(COALESCE(SUM(CAST(c1_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(cn_1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c1_2_rov
- ,ROUND(COALESCE(SUM(CAST(c1_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(cn_1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c1_2_ror
- ,ROUND(COALESCE(SUM(CAST(c2_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c1_2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c2_2_rov
- ,ROUND(COALESCE(SUM(CAST(c2_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c1_2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c2_2_ror
- ,ROUND(COALESCE(SUM(CAST(c3_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c2_2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c3_2_rov
- ,ROUND(COALESCE(SUM(CAST(c3_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c2_2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c3_2_ror
- -- C链depth拆分 hop3 rov/ror
- ,ROUND(COALESCE(SUM(CAST(c1_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(cn_2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c1_3_rov
- ,ROUND(COALESCE(SUM(CAST(c1_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(cn_2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c1_3_ror
- ,ROUND(COALESCE(SUM(CAST(c2_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c1_3_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c2_3_rov
- ,ROUND(COALESCE(SUM(CAST(c2_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c1_3_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c2_3_ror
- ,ROUND(COALESCE(SUM(CAST(c3_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c2_3_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c3_3_rov
- ,ROUND(COALESCE(SUM(CAST(c3_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(c2_3_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS c3_3_ror
- -- ==================== D链 (全量depth, 按hop) ====================
- ,SUM(CAST(d0 AS BIGINT)) AS d0
- ,SUM(CAST(dn_1_exp AS BIGINT)) AS dn_1_exp
- ,SUM(CAST(dn_1_pv AS BIGINT)) AS dn_1_pv
- ,SUM(CAST(dn_1_uv AS BIGINT)) AS dn_1_uv
- ,SUM(CAST(dn_2_exp AS BIGINT)) AS dn_2_exp
- ,SUM(CAST(dn_2_pv AS BIGINT)) AS dn_2_pv
- ,SUM(CAST(dn_2_uv AS BIGINT)) AS dn_2_uv
- ,SUM(CAST(dn_3_exp AS BIGINT)) AS dn_3_exp
- ,SUM(CAST(dn_3_pv AS BIGINT)) AS dn_3_pv
- ,SUM(CAST(dn_3_uv AS BIGINT)) AS dn_3_uv
- ,SUM(CAST(dn_1_uv AS BIGINT)) + SUM(CAST(dn_2_uv AS BIGINT)) + SUM(CAST(dn_3_uv AS BIGINT)) AS dn_total_uv
- ,ROUND(COALESCE(SUM(CAST(dn_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d0 AS BIGINT)) AS DOUBLE), 0), 0), 6) AS dn_1_rov
- ,ROUND(COALESCE(SUM(CAST(dn_1_uv AS BIGINT)) / NULLIF(CAST(COUNT(DISTINCT mid) AS DOUBLE), 0), 0), 6) AS dn_1_ror
- ,ROUND(COALESCE(SUM(CAST(dn_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(dn_1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS dn_2_rov
- ,ROUND(COALESCE(SUM(CAST(dn_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(dn_1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS dn_2_ror
- ,ROUND(COALESCE(SUM(CAST(dn_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(dn_2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS dn_3_rov
- ,ROUND(COALESCE(SUM(CAST(dn_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(dn_2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS dn_3_ror
- ,ROUND(COALESCE(
- (SUM(CAST(dn_1_uv AS BIGINT)) + SUM(CAST(dn_2_uv AS BIGINT)) + SUM(CAST(dn_3_uv AS BIGINT)))
- / NULLIF(CAST(SUM(CAST(d0 AS BIGINT)) AS DOUBLE), 0)
- , 0), 6) AS dn_total_rov
- ,ROUND(COALESCE(
- (SUM(CAST(dn_1_uv AS BIGINT)) + SUM(CAST(dn_2_uv AS BIGINT)) + SUM(CAST(dn_3_uv AS BIGINT)))
- / NULLIF(CAST(COUNT(DISTINCT mid) AS DOUBLE), 0)
- , 0), 6) AS dn_total_ror
- -- ==================== D链 (按depth拆分) ====================
- ,SUM(CAST(d1_1_exp AS BIGINT)) AS d1_1_exp
- ,SUM(CAST(d1_1_pv AS BIGINT)) AS d1_1_pv
- ,SUM(CAST(d1_1_uv AS BIGINT)) AS d1_1_uv
- ,SUM(CAST(d1_2_exp AS BIGINT)) AS d1_2_exp
- ,SUM(CAST(d1_2_pv AS BIGINT)) AS d1_2_pv
- ,SUM(CAST(d1_2_uv AS BIGINT)) AS d1_2_uv
- ,SUM(CAST(d1_3_exp AS BIGINT)) AS d1_3_exp
- ,SUM(CAST(d1_3_pv AS BIGINT)) AS d1_3_pv
- ,SUM(CAST(d1_3_uv AS BIGINT)) AS d1_3_uv
- ,SUM(CAST(d2_1_exp AS BIGINT)) AS d2_1_exp
- ,SUM(CAST(d2_1_pv AS BIGINT)) AS d2_1_pv
- ,SUM(CAST(d2_1_uv AS BIGINT)) AS d2_1_uv
- ,SUM(CAST(d2_2_exp AS BIGINT)) AS d2_2_exp
- ,SUM(CAST(d2_2_pv AS BIGINT)) AS d2_2_pv
- ,SUM(CAST(d2_2_uv AS BIGINT)) AS d2_2_uv
- ,SUM(CAST(d2_3_exp AS BIGINT)) AS d2_3_exp
- ,SUM(CAST(d2_3_pv AS BIGINT)) AS d2_3_pv
- ,SUM(CAST(d2_3_uv AS BIGINT)) AS d2_3_uv
- ,SUM(CAST(d3_1_exp AS BIGINT)) AS d3_1_exp
- ,SUM(CAST(d3_1_pv AS BIGINT)) AS d3_1_pv
- ,SUM(CAST(d3_1_uv AS BIGINT)) AS d3_1_uv
- ,SUM(CAST(d3_2_exp AS BIGINT)) AS d3_2_exp
- ,SUM(CAST(d3_2_pv AS BIGINT)) AS d3_2_pv
- ,SUM(CAST(d3_2_uv AS BIGINT)) AS d3_2_uv
- ,SUM(CAST(d3_3_exp AS BIGINT)) AS d3_3_exp
- ,SUM(CAST(d3_3_pv AS BIGINT)) AS d3_3_pv
- ,SUM(CAST(d3_3_uv AS BIGINT)) AS d3_3_uv
- -- D链depth拆分 hop1 rov/ror
- ,ROUND(COALESCE(SUM(CAST(d1_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d0 AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d1_1_rov
- ,ROUND(COALESCE(SUM(CAST(d1_1_uv AS BIGINT)) / NULLIF(CAST(COUNT(DISTINCT mid) AS DOUBLE), 0), 0), 6) AS d1_1_ror
- ,ROUND(COALESCE(SUM(CAST(d2_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d1_1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d2_1_rov
- ,ROUND(COALESCE(SUM(CAST(d2_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d1_1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d2_1_ror
- ,ROUND(COALESCE(SUM(CAST(d3_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d2_1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d3_1_rov
- ,ROUND(COALESCE(SUM(CAST(d3_1_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d2_1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d3_1_ror
- -- D链depth拆分 hop2 rov/ror
- ,ROUND(COALESCE(SUM(CAST(d1_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(dn_1_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d1_2_rov
- ,ROUND(COALESCE(SUM(CAST(d1_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(dn_1_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d1_2_ror
- ,ROUND(COALESCE(SUM(CAST(d2_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d1_2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d2_2_rov
- ,ROUND(COALESCE(SUM(CAST(d2_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d1_2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d2_2_ror
- ,ROUND(COALESCE(SUM(CAST(d3_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d2_2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d3_2_rov
- ,ROUND(COALESCE(SUM(CAST(d3_2_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d2_2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d3_2_ror
- -- D链depth拆分 hop3 rov/ror
- ,ROUND(COALESCE(SUM(CAST(d1_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(dn_2_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d1_3_rov
- ,ROUND(COALESCE(SUM(CAST(d1_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(dn_2_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d1_3_ror
- ,ROUND(COALESCE(SUM(CAST(d2_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d1_3_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d2_3_rov
- ,ROUND(COALESCE(SUM(CAST(d2_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d1_3_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d2_3_ror
- ,ROUND(COALESCE(SUM(CAST(d3_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d2_3_exp AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d3_3_rov
- ,ROUND(COALESCE(SUM(CAST(d3_3_uv AS BIGINT)) / NULLIF(CAST(SUM(CAST(d2_3_uv AS BIGINT)) AS DOUBLE), 0), 0), 6) AS d3_3_ror
- -- ==================== 全链路 ====================
- ,SUM(CAST(return_n_uv_noself AS BIGINT))
- + SUM(CAST(cn_1_uv AS BIGINT)) + SUM(CAST(cn_2_uv AS BIGINT)) + SUM(CAST(cn_3_uv AS BIGINT))
- + SUM(CAST(dn_1_uv AS BIGINT)) + SUM(CAST(dn_2_uv AS BIGINT)) + SUM(CAST(dn_3_uv AS BIGINT))
- AS all_return_n_uv
- ,ROUND(COALESCE(
- ( SUM(CAST(return_n_uv_noself AS BIGINT))
- + SUM(CAST(cn_1_uv AS BIGINT)) + SUM(CAST(cn_2_uv AS BIGINT)) + SUM(CAST(cn_3_uv AS BIGINT))
- + SUM(CAST(dn_1_uv AS BIGINT)) + SUM(CAST(dn_2_uv AS BIGINT)) + SUM(CAST(dn_3_uv AS BIGINT))
- ) / NULLIF(COUNT(1), 0)
- , 0), 6) AS all_rovn
- ,ROUND(COALESCE(
- ( SUM(CAST(return_n_uv_noself AS BIGINT))
- + SUM(CAST(cn_1_uv AS BIGINT)) + SUM(CAST(cn_2_uv AS BIGINT)) + SUM(CAST(cn_3_uv AS BIGINT))
- + SUM(CAST(dn_1_uv AS BIGINT)) + SUM(CAST(dn_2_uv AS BIGINT)) + SUM(CAST(dn_3_uv AS BIGINT))
- ) / NULLIF(CAST(COUNT(1) AS DOUBLE), 0)
- , 0), 6) AS all_rov
- ,ROUND(COALESCE(
- ( SUM(CAST(return_n_uv_noself AS BIGINT))
- + SUM(CAST(cn_1_uv AS BIGINT)) + SUM(CAST(cn_2_uv AS BIGINT)) + SUM(CAST(cn_3_uv AS BIGINT))
- + SUM(CAST(dn_1_uv AS BIGINT)) + SUM(CAST(dn_2_uv AS BIGINT)) + SUM(CAST(dn_3_uv AS BIGINT))
- ) / NULLIF(CAST(COUNT(DISTINCT mid) AS DOUBLE), 0)
- , 0), 6) AS all_ror
- -- =====================================================================
- -- FROM + GROUP BY CUBE
- -- =====================================================================
- FROM t_wide
- GROUP BY CUBE(
- user_type
- ,hh_bucket
- ,head_merge_leve2
- ,vid_merge_leve2
- ,vid_id
- )
- ORDER BY exposure_cnt DESC
- ;
|