|
|
@@ -1,8 +1,43 @@
|
|
|
-- =====================================================================
|
|
|
--- 曝光回流链路 CUBE 聚合表 (基于 wide 宽表, 增加用户/品类维度 + 模型预估指标)
|
|
|
+-- 曝光回流链路 CUBE 聚合表 (宽表版, 含用户/品类维度 + 模型预估 + 全链路漏斗)
|
|
|
-- 维度: user_type × hh_bucket × head_merge_leve2 × vid_merge_leve2 × vid_id (CUBE)
|
|
|
+-- 依赖: base_20260209 → (JOIN user_type + video_merge_tag + t_score) → CUBE 聚合
|
|
|
-- 参考: de.sql + dwd_recsys_alg_exposure_agg_20260209
|
|
|
-- =====================================================================
|
|
|
+--
|
|
|
+-- 指标分区:
|
|
|
+-- 基础流量 exposure_cnt / exposure_uv / vid_cnt / exposure_per_user
|
|
|
+-- 分享&回流漏斗 share_exposure_cnt → share_cnt → return_exposure_cnt → return_uv
|
|
|
+-- + 4 个 rate (share_rate / return_rate / return_rate_noself / share_return_rate)
|
|
|
+-- 模型预估 STR (曝光→非自身回流概率) / ROSN (条件回流UV) / ROVN (STR×ROSN)
|
|
|
+-- 每组: _real(label) + _pred(预估) + _copc + _mae + _var
|
|
|
+-- _real 与漏斗字段等价: str_real=return_rate_noself, rovn_real=return_uv_noself/exposure_cnt
|
|
|
+-- B/C/D 链 每级: _uv + _pv + _exp + _ror + _rov
|
|
|
+-- 全链路 all_return_n_uv = B + C + D
|
|
|
+--
|
|
|
+-- rov/ror 分母推导 (逐级递推):
|
|
|
+-- depth 维度: depth=1 的分母(成本)取该 hop 的入口; depth=N+1 的分母取 depth=N 的输出
|
|
|
+-- hop 维度: hop1 的分母(成本)取链路入口; hop N+1 的分母取 hop N 全量 depth 的输出
|
|
|
+--
|
|
|
+-- B链: bn/b1 → rov=uv/COUNT(1), ror=uv/COUNT(DISTINCT mid)
|
|
|
+-- b2 → rov=uv/b1_exp, ror=uv/b1_uv
|
|
|
+-- b3 → rov=uv/b2_exp, ror=uv/b2_uv
|
|
|
+-- C链全量: cn_1 → rov=uv/bn_exp, ror=uv/bn_uv
|
|
|
+-- cn_2 → rov=uv/cn_1_exp, ror=uv/cn_1_uv
|
|
|
+-- cn_3 → rov=uv/cn_2_exp, ror=uv/cn_2_uv
|
|
|
+-- C链depth拆分: cX_Y → rov=uv/上级exp, ror=uv/上级uv (X=depth, Y=hop)
|
|
|
+-- hop1: c1_1→bn, c2_1→c1_1, c3_1→c2_1
|
|
|
+-- hop2: c1_2→cn_1, c2_2→c1_2, c3_2→c2_2
|
|
|
+-- hop3: c1_3→cn_2, c2_3→c1_3, c3_3→c2_3
|
|
|
+-- D链全量: dn_1 → rov=uv/d0, ror=uv/COUNT(DISTINCT mid)
|
|
|
+-- dn_2 → rov=uv/dn_1_exp, ror=uv/dn_1_uv
|
|
|
+-- dn_3 → rov=uv/dn_2_exp, ror=uv/dn_2_uv
|
|
|
+-- D链depth拆分: dX_Y (同 C 链模式)
|
|
|
+-- hop1: d1_1→d0/mid, d2_1→d1_1, d3_1→d2_1
|
|
|
+-- hop2: d1_2→dn_1, d2_2→d1_2, d3_2→d2_2
|
|
|
+-- hop3: d1_3→dn_2, d2_3→d1_3, d3_3→d2_3
|
|
|
+-- 全链路: all → rov=uv/COUNT(1), ror=uv/COUNT(DISTINCT mid)
|
|
|
+-- =====================================================================
|
|
|
|
|
|
-- DROP TABLE IF EXISTS loghubods.dwd_recsys_alg_exposure_agg_wide_20260209;
|
|
|
CREATE TABLE IF NOT EXISTS loghubods.dwd_recsys_alg_exposure_agg_wide_20260209 (
|