loghubods.vid_festive_labels.sql 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237
  1. -- Task: 节日标签视频库 ID: 1019838087 Type: ODPS_SQL
  2. --odps sql
  3. --********************************************************************--
  4. --author:于卓异
  5. --create time:2024-08-29 17:16:57
  6. --********************************************************************--
  7. CREATE TABLE IF NOT EXISTS vid_festive_labels(
  8. videoid BIGINT COMMENT '视频ID',
  9. first_labels STRING COMMENT '一级标签',
  10. secondary_labels STRING COMMENT '二级标签'
  11. )
  12. STORED AS ALIORC ;
  13. INSERT INTO TABLE vid_festive_labels
  14. SELECT videoid
  15. ,CASE WHEN secondary_labels IN ('元旦','腊八节','小年','除夕','春节','情人节','元宵节','龙抬头','妇女节','劳动节','母亲节','儿童节','端午节','父亲节','建党节','七七事变','建军节','七夕节','中元节','中秋节','毛主席逝世','国庆节','重阳节','感恩节','公祭日','平安夜','圣诞节','毛主席诞辰','初一','初二','初三','初四','初五','初六','初七','初八','初九','初十') THEN '节假日'
  16. WHEN secondary_labels IN ('小寒','大寒','立春','雨水','惊蛰','春分','清明','谷雨','立夏','小满','芒种','夏至','小暑','大暑','立秋','处暑','白露','秋分','寒露','霜降','立冬','小雪','大雪','冬至') THEN '节气'
  17. WHEN secondary_labels IN ('早上好','中午好','下午好','晚上好','晚安') THEN '问候语'
  18. WHEN secondary_labels IN ('祝福') THEN '祝福语'
  19. WHEN secondary_labels IN ('孙中山诞辰','孙中山逝世','周恩来诞辰','周恩来逝世','邓小平诞辰','邓小平逝世','李克强诞辰','李克强逝世','袁隆平诞辰','袁隆平逝世','彭德怀诞辰','彭德怀逝世','朱德诞辰','朱德逝世','吴尊友逝世') THEN '人物'
  20. WHEN secondary_labels IN ('两会','315国际消费者权益日','四龙日') THEN '热点'
  21. END AS first_labels
  22. ,secondary_labels
  23. FROM (
  24. SELECT id AS videoid
  25. ,title
  26. ,CASE WHEN title REGEXP '元旦' THEN '元旦'
  27. WHEN title REGEXP '腊八' THEN '腊八节'
  28. WHEN title REGEXP '小年' THEN '小年'
  29. WHEN title REGEXP '除夕' THEN '除夕'
  30. WHEN title REGEXP '春节|新春佳节|新年|过年|大年' THEN '春节'
  31. WHEN title REGEXP '初一|迎春日|开门红|新春' THEN '初一'
  32. WHEN title REGEXP '初二|犯娘日|迎婿日|回娘家|祭财神' THEN '初二'
  33. WHEN title REGEXP '初三|赤狗日|福神' THEN '初三'
  34. WHEN title REGEXP '初四|迎接神灵日|灶神|喜神|五路|扔穷' THEN '初四'
  35. WHEN title REGEXP '初五|破五|迎财神|送穷神|财神日|五穷' THEN '初五'
  36. WHEN title REGEXP '初六' THEN '初六'
  37. WHEN title REGEXP '初七' THEN '初七'
  38. WHEN title REGEXP '初八' THEN '初八'
  39. WHEN title REGEXP '初九' THEN '初九'
  40. WHEN title REGEXP '初十' THEN '初十'
  41. WHEN title REGEXP '情人节' THEN '情人节'
  42. WHEN title REGEXP '元宵|正月十五' THEN '元宵节'
  43. WHEN title REGEXP '龙抬头|二月二|2月2|剃头日|春耕节|农事节|青龙节|春龙节|龙头节' THEN '龙抬头'
  44. WHEN title REGEXP '妇女节|三八|38节|38节快乐|38节祝福|女神节|女王节' THEN '妇女节'
  45. WHEN title REGEXP '5.1|5·1|五一|劳动节|国际示威游行日|51' THEN '劳动节'
  46. WHEN title REGEXP '母亲节' THEN '母亲节'
  47. WHEN title REGEXP '儿童节|六一' THEN '儿童节'
  48. WHEN title REGEXP '端午' THEN '端午节'
  49. WHEN title REGEXP '父亲节' THEN '父亲节'
  50. WHEN title REGEXP '七一|建党' THEN '建党节'
  51. WHEN title REGEXP '七七事变' THEN '七七事变'
  52. WHEN title REGEXP '建军节|八一' THEN '建军节'
  53. WHEN title REGEXP '七夕' THEN '七夕节'
  54. WHEN title REGEXP '鬼节|中元节' THEN '中元节'
  55. WHEN title REGEXP '中秋|元旦将至' THEN '中秋节'
  56. WHEN title REGEXP '毛主席逝世' THEN '毛主席逝世'
  57. WHEN title REGEXP '国庆' THEN '国庆节'
  58. WHEN title REGEXP '重阳' THEN '重阳节'
  59. WHEN title REGEXP '感恩节' THEN '感恩节'
  60. WHEN title REGEXP '公祭日|南京大屠杀' THEN '公祭日'
  61. WHEN title REGEXP '平安夜' THEN '平安夜'
  62. WHEN title REGEXP '圣诞' THEN '圣诞节'
  63. WHEN title REGEXP '毛主席诞辰' THEN '毛主席诞辰'
  64. WHEN title REGEXP '小寒' THEN '小寒'
  65. WHEN title REGEXP '大寒' THEN '大寒'
  66. WHEN title REGEXP '立春' THEN '立春'
  67. WHEN title REGEXP '雨水' THEN '雨水'
  68. WHEN title REGEXP '惊蛰' THEN '惊蛰'
  69. WHEN title REGEXP '春分' THEN '春分'
  70. WHEN title REGEXP '清明|踏青节|踏青节|行清节|三月节|祭祖' THEN '清明'
  71. WHEN title REGEXP '谷雨' THEN '谷雨'
  72. WHEN title REGEXP '立夏' THEN '立夏'
  73. WHEN title REGEXP '小满' THEN '小满'
  74. WHEN title REGEXP '芒种' THEN '芒种'
  75. WHEN title REGEXP '夏至' THEN '夏至'
  76. WHEN title REGEXP '小暑' THEN '小暑'
  77. WHEN title REGEXP '大暑' THEN '大暑'
  78. WHEN title REGEXP '立秋' THEN '立秋'
  79. WHEN title REGEXP '处暑' THEN '处暑'
  80. WHEN title REGEXP '白露' THEN '白露'
  81. WHEN title REGEXP '秋分' THEN '秋分'
  82. WHEN title REGEXP '寒露' THEN '寒露'
  83. WHEN title REGEXP '霜降' THEN '霜降'
  84. WHEN title REGEXP '立冬' THEN '立冬'
  85. WHEN title REGEXP '小雪' THEN '小雪'
  86. WHEN title REGEXP '大雪' THEN '大雪'
  87. WHEN title REGEXP '冬至' THEN '冬至'
  88. WHEN title REGEXP '早晨|早上|清晨' THEN '早上好'
  89. WHEN title REGEXP '中午好|中午' THEN '中午好'
  90. WHEN title REGEXP '下午好|下午' THEN '下午好'
  91. WHEN title REGEXP '晚上好|晚上' THEN '晚上好'
  92. WHEN title REGEXP '晚安' THEN '晚安'
  93. WHEN title REGEXP '祝福|祝愿|祝你|祝贺|祝大家|祝您|祝好运|祝群主|祝朋友' THEN '祝福'
  94. WHEN title REGEXP '孙中山诞辰' THEN '孙中山诞辰'
  95. WHEN title REGEXP '孙中山逝世' THEN '孙中山逝世'
  96. WHEN title REGEXP '周恩来诞辰' THEN '周恩来诞辰'
  97. WHEN title REGEXP '周恩来逝世' THEN '周恩来逝世'
  98. WHEN title REGEXP '邓小平诞辰' THEN '邓小平诞辰'
  99. WHEN title REGEXP '邓小平逝世' THEN '邓小平逝世'
  100. WHEN title REGEXP '李克强诞辰' THEN '李克强诞辰'
  101. WHEN title REGEXP '李克强逝世' THEN '李克强逝世'
  102. WHEN title REGEXP '袁隆平诞辰' THEN '袁隆平诞辰'
  103. WHEN title REGEXP '袁隆平逝世' THEN '袁隆平逝世'
  104. WHEN title REGEXP '彭德怀诞辰' THEN '彭德怀诞辰'
  105. WHEN title REGEXP '彭德怀逝世' THEN '彭德怀逝世'
  106. WHEN title REGEXP '朱德诞辰' THEN '朱德诞辰'
  107. WHEN title REGEXP '朱德逝世' THEN '朱德逝世'
  108. WHEN title REGEXP '吴尊友逝世' THEN '吴尊友逝世'
  109. WHEN title REGEXP '两会|人大代表|人民代表大会|政协' THEN '两会'
  110. WHEN title REGEXP '315|消费者|三一五|3·15|打假日' THEN '315国际消费者权益日'
  111. WHEN title REGEXP '四龙日|龙年龙月龙日龙时' THEN '四龙日'
  112. END AS secondary_labels
  113. ,gmt_create
  114. ,recommend_status
  115. FROM videoods.wx_video_per1h
  116. WHERE title NOT REGEXP '2018|2019|2020|2021|2022|2023|鼠年|牛年|虎年|兔年|小年糕|小年轻' --AND TO_CHAR(gmt_create,'YYYYMMDDHH') = '${datetime}${hhl}'
  117. AND TO_CHAR(gmt_create,'YYYYMMDDHH') = '${datetime}${hhl}'
  118. --AND TO_CHAR(gmt_create,'YYYYMMDDHH') <= '${datetime}${hhl}'
  119. AND recommend_status IN (-6,-7)
  120. )
  121. where '${hhl}'<>23
  122. ;
  123. INSERT INTO TABLE vid_festive_labels
  124. SELECT videoid
  125. ,CASE WHEN secondary_labels IN ('元旦','腊八节','小年','除夕','春节','情人节','元宵节','龙抬头','妇女节','劳动节','母亲节','儿童节','端午节','父亲节','建党节','七七事变','建军节','七夕节','中元节','中秋节','毛主席逝世','国庆节','重阳节','感恩节','公祭日','平安夜','圣诞节','毛主席诞辰','初一','初二','初三','初四','初五','初六','初七','初八','初九','初十') THEN '节假日'
  126. WHEN secondary_labels IN ('小寒','大寒','立春','雨水','惊蛰','春分','清明','谷雨','立夏','小满','芒种','夏至','小暑','大暑','立秋','处暑','白露','秋分','寒露','霜降','立冬','小雪','大雪','冬至') THEN '节气'
  127. WHEN secondary_labels IN ('早上好','中午好','下午好','晚上好','晚安') THEN '问候语'
  128. WHEN secondary_labels IN ('祝福') THEN '祝福语'
  129. WHEN secondary_labels IN ('孙中山诞辰','孙中山逝世','周恩来诞辰','周恩来逝世','邓小平诞辰','邓小平逝世','李克强诞辰','李克强逝世','袁隆平诞辰','袁隆平逝世','彭德怀诞辰','彭德怀逝世','朱德诞辰','朱德逝世','吴尊友逝世') THEN '人物'
  130. WHEN secondary_labels IN ('两会','315国际消费者权益日','四龙日') THEN '热点'
  131. END AS first_labels
  132. ,secondary_labels
  133. FROM (
  134. SELECT id AS videoid
  135. ,title
  136. ,CASE WHEN title REGEXP '元旦' THEN '元旦'
  137. WHEN title REGEXP '腊八' THEN '腊八节'
  138. WHEN title REGEXP '小年' THEN '小年'
  139. WHEN title REGEXP '除夕' THEN '除夕'
  140. WHEN title REGEXP '春节|新春佳节|新年|过年|大年' THEN '春节'
  141. WHEN title REGEXP '初一|迎春日|开门红|新春' THEN '初一'
  142. WHEN title REGEXP '初二|犯娘日|迎婿日|回娘家|祭财神' THEN '初二'
  143. WHEN title REGEXP '初三|赤狗日|福神' THEN '初三'
  144. WHEN title REGEXP '初四|迎接神灵日|灶神|喜神|五路|扔穷' THEN '初四'
  145. WHEN title REGEXP '初五|破五|迎财神|送穷神|财神日|五穷' THEN '初五'
  146. WHEN title REGEXP '初六' THEN '初六'
  147. WHEN title REGEXP '初七' THEN '初七'
  148. WHEN title REGEXP '初八' THEN '初八'
  149. WHEN title REGEXP '初九' THEN '初九'
  150. WHEN title REGEXP '初十' THEN '初十'
  151. WHEN title REGEXP '情人节' THEN '情人节'
  152. WHEN title REGEXP '元宵|正月十五' THEN '元宵节'
  153. WHEN title REGEXP '龙抬头|二月二|2月2|剃头日|春耕节|农事节|青龙节|春龙节|龙头节' THEN '龙抬头'
  154. WHEN title REGEXP '妇女节|三八|38节|38节快乐|38节祝福|女神节|女王节' THEN '妇女节'
  155. WHEN title REGEXP '5.1|5·1|五一|劳动节|国际示威游行日|51' THEN '劳动节'
  156. WHEN title REGEXP '母亲节' THEN '母亲节'
  157. WHEN title REGEXP '儿童节|六一' THEN '儿童节'
  158. WHEN title REGEXP '端午' THEN '端午节'
  159. WHEN title REGEXP '父亲节' THEN '父亲节'
  160. WHEN title REGEXP '七一|建党' THEN '建党节'
  161. WHEN title REGEXP '七七事变' THEN '七七事变'
  162. WHEN title REGEXP '建军节|八一' THEN '建军节'
  163. WHEN title REGEXP '七夕' THEN '七夕节'
  164. WHEN title REGEXP '鬼节|中元节' THEN '中元节'
  165. WHEN title REGEXP '中秋|元旦将至' THEN '中秋节'
  166. WHEN title REGEXP '毛主席逝世' THEN '毛主席逝世'
  167. WHEN title REGEXP '国庆' THEN '国庆节'
  168. WHEN title REGEXP '重阳' THEN '重阳节'
  169. WHEN title REGEXP '感恩节' THEN '感恩节'
  170. WHEN title REGEXP '公祭日|南京大屠杀' THEN '公祭日'
  171. WHEN title REGEXP '平安夜' THEN '平安夜'
  172. WHEN title REGEXP '圣诞' THEN '圣诞节'
  173. WHEN title REGEXP '毛主席诞辰' THEN '毛主席诞辰'
  174. WHEN title REGEXP '小寒' THEN '小寒'
  175. WHEN title REGEXP '大寒' THEN '大寒'
  176. WHEN title REGEXP '立春' THEN '立春'
  177. WHEN title REGEXP '雨水' THEN '雨水'
  178. WHEN title REGEXP '惊蛰' THEN '惊蛰'
  179. WHEN title REGEXP '春分' THEN '春分'
  180. WHEN title REGEXP '清明|踏青节|踏青节|行清节|三月节|祭祖' THEN '清明'
  181. WHEN title REGEXP '谷雨' THEN '谷雨'
  182. WHEN title REGEXP '立夏' THEN '立夏'
  183. WHEN title REGEXP '小满' THEN '小满'
  184. WHEN title REGEXP '芒种' THEN '芒种'
  185. WHEN title REGEXP '夏至' THEN '夏至'
  186. WHEN title REGEXP '小暑' THEN '小暑'
  187. WHEN title REGEXP '大暑' THEN '大暑'
  188. WHEN title REGEXP '立秋' THEN '立秋'
  189. WHEN title REGEXP '处暑' THEN '处暑'
  190. WHEN title REGEXP '白露' THEN '白露'
  191. WHEN title REGEXP '秋分' THEN '秋分'
  192. WHEN title REGEXP '寒露' THEN '寒露'
  193. WHEN title REGEXP '霜降' THEN '霜降'
  194. WHEN title REGEXP '立冬' THEN '立冬'
  195. WHEN title REGEXP '小雪' THEN '小雪'
  196. WHEN title REGEXP '大雪' THEN '大雪'
  197. WHEN title REGEXP '冬至' THEN '冬至'
  198. WHEN title REGEXP '早晨|早上|清晨' THEN '早上好'
  199. WHEN title REGEXP '中午好|中午' THEN '中午好'
  200. WHEN title REGEXP '下午好|下午' THEN '下午好'
  201. WHEN title REGEXP '晚上好|晚上' THEN '晚上好'
  202. WHEN title REGEXP '晚安' THEN '晚安'
  203. WHEN title REGEXP '祝福|祝愿|祝你|祝贺|祝大家|祝您|祝好运|祝群主|祝朋友' THEN '祝福'
  204. WHEN title REGEXP '孙中山诞辰' THEN '孙中山诞辰'
  205. WHEN title REGEXP '孙中山逝世' THEN '孙中山逝世'
  206. WHEN title REGEXP '周恩来诞辰' THEN '周恩来诞辰'
  207. WHEN title REGEXP '周恩来逝世' THEN '周恩来逝世'
  208. WHEN title REGEXP '邓小平诞辰' THEN '邓小平诞辰'
  209. WHEN title REGEXP '邓小平逝世' THEN '邓小平逝世'
  210. WHEN title REGEXP '李克强诞辰' THEN '李克强诞辰'
  211. WHEN title REGEXP '李克强逝世' THEN '李克强逝世'
  212. WHEN title REGEXP '袁隆平诞辰' THEN '袁隆平诞辰'
  213. WHEN title REGEXP '袁隆平逝世' THEN '袁隆平逝世'
  214. WHEN title REGEXP '彭德怀诞辰' THEN '彭德怀诞辰'
  215. WHEN title REGEXP '彭德怀逝世' THEN '彭德怀逝世'
  216. WHEN title REGEXP '朱德诞辰' THEN '朱德诞辰'
  217. WHEN title REGEXP '朱德逝世' THEN '朱德逝世'
  218. WHEN title REGEXP '吴尊友逝世' THEN '吴尊友逝世'
  219. WHEN title REGEXP '两会|人大代表|人民代表大会|政协' THEN '两会'
  220. WHEN title REGEXP '315|消费者|三一五|3·15|打假日' THEN '315国际消费者权益日'
  221. WHEN title REGEXP '四龙日|龙年龙月龙日龙时' THEN '四龙日'
  222. END AS secondary_labels
  223. ,gmt_create
  224. ,recommend_status
  225. FROM videoods.wx_video_per1h
  226. WHERE title NOT REGEXP '2018|2019|2020|2021|2022|2023|鼠年|牛年|虎年|兔年|小年糕|小年轻' --AND TO_CHAR(gmt_create,'YYYYMMDDHH') = '${datetime}${hhl}'
  227. AND TO_CHAR(gmt_create,'YYYYMMDDHH') = '${datetime-1}${hhl}'
  228. AND recommend_status IN (-6,-7)
  229. )
  230. where '${hhl}'=23
  231. ;