Pārlūkot izejas kodu

插入数据库之前，先判断该 content_id 下是否已存在相同的 out_video_id

luojunhui 3 mēneši atpakaļ
vecāks
revīzija
298a42b4eb
1 mainītis faili ar 10 papildinājumiem un 0 dzēšanām
  1. 10 0
      applications/spider/__init__.py

+ 10 - 0
applications/spider/__init__.py

@@ -57,6 +57,16 @@ async def save_video_to_mysql(video_obj, user, trace_id, platform, content_id, c
         mq_obj = {}
         mq_obj = {}
     mq_obj['trace_id'] = trace_id
     mq_obj['trace_id'] = trace_id
     mq_obj['content_id'] = content_id
     mq_obj['content_id'] = content_id
+    # 先查询此content_id下是否有out_video_id了
+    select_sql = f"""
+        SELECT id
+        FROM {crawler_video_table}
+        WHERE out_video_id = '{mq_obj['video_id']}' and content_id = '{content_id}';
+    """
+    result = await db_client.async_select(select_sql)
+    if result:
+        return
+
     insert_sql = f"""
     insert_sql = f"""
     INSERT INTO {crawler_video_table}
     INSERT INTO {crawler_video_table}
     (content_id, out_video_id, platform, video_title, play_count, like_count, publish_time, crawler_time, duration, video_url, cover_url, user_id, trace_id, score, score_version)
     (content_id, out_video_id, platform, video_title, play_count, like_count, publish_time, crawler_time, duration, video_url, cover_url, user_id, trace_id, score, score_version)