Browse Source

优先抓未抓过的账号

luojunhui 7 months ago
parent
commit
a022a4020b
1 changed file with 1 addition and 0 deletions
  1. 1 0
      coldStartTasks/crawler/weixin_video_crawler.py

+ 1 - 0
coldStartTasks/crawler/weixin_video_crawler.py

@@ -159,6 +159,7 @@ class WeixinVideoCrawler(object):
                     url_unique = functions.generateGzhId(article_url)
                     url_unique = functions.generateGzhId(article_url)
                     # 判断该视频链接是否下载,若已经下载则直接跳过
                     # 判断该视频链接是否下载,若已经下载则直接跳过
                     if self.is_downloaded(url_unique):
                     if self.is_downloaded(url_unique):
+                        print("url exists")
                         continue
                         continue
 
 
                     title = article.get("Title", None)
                     title = article.get("Title", None)