luojunhui пре 10 месеци
родитељ
комит
ecac6d5261
2 измењених фајлова са 3 додато и 3 уклоњено
  1. 2 2
      applications/functions.py
  2. 1 1
      coldStartTasks/crawler/weixin_video_crawler.py

+ 2 - 2
applications/functions.py

@@ -172,7 +172,7 @@ class Functions(object):
         response = requests.get(
             url=article_url,
             headers={'User-Agent': FakeUserAgent().random},
-            proxies=cls.proxy()
+            # proxies=cls.proxy()
         )
         html_text = response.text
         w = re.search(
@@ -195,7 +195,7 @@ class Functions(object):
         response = requests.get(
             url=article_url,
             headers={'User-Agent': FakeUserAgent().random},
-            proxies=cls.proxy()
+            # proxies=cls.proxy()
         )
         html_text = response.text
         # 正则表达式用于提取 hit_nickname 和 hit_username

+ 1 - 1
coldStartTasks/crawler/weixin_video_crawler.py

@@ -124,7 +124,7 @@ class WeixinVideoCrawler(object):
             publish_type = info.get("AppMsg", {}).get("BaseInfo", {}).get("Type", None)
             detail_article_list = info.get("AppMsg", {}).get("DetailInfo", [])
             if detail_article_list:
-                for article in tqdm(detail_article_list, desc="crawler_in_msg_list"):
+                for article in tqdm(detail_article_list, desc="{}: crawler_in_msg_list".format(account_name)):
                     article_url = article.get("ContentUrl", None)
                     url_unique = functions.generateGzhId(article_url)
                     # 判断该视频链接是否下载,若已经下载则直接跳过