瀏覽代碼

zhufuquanzi 获取视频url

zhangyong 1 年之前
父節點
當前提交
b5b8cf104d
共有 1 個文件被更改,包括 1 次插入和 8 次删除
  1. 1 8
      application/spider/crawler_offline/zhufuquanzi.py

+ 1 - 8
application/spider/crawler_offline/zhufuquanzi.py

@@ -226,14 +226,7 @@ class ZhuFuQuanZiRecommend(object):
             video_url_elements = self.search_elements(
             video_url_elements = self.search_elements(
                 '//*[@class="index--video-item index--video"]'
                 '//*[@class="index--video-item index--video"]'
             )
             )
-            url = video_url_elements[0].get_attribute("src")
-            # 校验url是否正确
-            url_pattern = re.compile(r'^(https?://)?([\da-z.-]+)\.([a-z.]{2,6})([/\w .-]*)*/?$')
-            parsed = urlparse(url)
-            if bool(parsed.scheme) and bool(parsed.netloc) and url_pattern.match(url):
-                return url
-            else:
-                return ""
+            return video_url_elements[0].get_attribute("src")
 
 
     def get_video_info_2(self, video_element):
     def get_video_info_2(self, video_element):
         Local.logger(self.log_type, self.crawler).info(f"本轮已抓取{self.download_cnt}条视频\n")
         Local.logger(self.log_type, self.crawler).info(f"本轮已抓取{self.download_cnt}条视频\n")