lierqiang 2 år sedan
förälder
incheckning
2817169d51
1 ändrad fil med 4 tillägg och 4 borttagningar
  1. 4 4
      douyin/douyin_follow/follow_dy.py

+ 4 - 4
douyin/douyin_follow/follow_dy.py

@@ -107,10 +107,10 @@ class DyFollow(object):
         else:
             title3 = title_split3[-1]
 
-        video_title = title3.strip().replace("\n", "") \
+        video_title = title3.strip().split('#')[0].replace("\n", "") \
                           .replace("/", "").replace("抖音", "").replace(" ", "") \
                           .replace(" ", "").replace("&NBSP", "").replace("\r", "") \
-                          .replace("#", "").replace(".", "。").replace("\\", "") \
+                          .replace(".", "。").replace("\\", "") \
                           .replace(":", "").replace("*", "").replace("?", "") \
                           .replace("?", "").replace('"', "").replace("<", "") \
                           .replace(">", "").replace("|", "").replace("@", "").replace('"', '').replace("'", '')[:40]
@@ -171,8 +171,8 @@ class DyFollow(object):
             Common.logger(log_type, crawler).warning(f"抖音作者没有获取到更多数据")
             return
         for info in aweme_list:
-            # if info.get('is_ads'):
-            #     continue
+            if info.get('is_ads'):
+                continue
             publish_time = info['create_time']
             publish_time_str = time.strftime("%Y-%m-%d %H:%M:%S", time.localtime(publish_time))
             publish_day = int((int(time.time()) - publish_time) / (3600 * 24))