瀏覽代碼

抖查查暂停服务

罗俊辉 9 月之前
父節點
當前提交
cd7b5450c0
共有 1 個文件被更改,包括 50 次插入和 44 次删除
  1. 50 44
      applications/search/dy_search.py

+ 50 - 44
applications/search/dy_search.py

@@ -17,53 +17,59 @@ def douyin_search(keyword, sensitive_words, trace_id):
     :param keyword: the words needs to be searched
     :param keyword: the words needs to be searched
     :return:
     :return:
     """
     """
-    url = "http://8.217.190.241:8888/crawler/dou_yin/top_hub_content"
-    payload = json.dumps({
-        "keyword": keyword,
-        "category": "全部",
-        "period": "近90天",
-        "content_modal": "视频",
-        "cursor": ""
-    })
-    headers = {
-        'Content-Type': 'application/json'
-    }
-
-    response = requests.request("POST", url, headers=headers, data=payload)
-    try:
-        dt_list = response.json()['data']['data']
-        L = []
-        for obj in dt_list:
-            try:
-                title = obj['video_desc']
-                video_id = obj['video_id']
-                duration = int(obj['duration'])
-                if sensitive_flag(sensitive_words, title) and duration < 30000:
-                    res = douyin_detail(video_id)
-                    if res:
-                        L.append(res)
-                else:
-                    continue
-            except Exception as e:
-                continue
-        logging(
-            code="8001",
-            info="抖音搜索",
-            data={
-                "keys": keyword,
-                "search_count": len(dt_list),
-                "useful_count": len(L)
-            },
-            trace_id=trace_id
-        )
-        return L
-    except Exception as e:
-        logging(
+    # url = "http://8.217.190.241:8888/crawler/dou_yin/top_hub_content"
+    # payload = json.dumps({
+    #     "keyword": keyword,
+    #     "category": "全部",
+    #     "period": "近90天",
+    #     "content_modal": "视频",
+    #     "cursor": ""
+    # })
+    # headers = {
+    #     'Content-Type': 'application/json'
+    # }
+    #
+    # response = requests.request("POST", url, headers=headers, data=payload)
+    # try:
+    #     dt_list = response.json()['data']['data']
+    #     L = []
+    #     for obj in dt_list:
+    #         try:
+    #             title = obj['video_desc']
+    #             video_id = obj['video_id']
+    #             duration = int(obj['duration'])
+    #             if sensitive_flag(sensitive_words, title) and duration < 30000:
+    #                 res = douyin_detail(video_id)
+    #                 if res:
+    #                     L.append(res)
+    #             else:
+    #                 continue
+    #         except Exception as e:
+    #             continue
+    #     logging(
+    #         code="8001",
+    #         info="抖音搜索",
+    #         data={
+    #             "keys": keyword,
+    #             "search_count": len(dt_list),
+    #             "useful_count": len(L)
+    #         },
+    #         trace_id=trace_id
+    #     )
+    #     return L
+    # except Exception as e:
+    #     logging(
+    #         code="4003",
+    #         info="抖音搜索失败-搜索词:{} 原因:-{}".format(keyword, e),
+    #         trace_id=trace_id
+    #     )
+    #     return []
+    logging(
             code="4003",
             code="4003",
-            info="抖音搜索失败-搜索词:{} 原因:-{}".format(keyword, e),
+            info="抖音搜索失败-搜索词:{} 原因:-{}".format(keyword, "抖查查暂停服务"),
             trace_id=trace_id
             trace_id=trace_id
         )
         )
-        return []
+    return []
 
 
 
 
 def douyin_detail(video_id):
 def douyin_detail(video_id):