1 年間前 · cd7b5450c0
--- a/applications/search/dy_search.py
+++ b/applications/search/dy_search.py
@@ -17,53 +17,59 @@ def douyin_search(keyword, sensitive_words, trace_id):
 
															     :param keyword: the keyword to search for
														
 
															     :return:
														
 
															     """
														
 
															-    url = "http://8.217.190.241:8888/crawler/dou_yin/top_hub_content"
														
 
															-    payload = json.dumps({
														
 
															-        "keyword": keyword,
														
 
															-        "category": "全部",
														
 
															-        "period": "近90天",
														
 
															-        "content_modal": "视频",
														
 
															-        "cursor": ""
														
 
															-    })
														
 
															-    headers = {
														
 
															-        'Content-Type': 'application/json'
														
 
															-    }
														
 
															-
														
 
															-    response = requests.request("POST", url, headers=headers, data=payload)
														
 
															-    try:
														
 
															-        dt_list = response.json()['data']['data']
														
 
															-        L = []
														
 
															-        for obj in dt_list:
														
 
															-            try:
														
 
															-                title = obj['video_desc']
														
 
															-                video_id = obj['video_id']
														
 
															-                duration = int(obj['duration'])
														
 
															-                if sensitive_flag(sensitive_words, title) and duration < 30000:
														
 
															-                    res = douyin_detail(video_id)
														
 
															-                    if res:
														
 
															-                        L.append(res)
														
 
															-                else:
														
 
															-                    continue
														
 
															-            except Exception as e:
														
 
															-                continue
														
 
															-        logging(
														
 
															-            code="8001",
														
 
															-            info="抖音搜索",
														
 
															-            data={
														
 
															-                "keys": keyword,
														
 
															-                "search_count": len(dt_list),
														
 
															-                "useful_count": len(L)
														
 
															-            },
														
 
															-            trace_id=trace_id
														
 
															-        )
														
 
															-        return L
														
 
															-    except Exception as e:
														
 
															-        logging(
														
 
															+    # url = "http://8.217.190.241:8888/crawler/dou_yin/top_hub_content"
														
 
															+    # payload = json.dumps({
														
 
															+    #     "keyword": keyword,
														
 
															+    #     "category": "全部",
														
 
															+    #     "period": "近90天",
														
 
															+    #     "content_modal": "视频",
														
 
															+    #     "cursor": ""
														
 
															+    # })
														
 
															+    # headers = {
														
 
															+    #     'Content-Type': 'application/json'
														
 
															+    # }
														
 
															+    #
														
 
															+    # response = requests.request("POST", url, headers=headers, data=payload)
														
 
															+    # try:
														
 
															+    #     dt_list = response.json()['data']['data']
														
 
															+    #     L = []
														
 
															+    #     for obj in dt_list:
														
 
															+    #         try:
														
 
															+    #             title = obj['video_desc']
														
 
															+    #             video_id = obj['video_id']
														
 
															+    #             duration = int(obj['duration'])
														
 
															+    #             if sensitive_flag(sensitive_words, title) and duration < 30000:
														
 
															+    #                 res = douyin_detail(video_id)
														
 
															+    #                 if res:
														
 
															+    #                     L.append(res)
														
 
															+    #             else:
														
 
															+    #                 continue
														
 
															+    #         except Exception as e:
														
 
															+    #             continue
														
 
															+    #     logging(
														
 
															+    #         code="8001",
														
 
															+    #         info="抖音搜索",
														
 
															+    #         data={
														
 
															+    #             "keys": keyword,
														
 
															+    #             "search_count": len(dt_list),
														
 
															+    #             "useful_count": len(L)
														
 
															+    #         },
														
 
															+    #         trace_id=trace_id
														
 
															+    #     )
														
 
															+    #     return L
														
 
															+    # except Exception as e:
														
 
															+    #     logging(
														
 
															+    #         code="4003",
														
 
															+    #         info="抖音搜索失败-搜索词：{} 原因：-{}".format(keyword, e),
														
 
															+    #         trace_id=trace_id
														
 
															+    #     )
														
 
															+    #     return []
														
 
															+    logging(
														
 
															             code="4003",
														
 
															-            info="抖音搜索失败-搜索词：{} 原因：-{}".format(keyword, e),
														
 
															+            info="抖音搜索失败-搜索词：{} 原因：-{}".format(keyword, "抖查查暂停服务"),
														
 
															             trace_id=trace_id
														
 
															         )
														
 
															-        return []
														
 
															+    return []
														
 
															 def douyin_detail(video_id):