|
@@ -4,7 +4,6 @@ import base64
|
|
|
import json
|
|
|
import random
|
|
|
import sys
|
|
|
-import datetime
|
|
|
import time
|
|
|
import uuid
|
|
|
|
|
@@ -14,6 +13,7 @@ sys.path.append(os.getcwd())
|
|
|
from common.video_item import VideoItem
|
|
|
from common import PiaoQuanPipeline, AliyunLogger
|
|
|
from common.mq import MQ
|
|
|
+from common.scheduling_db import MysqlHelper
|
|
|
|
|
|
|
|
|
class HaoKanVideoAccount(object):
|
|
@@ -61,7 +61,8 @@ class HaoKanVideoAccount(object):
|
|
|
}
|
|
|
response = requests.request("GET", url, headers=headers, params=params)
|
|
|
result = response.json()
|
|
|
- print(json.dumps(result, ensure_ascii=False, indent=4))
|
|
|
+ # print(json.dumps(result, ensure_ascii=False, indent=4))
|
|
|
+ self.process_video_list(result)
|
|
|
|
|
|
def get_tiny_video_list(self):
|
|
|
url = "https://haokan.baidu.com/web/author/listall"
|
|
@@ -83,7 +84,7 @@ class HaoKanVideoAccount(object):
|
|
|
}
|
|
|
response = requests.request("GET", url, headers=headers, params=params)
|
|
|
result = response.json()
|
|
|
- print(json.dumps(result, ensure_ascii=False, indent=4))
|
|
|
+ # print(json.dumps(result, ensure_ascii=False, indent=4))
|
|
|
self.process_video_list(result)
|
|
|
|
|
|
def process_video_list(self, result):
|
|
@@ -152,8 +153,8 @@ class HaoKanVideoAccount(object):
|
|
|
item.add_video_info("like_cnt", d_obj["like"])
|
|
|
item.add_video_info("comment_cnt", d_obj["comment"])
|
|
|
item.add_video_info("cover_url", video_obj["content"]["cover_src"])
|
|
|
- item.add_video_info("user_id", self.user_dict['link'])
|
|
|
- item.add_video_info("user_name", "123")
|
|
|
+ item.add_video_info("user_id", self.user_dict['uid'])
|
|
|
+ item.add_video_info("user_name", self.user_dict['nick_name'])
|
|
|
item.add_video_info("out_video_id", d_obj["id"])
|
|
|
item.add_video_info("platform", self.platform)
|
|
|
item.add_video_info("strategy", self.mode)
|
|
@@ -170,7 +171,6 @@ class HaoKanVideoAccount(object):
|
|
|
item=mq_obj,
|
|
|
trace_id=trace_id,
|
|
|
)
|
|
|
- print(mq_obj)
|
|
|
if pipeline.process_item():
|
|
|
self.mq.send_msg(mq_obj)
|
|
|
print(mq_obj)
|
|
@@ -186,11 +186,14 @@ class HaoKanVideoAccount(object):
|
|
|
|
|
|
|
|
|
if __name__ == "__main__":
|
|
|
- T = HaoKanVideoAccount(
|
|
|
- platform="haokanshipin",
|
|
|
- mode="author",
|
|
|
- rule_dict={},
|
|
|
- user_dict={"link": 1657075178605219},
|
|
|
- env="prod",
|
|
|
- )
|
|
|
- T.get_tiny_video_list()
|
|
|
+ select_user_sql = f"""select * from crawler_user_v3 where source = 'haokanshipin';"""
|
|
|
+ user_list = MysqlHelper.get_values("author", "haokanshipin", select_user_sql, "prod", action="")
|
|
|
+ print(json.dumps(user_list[0], ensure_ascii=False, indent=4))
|
|
|
+ # T = HaoKanVideoAccount(
|
|
|
+ # platform="haokanshipin",
|
|
|
+ # mode="author",
|
|
|
+ # rule_dict={},
|
|
|
+ # user_dict={"link": 1657075178605219},
|
|
|
+ # env="prod",
|
|
|
+ # )
|
|
|
+ # T.get_tiny_video_list()
|