|
@@ -132,7 +132,7 @@ class SpiderProcess(object):
|
|
|
select_sql = "SELECT video_id, video_title, label, channel, out_user_id, spider_mode, out_play_cnt, out_like_cnt, out_share_cnt FROM lightgbm_data WHERE type = 'spider';"
|
|
|
data_list = self.client_spider.select(select_sql)
|
|
|
df = []
|
|
|
- for line in tqdm(data_list[:10]):
|
|
|
+ for line in tqdm(data_list):
|
|
|
try:
|
|
|
temp = list(line)
|
|
|
video_id = line[0]
|
|
@@ -157,7 +157,7 @@ class SpiderProcess(object):
|
|
|
continue
|
|
|
df = pd.DataFrame(df, columns=['label', 'channel', 'out_user_id', 'mode', 'out_play_cnt', 'out_like_cnt',
|
|
|
'out_share_cnt', 'lop', 'duration', 'tag1', 'tag2', 'tag3'])
|
|
|
- df.to_json("data/train_data/spider_data_{}.json".format(datetime.datetime.today().strftime("y%m%d")),
|
|
|
+ df.to_json("data/train_data/spider_data_{}.json".format(datetime.datetime.today().strftime("%y%m%d")),
|
|
|
orient='records')
|
|
|
|
|
|
|