9 місяців тому · 5cd3bbe92c
--- a/app.py
+++ b/app.py
@@ -2,13 +2,16 @@
 
				 @author: luojunhui
			
 
				 """
			
 
				 from quart import Quart
			
 
				-from applications.routes import Routes
			
 
				-from applications.functions.async_mysql import AsyncMySQLClient
			
 
				+from server.routes import Routes
			
 
				+from applications.db import AsyncMySQLClient
			
 
				+from applications.config import Config
			
 
				 
			
 
				 # 初始化 App
			
 
				 app = Quart(__name__, static_folder='applications/static')
			
 
				+config = Config()
			
 
				+# 注册连接池
			
 
				 AsyncMySQL = AsyncMySQLClient(app)
			
 
				-app_routes = Routes(AsyncMySQL)
			
 
				+app_routes = Routes(AsyncMySQL, config)
			
 
				 app.register_blueprint(app_routes)
			
 
				 
			
 
				 
			
@@ -18,7 +21,7 @@ async def init_db():
 
				     初始化
			
 
				     :return:
			
 
				     """
			
 
				-    await AsyncMySQL.init_pool()
			
 
				+    await AsyncMySQL.initPool()
			
 
				 
			
 
				 
			
 
				 @app.after_serving
			
@@ -27,7 +30,7 @@ async def close_db():
 
				     关闭连接
			
 
				     :return:
			
 
				     """
			
 
				-    await AsyncMySQL.close_pool()
			
 
				+    await AsyncMySQL.closePool()
			
 
				 
			
 
				 
			
 
				 if __name__ == '__main__':
			
--- a/applications/config/__init__.py
+++ b/applications/config/__init__.py
@@ -0,0 +1,57 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+"""
			
 
				+import json
			
 
				+
			
 
				+import pyapollos
			
 
				+
			
 
				+
			
 
				+class Config(object):
			
 
				+    """
			
 
				+    apolloConfig
			
 
				+    """
			
 
				+
			
 
				+    def __init__(self, env="pre"):
			
 
				+        """
			
 
				+        :param env:
			
 
				+        """
			
 
				+        match env:
			
 
				+            case "prod":
			
 
				+                self.apolloConnection = pyapollos.ApolloClient(
			
 
				+                    app_id="LongArticlesMatchServer",
			
 
				+                    config_server_url="https://apolloconfig-internal.piaoquantv.com/",
			
 
				+                    timeout=10
			
 
				+                )
			
 
				+                self.articleVideos = "long_articles_match_videos"
			
 
				+                self.articleText = "long_articles_text"
			
 
				+                self.articleCrawlerVideos = "long_articles_crawler_videos"
			
 
				+                self.rootSourceIdTable = "long_articles_root_source_id"
			
 
				+            case "dev":
			
 
				+                self.apolloConnection = pyapollos.ApolloClient(
			
 
				+                    app_id="LongArticlesMatchServer",
			
 
				+                    config_server_url="https://devapolloconfig-internal.piaoquantv.com/",
			
 
				+                    timeout=10
			
 
				+                )
			
 
				+                self.articleVideos = "long_articles_match_videos_dev"
			
 
				+                self.articleText = "long_articles_text_dev"
			
 
				+                self.articleCrawlerVideos = "long_articles_crawler_videos_dev"
			
 
				+                self.rootSourceIdTable = "long_articles_root_source_id_dev"
			
 
				+            case "pre":
			
 
				+                self.articleVideos = "long_articles_match_videos"
			
 
				+                self.articleText = "long_articles_text"
			
 
				+                self.articleCrawlerVideos = "long_articles_crawler_videos"
			
 
				+                self.rootSourceIdTable = "long_articles_root_source_id"
			
 
				+                self.apolloConnection = pyapollos.ApolloClient(
			
 
				+                    app_id="LongArticlesMatchServer",
			
 
				+                    config_server_url="http://preapolloconfig-internal.piaoquantv.com/",
			
 
				+                    timeout=10
			
 
				+                )
			
 
				+
			
 
				+    def getConfigValue(self, key):
			
 
				+        """
			
 
				+        通过 key 获取配置的 Config
			
 
				+        :param key:
			
 
				+        :return:
			
 
				+        """
			
 
				+        response = self.apolloConnection.get_value(key)
			
 
				+        return response
			
--- a/applications/db/__init__.py
+++ b/applications/db/__init__.py
@@ -0,0 +1,137 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+self.app.mysql_pool = await aiomysql.create_pool(
			
 
				+            host='rm-bp1159bu17li9hi94.mysql.rds.aliyuncs.com',
			
 
				+            port=3306,
			
 
				+            user='crawler',
			
 
				+            password='crawler123456@',
			
 
				+            db='piaoquan-crawler',
			
 
				+            charset='utf8mb4',
			
 
				+            connect_timeout=120,
			
 
				+        )
			
 
				+"""
			
 
				+import aiomysql
			
 
				+
			
 
				+
			
 
				+class AsyncMySQLClient(object):
			
 
				+    """
			
 
				+    Async MySQL
			
 
				+    """
			
 
				+
			
 
				+    def __init__(self, app):
			
 
				+        self.app = app
			
 
				+
			
 
				+    async def initPool(self):
			
 
				+        """
			
 
				+        初始化连接
			
 
				+        host='',
			
 
				+        port=3306,
			
 
				+        user='changwen_admin',
			
 
				+        password='changwen@123456',
			
 
				+        db='long_articles',
			
 
				+        charset='utf8mb4'
			
 
				+        :return:
			
 
				+        """
			
 
				+        self.app.mysql_pool = await aiomysql.create_pool(
			
 
				+            host='rm-bp14529nwwcw75yr1ko.mysql.rds.aliyuncs.com',
			
 
				+            port=3306,
			
 
				+            user='changwen_admin',
			
 
				+            password='changwen@123456',
			
 
				+            db='long_articles',
			
 
				+            charset='utf8mb4',
			
 
				+            connect_timeout=120,
			
 
				+        )
			
 
				+        print("mysql init successfully")
			
 
				+
			
 
				+    async def closePool(self):
			
 
				+        """
			
 
				+        关闭 mysql 连接
			
 
				+        :return:
			
 
				+        """
			
 
				+        self.app.mysql_pool.close()
			
 
				+        await self.app.mysql_pool.wait_closed()
			
 
				+
			
 
				+    async def asyncSelect(self, sql):
			
 
				+        """
			
 
				+        select method
			
 
				+        :param sql:
			
 
				+        :return:
			
 
				+        """
			
 
				+        async with self.app.mysql_pool.acquire() as conn:
			
 
				+            async with conn.cursor() as cursor:
			
 
				+                await cursor.execute(sql)
			
 
				+                result = await cursor.fetchall()
			
 
				+                return result
			
 
				+
			
 
				+    async def asyncInsert(self, sql, params):
			
 
				+        """
			
 
				+        insert and update method
			
 
				+        :param params:
			
 
				+        :param sql:
			
 
				+        :return:
			
 
				+        """
			
 
				+        async with self.app.mysql_pool.acquire() as coon:
			
 
				+            async with coon.cursor() as cursor:
			
 
				+                try:
			
 
				+                    await cursor.execute(sql, params)
			
 
				+                    await coon.commit()
			
 
				+                except Exception as e:
			
 
				+                    await coon.rollback()
			
 
				+                    raise
			
 
				+
			
 
				+
			
 
				+class TaskMySQLClient(object):
			
 
				+    """
			
 
				+    Async MySQL
			
 
				+    """
			
 
				+
			
 
				+    def __init__(self):
			
 
				+        self.mysql_pool = None
			
 
				+
			
 
				+    async def init_pool(self):
			
 
				+        """
			
 
				+        初始化连接
			
 
				+        :return:
			
 
				+        """
			
 
				+        self.mysql_pool = await aiomysql.create_pool(
			
 
				+            host='rm-bp14529nwwcw75yr1ko.mysql.rds.aliyuncs.com',
			
 
				+            port=3306,
			
 
				+            user='changwen_admin',
			
 
				+            password='changwen@123456',
			
 
				+            db='long_articles',
			
 
				+            charset='utf8mb4',
			
 
				+            connect_timeout=120
			
 
				+        )
			
 
				+        print("mysql init successfully")
			
 
				+
			
 
				+    async def close_pool(self):
			
 
				+        """
			
 
				+        关闭 mysql 连接
			
 
				+        :return:
			
 
				+        """
			
 
				+        self.mysql_pool.close()
			
 
				+        await self.mysql_pool.wait_closed()
			
 
				+
			
 
				+    async def asyncSelect(self, sql):
			
 
				+        """
			
 
				+        select method
			
 
				+        :param sql:
			
 
				+        :return:
			
 
				+        """
			
 
				+        async with self.mysql_pool.acquire() as conn:
			
 
				+            async with conn.cursor() as cursor:
			
 
				+                await cursor.execute(sql)
			
 
				+                result = await cursor.fetchall()
			
 
				+                return result
			
 
				+
			
 
				+    async def asyncInsert(self, sql, params):
			
 
				+        """
			
 
				+        insert and update method
			
 
				+        :param params:
			
 
				+        :param sql:
			
 
				+        :return:
			
 
				+        """
			
 
				+        async with self.mysql_pool.acquire() as coon:
			
 
				+            async with coon.cursor() as cursor:
			
 
				+                await cursor.execute(sql, params)
			
 
				+                await coon.commit()
			
--- a/applications/deal/getOffVideos.py
+++ b/applications/deal/getOffVideos.py
@@ -3,8 +3,6 @@
 
				 """
			
 
				 import time
			
 
				 
			
 
				-from static.config import db_article
			
 
				-
			
 
				 
			
 
				 class GetOffVideos(object):
			
 
				     """
			
--- a/applications/functions/async_mysql.py
+++ b/applications/functions/async_mysql.py
@@ -1,61 +0,0 @@
 
				-"""
			
 
				-@author: luojunhui
			
 
				-"""
			
 
				-import aiomysql
			
 
				-
			
 
				-
			
 
				-class AsyncMySQLClient(object):
			
 
				-    """
			
 
				-    Async MySQL
			
 
				-    """
			
 
				-
			
 
				-    def __init__(self, app):
			
 
				-        self.app = app
			
 
				-
			
 
				-    async def init_pool(self):
			
 
				-        """
			
 
				-        初始化连接
			
 
				-        :return:
			
 
				-        """
			
 
				-        self.app.mysql_pool = await aiomysql.create_pool(
			
 
				-            host='rm-bp1159bu17li9hi94.mysql.rds.aliyuncs.com',
			
 
				-            port=3306,
			
 
				-            user='crawler',
			
 
				-            password='crawler123456@',
			
 
				-            db='piaoquan-crawler',
			
 
				-            charset='utf8mb4',
			
 
				-            connect_timeout=120,
			
 
				-        )
			
 
				-        print("mysql init successfully")
			
 
				-
			
 
				-    async def close_pool(self):
			
 
				-        """
			
 
				-        关闭 mysql 连接
			
 
				-        :return:
			
 
				-        """
			
 
				-        self.app.mysql_pool.close()
			
 
				-        await self.app.mysql_pool.wait_closed()
			
 
				-
			
 
				-    async def async_select(self, sql):
			
 
				-        """
			
 
				-        select method
			
 
				-        :param sql:
			
 
				-        :return:
			
 
				-        """
			
 
				-        async with self.app.mysql_pool.acquire() as conn:
			
 
				-            async with conn.cursor() as cursor:
			
 
				-                await cursor.execute(sql)
			
 
				-                result = await cursor.fetchall()
			
 
				-                return result
			
 
				-
			
 
				-    async def async_insert(self, sql, params):
			
 
				-        """
			
 
				-        insert and update method
			
 
				-        :param params:
			
 
				-        :param sql:
			
 
				-        :return:
			
 
				-        """
			
 
				-        async with self.app.mysql_pool.acquire() as coon:
			
 
				-            async with coon.cursor() as cursor:
			
 
				-                await cursor.execute(sql, params)
			
 
				-                await coon.commit()
			
--- a/applications/functions/kimi.py
+++ b/applications/functions/kimi.py
@@ -21,9 +21,9 @@ class KimiServer(object):
 
				         :param params:
			
 
				         :return:
			
 
				         """
			
 
				-        title = params['title'].split("@@")[-1]
			
 
				-        contents = params['content']
			
 
				-        trace_id = params['trace_id']
			
 
				+        title = params['articleTitle'].split("@@")[-1]
			
 
				+        contents = params['articleText']
			
 
				+        trace_id = params['contentId']
			
 
				         try:
			
 
				             kimi_title = await cls.kimi_title(title)
			
 
				         except Exception as e:
			
--- a/applications/functions/pqFunctions.py
+++ b/applications/functions/pqFunctions.py
@@ -43,13 +43,8 @@ async def publishToPQ(video_obj):
 
				         "appType": 888880,
			
 
				         "repeatStatus": 1
			
 
				     }
			
 
				-    # response = requests.post(
			
 
				-    #     url=url,
			
 
				-    #     headers=headers,
			
 
				-    #     data=payload,
			
 
				-    # )
			
 
				-    # return response.json()
			
 
				     response = await async_post(url, headers, payload)
			
 
				+    print(json.dumps(response, ensure_ascii=False, indent=4))
			
 
				     return response
			
 
				 
			
 
				 
			
--- a/applications/functions/video_item.py
+++ b/applications/functions/video_item.py
@@ -74,7 +74,7 @@ class VideoItem(object):
 
				         must_keys = [
			
 
				             "video_id",
			
 
				             "user_id",
			
 
				-            "user_name",
			
 
				+            # "user_name",
			
 
				             "out_video_id",
			
 
				             "session",
			
 
				             "video_url",
			
@@ -126,8 +126,8 @@ class VideoProducer(object):
 
				         platform = "weixin_search"
			
 
				         publish_time_stamp = int(video_obj['pubTime'])
			
 
				         item = VideoItem()
			
 
				-        item.add_video_info("user_id", user["uid"])
			
 
				-        item.add_video_info("user_name", user["nick_name"])
			
 
				+        item.add_video_info("user_id", user)
			
 
				+        # item.add_video_info("user_name", user["nick_name"])
			
 
				         item.add_video_info("video_id", video_obj['hashDocID'])
			
 
				         item.add_video_info("video_title", trace_id)
			
 
				         item.add_video_info("publish_time_stamp", int(publish_time_stamp))
			
@@ -153,10 +153,10 @@ class VideoProducer(object):
 
				         platform = "baidu_search"
			
 
				         publish_time_stamp = int(video_obj['publish_time'])
			
 
				         item = VideoItem()
			
 
				-        print("baidu")
			
 
				-        print(json.dumps(video_obj, ensure_ascii=False, indent=4))
			
 
				-        item.add_video_info("user_id", user["uid"])
			
 
				-        item.add_video_info("user_name", user["nick_name"])
			
 
				+        # print("baidu")
			
 
				+        # print(json.dumps(video_obj, ensure_ascii=False, indent=4))
			
 
				+        item.add_video_info("user_id", user)
			
 
				+        # item.add_video_info("user_name", user["nick_name"])
			
 
				         item.add_video_info("video_id", video_obj['id'])
			
 
				         item.add_video_info("video_title", video_obj['title'])
			
 
				         item.add_video_info("publish_time_stamp", publish_time_stamp)
			
@@ -185,8 +185,8 @@ class VideoProducer(object):
 
				         platform = "xg_search"
			
 
				         publish_time_stamp = int(video_obj['publish_time'])
			
 
				         item = VideoItem()
			
 
				-        item.add_video_info("user_id", user["uid"])
			
 
				-        item.add_video_info("user_name", user["nick_name"])
			
 
				+        item.add_video_info("user_id", user)
			
 
				+        # item.add_video_info("user_name", user["nick_name"])
			
 
				         item.add_video_info("video_id", video_obj['video_id'])
			
 
				         item.add_video_info("video_title", video_obj.get('video_title'))
			
 
				         item.add_video_info("publish_time_stamp", int(publish_time_stamp))
			
@@ -214,10 +214,10 @@ class VideoProducer(object):
 
				         platform = "dy_search"
			
 
				         publish_time_stamp = int(video_obj['publish_timestamp'] / 1000)
			
 
				         item = VideoItem()
			
 
				-        print("douyin")
			
 
				-        print(json.dumps(video_obj, ensure_ascii=False, indent=4))
			
 
				-        item.add_video_info("user_id", user["uid"])
			
 
				-        item.add_video_info("user_name", user["nick_name"])
			
 
				+        # print("douyin")
			
 
				+        # print(json.dumps(video_obj, ensure_ascii=False, indent=4))
			
 
				+        item.add_video_info("user_id", user)
			
 
				+        # item.add_video_info("user_name", user["nick_name"])
			
 
				         item.add_video_info("video_id", video_obj['channel_content_id'])
			
 
				         item.add_video_info("video_title", video_obj['title'])
			
 
				         item.add_video_info("publish_time_stamp", int(publish_time_stamp))
			
--- a/applications/spider/__init__.py
+++ b/applications/spider/__init__.py
@@ -0,0 +1,116 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+"""
			
 
				+from datetime import datetime
			
 
				+
			
 
				+from applications.functions.video_item import VideoProducer
			
 
				+from applications.functions.log import logging
			
 
				+from applications.match_algorithm.rank import title_similarity_rank
			
 
				+from .spiderAB import SearchABTest
			
 
				+from .spiderSchedule import SearchMethod
			
 
				+
			
 
				+
			
 
				+async def videoSender(video_obj, user, trace_id, platform, content_id, table, dbClient):
			
 
				+    """
			
 
				+    异步处理微信 video_obj
			
 
				+    公众号和站内账号一一对应
			
 
				+    :param dbClient:
			
 
				+    :param table:
			
 
				+    :param content_id：
			
 
				+    :param platform:
			
 
				+    :param user:
			
 
				+    :param trace_id:
			
 
				+    :param video_obj:
			
 
				+    :return:
			
 
				+    """
			
 
				+    Video = VideoProducer()
			
 
				+    if platform == "xg_search":
			
 
				+        mq_obj = Video.xg_video_producer(
			
 
				+            video_obj=video_obj,
			
 
				+            user=user,
			
 
				+            trace_id=trace_id,
			
 
				+        )
			
 
				+    elif platform == "baidu_search":
			
 
				+        mq_obj = Video.baidu_video_producer(
			
 
				+            video_obj=video_obj,
			
 
				+            user=user,
			
 
				+            trace_id=trace_id,
			
 
				+        )
			
 
				+    elif platform == "wx_search":
			
 
				+        mq_obj = Video.wx_video_producer(
			
 
				+            video_obj=video_obj,
			
 
				+            user=user,
			
 
				+            trace_id=trace_id,
			
 
				+        )
			
 
				+    elif platform == "dy_search":
			
 
				+        mq_obj = Video.dy_video_producer(
			
 
				+            video_obj=video_obj,
			
 
				+            user=user,
			
 
				+            trace_id=trace_id,
			
 
				+        )
			
 
				+    else:
			
 
				+        mq_obj = {}
			
 
				+    mq_obj['trace_id'] = trace_id
			
 
				+    mq_obj['content_id'] = content_id
			
 
				+    insert_sql = f"""
			
 
				+    INSERT INTO {table}
			
 
				+    (content_id, out_video_id, platform, video_title, play_count, like_count, publish_time, crawler_time, duration, video_url, cover_url, user_id, trace_id)
			
 
				+    values 
			
 
				+    (%s, %s, %s, %s, %s, %s, %s, %s, %s, %s, %s, %s, %s);
			
 
				+    """
			
 
				+    await dbClient.asyncInsert(
			
 
				+        sql=insert_sql,
			
 
				+        params=(
			
 
				+            content_id,
			
 
				+            mq_obj['video_id'],
			
 
				+            platform,
			
 
				+            mq_obj['video_title'],
			
 
				+            mq_obj['play_cnt'],
			
 
				+            mq_obj['like_cnt'],
			
 
				+            datetime.fromtimestamp(mq_obj['publish_time_stamp']).strftime('%Y-%m-%d %H:%M:%S'),
			
 
				+            datetime.now().__str__(),
			
 
				+            mq_obj['duration'],
			
 
				+            mq_obj['video_url'],
			
 
				+            mq_obj['cover_url'],
			
 
				+            mq_obj['user_id'],
			
 
				+            trace_id
			
 
				+        )
			
 
				+    )
			
 
				+
			
 
				+
			
 
				+async def searchVideos(info, ghIdMap, dbClient):
			
 
				+    """
			
 
				+    search and send msg to ETL
			
 
				+    :param dbClient:
			
 
				+    :param ghIdMap:
			
 
				+    :param info:
			
 
				+    :return:
			
 
				+    """
			
 
				+    SearchAB = SearchABTest(info=info, searchMethod=SearchMethod())
			
 
				+    # 启三个搜索，每个搜索都保证要搜索到， 分别用key1， key2， key3去搜索
			
 
				+    trace_id = info['traceId']
			
 
				+    gh_id = info['ghId']
			
 
				+    content_id = info['contentId']
			
 
				+    recall_list = await SearchAB.ab_5()
			
 
				+    logging(
			
 
				+        code="1006",
			
 
				+        info="搜索到{}条视频".format(len(recall_list)),
			
 
				+        data=recall_list,
			
 
				+        trace_id=info['traceId']
			
 
				+    )
			
 
				+    # 按照标题相似度排序
			
 
				+    ranked_list = title_similarity_rank(content_title=info['oriTitle'].split("@@")[-1], recall_list=recall_list)
			
 
				+    for recall_obj in ranked_list:
			
 
				+        if recall_obj:
			
 
				+            platform = recall_obj['platform']
			
 
				+            recall_video = recall_obj['result']
			
 
				+            if recall_video:
			
 
				+                await videoSender(
			
 
				+                    video_obj=recall_video,
			
 
				+                    user=ghIdMap.get(gh_id, 69637498),
			
 
				+                    trace_id=trace_id,
			
 
				+                    platform=platform,
			
 
				+                    content_id=content_id,
			
 
				+                    table=info['spider'],
			
 
				+                    dbClient=dbClient
			
 
				+                )
			
--- a/applications/spider/spiderAB.py
+++ b/applications/spider/spiderAB.py
@@ -0,0 +1,169 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+"""
			
 
				+
			
 
				+
			
 
				+class SearchABTest(object):
			
 
				+    """
			
 
				+    搜索策略实验方案
			
 
				+    """
			
 
				+
			
 
				+    ori_title = None
			
 
				+    article_summary = None
			
 
				+    article_keys = None
			
 
				+    trace_id = None
			
 
				+
			
 
				+    def __init__(self, info, searchMethod):
			
 
				+        SearchABTest.set_class_properties(info, searchMethod)
			
 
				+
			
 
				+    @classmethod
			
 
				+    def set_class_properties(cls, info, searchMethod):
			
 
				+        """
			
 
				+        初始化搜索策略实验类
			
 
				+        :param searchMethod:
			
 
				+        :param info: kimi 挖掘的基本信息
			
 
				+        :return:
			
 
				+        """
			
 
				+        cls.ori_title = info["oriTitle"]
			
 
				+        cls.article_summary = info["kimiSummary"]
			
 
				+        cls.article_keys = info["kimiKeys"]
			
 
				+        cls.trace_id = info["traceId"]
			
 
				+        cls.searchMethod = searchMethod
			
 
				+
			
 
				+    @classmethod
			
 
				+    async def base_line(cls):
			
 
				+        """
			
 
				+        兜底策略
			
 
				+        """
			
 
				+        result = await cls.searchMethod.search_v1(
			
 
				+            text=cls.article_keys[0],
			
 
				+            trace_id=cls.trace_id
			
 
				+        )
			
 
				+        if result:
			
 
				+            return result
			
 
				+        else:
			
 
				+            sub_result = await cls.searchMethod.search_v1(
			
 
				+                text=cls.article_keys[1],
			
 
				+                trace_id=cls.trace_id)
			
 
				+            if sub_result:
			
 
				+                return sub_result
			
 
				+            else:
			
 
				+                return await cls.searchMethod.search_v1(
			
 
				+                    text=cls.article_keys[2],
			
 
				+                    trace_id=cls.trace_id
			
 
				+                )
			
 
				+
			
 
				+    @classmethod
			
 
				+    async def ab_0(cls):
			
 
				+        """
			
 
				+        默认原标题搜索
			
 
				+        :return:
			
 
				+        """
			
 
				+        search_result = await cls.searchMethod.search_v1(
			
 
				+            text=cls.ori_title,
			
 
				+            trace_id=cls.trace_id
			
 
				+        )
			
 
				+        if search_result:
			
 
				+            return search_result
			
 
				+        else:
			
 
				+            return await cls.base_line()
			
 
				+
			
 
				+    @classmethod
			
 
				+    async def ab_1(cls):
			
 
				+        """
			
 
				+        使用 content_summary搜索
			
 
				+        :return:
			
 
				+        """
			
 
				+        search_result = await cls.searchMethod.search_v1(
			
 
				+            text=cls.article_summary,
			
 
				+            trace_id=cls.trace_id
			
 
				+        )
			
 
				+        if search_result:
			
 
				+            return search_result
			
 
				+        else:
			
 
				+            return await cls.ab_0()
			
 
				+
			
 
				+    @classmethod
			
 
				+    async def ab_2(cls):
			
 
				+        """
			
 
				+        使用文本关键词搜索
			
 
				+        :return:
			
 
				+        """
			
 
				+        search_result = await cls.searchMethod.search_v1(
			
 
				+            text=cls.article_keys[0],
			
 
				+            trace_id=cls.trace_id
			
 
				+        )
			
 
				+        if search_result:
			
 
				+            return search_result
			
 
				+        else:
			
 
				+            return await cls.base_line()
			
 
				+
			
 
				+    @classmethod
			
 
				+    async def ab_3(cls):
			
 
				+        """
			
 
				+        使用文本关键词搜索
			
 
				+        :return:
			
 
				+        """
			
 
				+        search_result = await cls.searchMethod.search_v1(
			
 
				+            text=cls.article_keys[1],
			
 
				+            trace_id=cls.trace_id
			
 
				+        )
			
 
				+        if search_result:
			
 
				+            return search_result
			
 
				+        else:
			
 
				+            return await cls.base_line()
			
 
				+
			
 
				+    @classmethod
			
 
				+    async def ab_4(cls):
			
 
				+        """
			
 
				+        使用文本关键词搜索
			
 
				+        :return:
			
 
				+        """
			
 
				+        search_result = await cls.searchMethod.search_v1(
			
 
				+            text=cls.article_keys[2],
			
 
				+            trace_id=cls.trace_id
			
 
				+        )
			
 
				+        if search_result:
			
 
				+            return search_result
			
 
				+        else:
			
 
				+            return await cls.base_line()
			
 
				+
			
 
				+    @classmethod
			
 
				+    async def ab_5(cls):
			
 
				+        """
			
 
				+        增量搜索, 返回result_list
			
 
				+        :return:
			
 
				+        """
			
 
				+        result_list = await cls.searchMethod.search_v2(
			
 
				+            text=cls.article_summary[:15],
			
 
				+            trace_id=cls.trace_id
			
 
				+        )
			
 
				+        if len(result_list) > 3:
			
 
				+            return result_list
			
 
				+        else:
			
 
				+            result_list += await cls.searchMethod.search_v2(
			
 
				+                text=cls.ori_title[:15],
			
 
				+                trace_id=cls.trace_id
			
 
				+            )
			
 
				+            if len(result_list) > 3:
			
 
				+                return result_list
			
 
				+            else:
			
 
				+                result_list += await cls.searchMethod.search_v2(
			
 
				+                    text=cls.article_keys[0],
			
 
				+                    trace_id=cls.trace_id
			
 
				+                )
			
 
				+                if len(result_list) > 3:
			
 
				+                    return result_list
			
 
				+                else:
			
 
				+                    result_list += await cls.searchMethod.search_v2(
			
 
				+                        text=cls.article_keys[1],
			
 
				+                        trace_id=cls.trace_id
			
 
				+                    )
			
 
				+                    if result_list:
			
 
				+                        return result_list
			
 
				+                    else:
			
 
				+                        result_list += await cls.searchMethod.search_v2(
			
 
				+                            text=cls.article_keys[2],
			
 
				+                            trace_id=cls.trace_id
			
 
				+                        )
			
 
				+                        return result_list
			
--- a/applications/spider/spiderSchedule.py
+++ b/applications/spider/spiderSchedule.py
@@ -0,0 +1,58 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+"""
			
 
				+import time
			
 
				+from applications.search import *
			
 
				+
			
 
				+
			
 
				+class SearchMethod(object):
			
 
				+    """
			
 
				+    搜索召回模式
			
 
				+    """
			
 
				+    s_words = []
			
 
				+
			
 
				+    @classmethod
			
 
				+    async def search_v1(cls, text, trace_id):
			
 
				+        """
			
 
				+        dy ---> baidu ---> xigua
			
 
				+        :param text:
			
 
				+        :param trace_id:
			
 
				+        :return:
			
 
				+        """
			
 
				+        douyin_result = douyin_search(keyword=text, sensitive_words=cls.s_words, trace_id=trace_id)
			
 
				+        if douyin_result:
			
 
				+            return {"platform": "dy_search", "result": douyin_result[0]}
			
 
				+        else:
			
 
				+            time.sleep(1)
			
 
				+            baidu_result = hksp_search(key=text, sensitive_words=cls.s_words, trace_id=trace_id)
			
 
				+            if baidu_result:
			
 
				+                return {"platform": "baidu_search", "result": baidu_result[0]}
			
 
				+            else:
			
 
				+                xigua_result = xigua_search_v2(keyword=text, sensitive_words=cls.s_words)
			
 
				+                if xigua_result:
			
 
				+                    return {"platform": "xg_search", "result": xigua_result[0]}
			
 
				+                else:
			
 
				+                    return None
			
 
				+
			
 
				+    @classmethod
			
 
				+    async def search_v2(cls, text, trace_id):
			
 
				+        """
			
 
				+        dy ---> baidu ---> xigua
			
 
				+        :param trace_id:
			
 
				+        :param text:
			
 
				+        :return:
			
 
				+        """
			
 
				+        L = []
			
 
				+        douyin_result = douyin_search(keyword=text, sensitive_words=cls.s_words, trace_id=trace_id)
			
 
				+        for vid_obj in douyin_result:
			
 
				+            L.append({"platform": "dy_search", "result": vid_obj})
			
 
				+        if len(L) >= 3:
			
 
				+            return L
			
 
				+        else:
			
 
				+            baidu_result = hksp_search(key=text, sensitive_words=cls.s_words, trace_id=trace_id)
			
 
				+            if baidu_result:
			
 
				+                L.append({"platform": "baidu_search", "result": baidu_result[0]})
			
 
				+            xigua_result = xigua_search_v2(keyword=text, sensitive_words=cls.s_words)
			
 
				+            if xigua_result:
			
 
				+                L.append({"platform": "xg_search", "result": xigua_result[0]})
			
 
				+            return L
			
--- a/etlTask.py
+++ b/etlTask.py
@@ -0,0 +1,27 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+"""
			
 
				+import time
			
 
				+import asyncio
			
 
				+import datetime
			
 
				+from tasks.etl_task import AsyncETL
			
 
				+from applications.db import TaskMySQLClient
			
 
				+
			
 
				+
			
 
				+async def main():
			
 
				+    """
			
 
				+    main job
			
 
				+    :return:
			
 
				+    """
			
 
				+    TMC = TaskMySQLClient()
			
 
				+    await TMC.init_pool()
			
 
				+    PD = AsyncETL(TMC)
			
 
				+    await PD.deal()
			
 
				+
			
 
				+
			
 
				+if __name__ == '__main__':
			
 
				+    while True:
			
 
				+        asyncio.run(main())
			
 
				+        now_str = datetime.datetime.now().__str__()
			
 
				+        print("{}    请求执行完成， 等待10s".format(now_str))
			
 
				+        time.sleep(10)
			
--- a/historyTask.py
+++ b/historyTask.py
@@ -0,0 +1,27 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+"""
			
 
				+import time
			
 
				+import asyncio
			
 
				+import datetime
			
 
				+from tasks.history_task import historyContentIdTask
			
 
				+from applications.db import TaskMySQLClient
			
 
				+
			
 
				+
			
 
				+async def main():
			
 
				+    """
			
 
				+    main job
			
 
				+    :return:
			
 
				+    """
			
 
				+    TMC = TaskMySQLClient()
			
 
				+    await TMC.init_pool()
			
 
				+    PD = historyContentIdTask(TMC)
			
 
				+    await PD.deal()
			
 
				+
			
 
				+
			
 
				+if __name__ == '__main__':
			
 
				+    while True:
			
 
				+        asyncio.run(main())
			
 
				+        now_str = datetime.datetime.now().__str__()
			
 
				+        print("{}    请求执行完成， 等待10s".format(now_str))
			
 
				+        time.sleep(10)
			
--- a/kimiTask.py
+++ b/kimiTask.py
@@ -0,0 +1,24 @@
 
				+import time
			
 
				+import asyncio
			
 
				+import datetime
			
 
				+from tasks.kimi_task import KimiTask
			
 
				+from applications.db import TaskMySQLClient
			
 
				+
			
 
				+
			
 
				+async def main():
			
 
				+    """
			
 
				+    main job
			
 
				+    :return:
			
 
				+    """
			
 
				+    TMC = TaskMySQLClient()
			
 
				+    await TMC.init_pool()
			
 
				+    PD = KimiTask(TMC)
			
 
				+    await PD.deal()
			
 
				+
			
 
				+
			
 
				+if __name__ == '__main__':
			
 
				+    while True:
			
 
				+        asyncio.run(main())
			
 
				+        now_str = datetime.datetime.now().__str__()
			
 
				+        print("{}    请求执行完成， 等待10s".format(now_str))
			
 
				+        time.sleep(10)
			
--- a/matchVideoFromHistoryArticleASC.py
+++ b/matchVideoFromHistoryArticleASC.py
@@ -1,86 +0,0 @@
 
				-"""
			
 
				-@author: luojunhui
			
 
				-"""
			
 
				-import datetime
			
 
				-import time
			
 
				-
			
 
				-import aiomysql
			
 
				-import asyncio
			
 
				-
			
 
				-from tasks import MatchTask3
			
 
				-
			
 
				-
			
 
				-class TaskMySQLClient(object):
			
 
				-    """
			
 
				-    Async MySQL
			
 
				-    """
			
 
				-
			
 
				-    def __init__(self):
			
 
				-        self.mysql_pool = None
			
 
				-
			
 
				-    async def init_pool(self):
			
 
				-        """
			
 
				-        初始化连接
			
 
				-        :return:
			
 
				-        """
			
 
				-        self.mysql_pool = await aiomysql.create_pool(
			
 
				-            host='rm-bp1159bu17li9hi94.mysql.rds.aliyuncs.com',
			
 
				-            port=3306,
			
 
				-            user='crawler',
			
 
				-            password='crawler123456@',
			
 
				-            db='piaoquan-crawler',
			
 
				-            charset='utf8mb4',
			
 
				-            connect_timeout=120,
			
 
				-        )
			
 
				-        print("mysql init successfully")
			
 
				-
			
 
				-    async def close_pool(self):
			
 
				-        """
			
 
				-        关闭 mysql 连接
			
 
				-        :return:
			
 
				-        """
			
 
				-        self.mysql_pool.close()
			
 
				-        await self.mysql_pool.wait_closed()
			
 
				-
			
 
				-    async def async_select(self, sql):
			
 
				-        """
			
 
				-        select method
			
 
				-        :param sql:
			
 
				-        :return:
			
 
				-        """
			
 
				-        async with self.mysql_pool.acquire() as conn:
			
 
				-            async with conn.cursor() as cursor:
			
 
				-                await cursor.execute(sql)
			
 
				-                result = await cursor.fetchall()
			
 
				-                return result
			
 
				-
			
 
				-    async def async_insert(self, sql, params):
			
 
				-        """
			
 
				-        insert and update method
			
 
				-        :param params:
			
 
				-        :param sql:
			
 
				-        :return:
			
 
				-        """
			
 
				-        async with self.mysql_pool.acquire() as coon:
			
 
				-            async with coon.cursor() as cursor:
			
 
				-                await cursor.execute(sql, params)
			
 
				-                await coon.commit()
			
 
				-
			
 
				-
			
 
				-async def main():
			
 
				-    """
			
 
				-    main job
			
 
				-    :return:
			
 
				-    """
			
 
				-    TMC = TaskMySQLClient()
			
 
				-    await TMC.init_pool()
			
 
				-    PD = MatchTask3(TMC)
			
 
				-    await PD.deal()
			
 
				-    now_str = datetime.datetime.now().__str__()
			
 
				-    print("{}    请求执行完成， 等待1分钟".format(now_str))
			
 
				-    await asyncio.sleep(1 * 60)
			
 
				-
			
 
				-
			
 
				-if __name__ == '__main__':
			
 
				-    while True:
			
 
				-        asyncio.run(main())
			
--- a/matchVideoFromHistoryArticleDESC.py
+++ b/matchVideoFromHistoryArticleDESC.py
@@ -1,84 +0,0 @@
 
				-"""
			
 
				-@author: luojunhui
			
 
				-"""
			
 
				-import datetime
			
 
				-import aiomysql
			
 
				-import asyncio
			
 
				-
			
 
				-from tasks import MatchTask4
			
 
				-
			
 
				-
			
 
				-class TaskMySQLClient(object):
			
 
				-    """
			
 
				-    Async MySQL
			
 
				-    """
			
 
				-
			
 
				-    def __init__(self):
			
 
				-        self.mysql_pool = None
			
 
				-
			
 
				-    async def init_pool(self):
			
 
				-        """
			
 
				-        初始化连接
			
 
				-        :return:
			
 
				-        """
			
 
				-        self.mysql_pool = await aiomysql.create_pool(
			
 
				-            host='rm-bp1159bu17li9hi94.mysql.rds.aliyuncs.com',
			
 
				-            port=3306,
			
 
				-            user='crawler',
			
 
				-            password='crawler123456@',
			
 
				-            db='piaoquan-crawler',
			
 
				-            charset='utf8mb4',
			
 
				-            connect_timeout=120,
			
 
				-        )
			
 
				-        print("mysql init successfully")
			
 
				-
			
 
				-    async def close_pool(self):
			
 
				-        """
			
 
				-        关闭 mysql 连接
			
 
				-        :return:
			
 
				-        """
			
 
				-        self.mysql_pool.close()
			
 
				-        await self.mysql_pool.wait_closed()
			
 
				-
			
 
				-    async def async_select(self, sql):
			
 
				-        """
			
 
				-        select method
			
 
				-        :param sql:
			
 
				-        :return:
			
 
				-        """
			
 
				-        async with self.mysql_pool.acquire() as conn:
			
 
				-            async with conn.cursor() as cursor:
			
 
				-                await cursor.execute(sql)
			
 
				-                result = await cursor.fetchall()
			
 
				-                return result
			
 
				-
			
 
				-    async def async_insert(self, sql, params):
			
 
				-        """
			
 
				-        insert and update method
			
 
				-        :param params:
			
 
				-        :param sql:
			
 
				-        :return:
			
 
				-        """
			
 
				-        async with self.mysql_pool.acquire() as coon:
			
 
				-            async with coon.cursor() as cursor:
			
 
				-                await cursor.execute(sql, params)
			
 
				-                await coon.commit()
			
 
				-
			
 
				-
			
 
				-async def main():
			
 
				-    """
			
 
				-    main2
			
 
				-    :return:
			
 
				-    """
			
 
				-    TMC = TaskMySQLClient()
			
 
				-    await TMC.init_pool()
			
 
				-    PD = MatchTask4(TMC)
			
 
				-    await PD.deal()
			
 
				-    now_str = datetime.datetime.now().__str__()
			
 
				-    print("{}    请求执行完成， 等待10s".format(now_str))
			
 
				-    await asyncio.sleep(10)
			
 
				-
			
 
				-
			
 
				-if __name__ == '__main__':
			
 
				-    while True:
			
 
				-        asyncio.run(main())
			
--- a/match_video_task.py
+++ b/match_video_task.py
@@ -1,86 +0,0 @@
 
				-"""
			
 
				-@author: luojunhui
			
 
				-"""
			
 
				-import time
			
 
				-import datetime
			
 
				-import asyncio
			
 
				-
			
 
				-import aiomysql
			
 
				-from tasks import MatchTask1
			
 
				-
			
 
				-
			
 
				-class TaskMySQLClient(object):
			
 
				-    """
			
 
				-    Async MySQL
			
 
				-    """
			
 
				-
			
 
				-    def __init__(self):
			
 
				-        self.mysql_pool = None
			
 
				-
			
 
				-    async def init_pool(self):
			
 
				-        """
			
 
				-        初始化连接
			
 
				-        :return:
			
 
				-        """
			
 
				-        self.mysql_pool = await aiomysql.create_pool(
			
 
				-            host='rm-bp1159bu17li9hi94.mysql.rds.aliyuncs.com',
			
 
				-            port=3306,
			
 
				-            user='crawler',
			
 
				-            password='crawler123456@',
			
 
				-            db='piaoquan-crawler',
			
 
				-            charset='utf8mb4',
			
 
				-            connect_timeout=120,
			
 
				-        )
			
 
				-        print("mysql init successfully")
			
 
				-
			
 
				-    async def close_pool(self):
			
 
				-        """
			
 
				-        关闭 mysql 连接
			
 
				-        :return:
			
 
				-        """
			
 
				-        self.mysql_pool.close()
			
 
				-        await self.mysql_pool.wait_closed()
			
 
				-
			
 
				-    async def async_select(self, sql):
			
 
				-        """
			
 
				-        select method
			
 
				-        :param sql:
			
 
				-        :return:
			
 
				-        """
			
 
				-        async with self.mysql_pool.acquire() as conn:
			
 
				-            async with conn.cursor() as cursor:
			
 
				-                await cursor.execute(sql)
			
 
				-                result = await cursor.fetchall()
			
 
				-                return result
			
 
				-
			
 
				-    async def async_insert(self, sql, params):
			
 
				-        """
			
 
				-        insert and update method
			
 
				-        :param params:
			
 
				-        :param sql:
			
 
				-        :return:
			
 
				-        """
			
 
				-        async with self.mysql_pool.acquire() as coon:
			
 
				-            async with coon.cursor() as cursor:
			
 
				-                await cursor.execute(sql, params)
			
 
				-                await coon.commit()
			
 
				-
			
 
				-
			
 
				-async def main():
			
 
				-    """
			
 
				-    main job
			
 
				-    :return:
			
 
				-    """
			
 
				-    TMC = TaskMySQLClient()
			
 
				-    await TMC.init_pool()
			
 
				-    PD = MatchTask1(TMC)
			
 
				-    await PD.deal()
			
 
				-
			
 
				-
			
 
				-if __name__ == '__main__':
			
 
				-    while True:
			
 
				-        asyncio.run(main())
			
 
				-        now_str = datetime.datetime.now().__str__()
			
 
				-        print("{}    请求执行完成， 等待10s".format(now_str))
			
 
				-        time.sleep(10)
			
 
				-
			
--- a/publishtask.py
+++ b/publishtask.py
@@ -0,0 +1,27 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+"""
			
 
				+import time
			
 
				+import asyncio
			
 
				+import datetime
			
 
				+from tasks.publish_task import publishTask
			
 
				+from applications.db import TaskMySQLClient
			
 
				+
			
 
				+
			
 
				+async def main():
			
 
				+    """
			
 
				+    main job
			
 
				+    :return:
			
 
				+    """
			
 
				+    TMC = TaskMySQLClient()
			
 
				+    await TMC.init_pool()
			
 
				+    PD = publishTask(TMC)
			
 
				+    await PD.deal()
			
 
				+
			
 
				+
			
 
				+if __name__ == '__main__':
			
 
				+    while True:
			
 
				+        asyncio.run(main())
			
 
				+        now_str = datetime.datetime.now().__str__()
			
 
				+        print("{}    请求执行完成， 等待10s".format(now_str))
			
 
				+        time.sleep(10)
			
--- a/requirements.txt
+++ b/requirements.txt
@@ -1,107 +1,11 @@
 
				-aiofiles==23.2.1
			
 
				-aiohttp==3.9.3
			
 
				-aiosignal==1.3.1
			
 
				-alembic==1.11.1
			
 
				-aliyun-log-python-sdk==0.9.1
			
 
				-aliyun-python-sdk-core==2.15.1
			
 
				-aliyun-python-sdk-kms==2.16.2
			
 
				-annotated-types==0.6.0
			
 
				-anyio==4.3.0
			
 
				-APScheduler==3.10.1
			
 
				-async-timeout==4.0.3
			
 
				-attrs==23.2.0
			
 
				-backports.zoneinfo==0.2.1
			
 
				-black==24.3.0
			
 
				-blinker==1.6.2
			
 
				-cachelib==0.12.0
			
 
				-certifi==2024.2.2
			
 
				-cffi==1.15.1
			
 
				-charset-normalizer==3.3.2
			
 
				-click==8.1.6
			
 
				-colorama==0.4.6
			
 
				-crcmod==1.7
			
 
				-cryptography==41.0.2
			
 
				-dateparser==1.2.0
			
 
				-decorator==5.1.1
			
 
				-distro==1.9.0
			
 
				-elastic-transport==8.13.0
			
 
				-elasticsearch==8.13.0
			
 
				-exceptiongroup==1.2.0
			
 
				-Flask==3.0.3
			
 
				-Flask-APScheduler==1.12.4
			
 
				-Flask-Login==0.6.2
			
 
				-Flask-Mail==0.9.1
			
 
				-flask-marshmallow==0.15.0
			
 
				-Flask-Migrate==4.0.4
			
 
				-Flask-Reuploaded==1.3.0
			
 
				-Flask-Session==0.5.0
			
 
				-Flask-SQLAlchemy==3.1.1
			
 
				-Flask-WTF==1.2.1
			
 
				-frozenlist==1.4.1
			
 
				-greenlet==2.0.2
			
 
				-h11==0.14.0
			
 
				-h2==4.1.0
			
 
				-hpack==4.0.0
			
 
				-httpcore==1.0.4
			
 
				-httpx==0.27.0
			
 
				-Hypercorn==0.16.0
			
 
				-hyperframe==6.0.1
			
 
				-idna==3.6
			
 
				-importlib-metadata==6.8.0
			
 
				-importlib_resources==6.1.2
			
 
				-itsdangerous==2.1.2
			
 
				-Jinja2==3.1.2
			
 
				-jmespath==0.10.0
			
 
				-Mako==1.2.4
			
 
				-MarkupSafe==2.1.3
			
 
				-marshmallow==3.20.1
			
 
				-marshmallow-sqlalchemy==0.29.0
			
 
				-mq-http-sdk==1.0.3
			
 
				-multidict==6.0.5
			
 
				-mypy-extensions==1.0.0
			
 
				-numpy==1.24.4
			
 
				-odps==3.5.1
			
 
				-openai==1.21.2
			
 
				-oss2==2.18.4
			
 
				-packaging==23.1
			
 
				-pandas==2.0.3
			
 
				-pathspec==0.12.1
			
 
				-Pillow==10.0.0
			
 
				-platformdirs==4.2.0
			
 
				-priority==2.0.0
			
 
				-protobuf==3.20.3
			
 
				-psutil==5.9.5
			
 
				-pyarrow==15.0.2
			
 
				-pycparser==2.21
			
 
				-pycryptodome==3.20.0
			
 
				-pydantic==2.6.4
			
 
				-pydantic_core==2.16.3
			
 
				-PyMySQL==1.1.0
			
 
				-pyodps==0.11.6
			
 
				-python-dateutil==2.8.2
			
 
				-pytz==2023.3
			
 
				-Quart==0.19.5
			
 
				-regex==2024.4.16
			
 
				-requests==2.31.0
			
 
				-schedule==1.2.1
			
 
				-six==1.16.0
			
 
				-sniffio==1.3.1
			
 
				-SQLAlchemy==2.0.21
			
 
				-style==1.1.0
			
 
				-taskgroup==0.0.0a4
			
 
				-tomli==2.0.1
			
 
				-tqdm==4.66.2
			
 
				-typing_extensions==4.7.1
			
 
				-tzdata==2023.3
			
 
				-tzlocal==5.0.1
			
 
				-update==0.0.1
			
 
				-urllib3==2.2.1
			
 
				-validators==0.20.0
			
 
				-Werkzeug==3.0.2
			
 
				-wsproto==1.2.0
			
 
				-WTForms==3.1.2
			
 
				-yarl==1.9.4
			
 
				-zipp==3.16.2
			
 
				-
			
 
				-lxml~=5.2.1
			
 
				+aiofiles
			
 
				+aiohttp~=3.10.4
			
 
				+aliyun-log-python-sdk
			
 
				+aliyun-python-sdk-core
			
 
				+aliyun-python-sdk-kms
			
 
				+quart~=0.19.6
			
 
				+requests~=2.32.3
			
 
				+tqdm~=4.66.5
			
 
				+pymysql~=1.1.1
			
 
				+pyapollos~=0.1.5
			
 
				 aiomysql~=0.2.0
			
--- a/server/api/__init__.py
+++ b/server/api/__init__.py
@@ -0,0 +1,7 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+"""
			
 
				+from .get_off_videos import GetOffVideos
			
 
				+from .minigram import Minigram
			
 
				+from .response import Response
			
 
				+from .record import Record
			
--- a/server/api/get_off_videos.py
+++ b/server/api/get_off_videos.py
@@ -0,0 +1,78 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+"""
			
 
				+import json
			
 
				+import time
			
 
				+
			
 
				+
			
 
				+class GetOffVideos(object):
			
 
				+    """
			
 
				+    下架视频
			
 
				+    """
			
 
				+
			
 
				+    def __init__(self, params, mysql_client, config):
			
 
				+        self.params = params
			
 
				+        self.mysql_client = mysql_client
			
 
				+        self.articles_video = config.articleVideos
			
 
				+        self.trace_id = None
			
 
				+
			
 
				+    def checkParams(self):
			
 
				+        """
			
 
				+
			
 
				+        :return:
			
 
				+        """
			
 
				+        try:
			
 
				+            self.trace_id = self.params['traceId']
			
 
				+            return None
			
 
				+        except Exception as e:
			
 
				+            response = {
			
 
				+                "error": "params error",
			
 
				+                "info": str(e),
			
 
				+                "data": self.params
			
 
				+            }
			
 
				+            return response
			
 
				+
			
 
				+    async def pushVideoIntoQueue(self):
			
 
				+        """
			
 
				+        将视频id记录到待下架表中
			
 
				+        :return:
			
 
				+        """
			
 
				+        select_sql = f"""
			
 
				+        select response from {self.articles_video} where trace_id = '{self.trace_id}';
			
 
				+        """
			
 
				+        result = await self.mysql_client.asyncSelect(sql=select_sql)
			
 
				+        if result:
			
 
				+            video_list = json.loads(result[0][0])
			
 
				+            for video in video_list:
			
 
				+                video_id = video['videoId']
			
 
				+                try:
			
 
				+                    update_sql = f"""
			
 
				+                    INSERT INTO get_off_videos
			
 
				+                    (video_id, publish_time, video_status, trace_id)
			
 
				+                    values 
			
 
				+                    (%s, %s, %s, %s);
			
 
				+                    """
			
 
				+                    await self.mysql_client.asyncInsert(
			
 
				+                        sql=update_sql,
			
 
				+                        params=(video_id, int(time.time()), 1, self.trace_id)
			
 
				+                    )
			
 
				+                except Exception as e:
			
 
				+                    print(e)
			
 
				+        else:
			
 
				+            print("该 trace_id不存在")
			
 
				+
			
 
				+    async def deal(self):
			
 
				+        """
			
 
				+
			
 
				+        :return:
			
 
				+        """
			
 
				+        params_error = self.checkParams()
			
 
				+        if params_error:
			
 
				+            return params_error
			
 
				+        else:
			
 
				+            await self.pushVideoIntoQueue()
			
 
				+            response = {
			
 
				+                "status": "success",
			
 
				+                "traceId": self.trace_id
			
 
				+            }
			
 
				+            return response
			
--- a/server/api/minigram.py
+++ b/server/api/minigram.py
@@ -0,0 +1,110 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+"""
			
 
				+minigram_map = {
			
 
				+    1: {
			
 
				+        # 25: {
			
 
				+        #     "avatar": "https://rescdn.yishihui.com/0temp/ttmhzfsh.png",
			
 
				+        #     "id": "wx0b7d95eb293b783b",
			
 
				+        #     "name": "天天美好祝福生活",
			
 
				+        #     "index": 25
			
 
				+        # },
			
 
				+        25: {
			
 
				+                "avatar": "https://rescdn.yishihui.com/0temp/pqsp.png",
			
 
				+                "id": "wxbdd2a2e93d9a6e25",
			
 
				+                "name": "票圈视频",
			
 
				+                "index": 25
			
 
				+            },
			
 
				+        29: {
			
 
				+            "avatar": "https://rescdn.yishihui.com/0temp/cyfyld.png",
			
 
				+            "id": "wx65c76bb4c67934db",
			
 
				+            "name": "财运福运来到",
			
 
				+            "index": 29
			
 
				+        },
			
 
				+        31: {
			
 
				+            "avatar": "https://rescdn.yishihui.com/0temp/mhzfshxf2.png",
			
 
				+            "id": "wx2e4478b1641b3b15",
			
 
				+            "name": "美好祝福生活幸福",
			
 
				+            "index": 31
			
 
				+        }
			
 
				+    },
			
 
				+    2: {
			
 
				+        36: {
			
 
				+            "avatar": "https://rescdn.yishihui.com/0temp/zfyfyc.jpeg",
			
 
				+            "id": "wxcddf231abd0dabdc",
			
 
				+            "name": "祝福有福有财",
			
 
				+            "index": 36
			
 
				+        },
			
 
				+        33: {
			
 
				+            "avatar": "https://rescdn.yishihui.com/0temp/pqsp.png",
			
 
				+            "id": "wxbdd2a2e93d9a6e25",
			
 
				+            "name": "票圈视频",
			
 
				+            "index": 33
			
 
				+            }
			
 
				+    },
			
 
				+    3: {
			
 
				+        27: {
			
 
				+            "avatar": "https://rescdn.yishihui.com/0temp/xymhfqdd.png",
			
 
				+            "id": "wx7187c217efef24a7",
			
 
				+            "name": "幸运美好福气多多",
			
 
				+            "index": 27
			
 
				+        }
			
 
				+    }
			
 
				+}
			
 
				+
			
 
				+
			
 
				+class Minigram(object):
			
 
				+    """
			
 
				+    小程序卡片
			
 
				+    """
			
 
				+
			
 
				+    def __init__(self, params):
			
 
				+        self.params = params
			
 
				+        self.business_type = None
			
 
				+        self.mini_code = None
			
 
				+        self.trace_id = None
			
 
				+
			
 
				+    def check_params(self):
			
 
				+        """
			
 
				+        校验参数
			
 
				+        :return:
			
 
				+        """
			
 
				+        try:
			
 
				+            self.business_type = self.params['businessType']
			
 
				+            self.mini_code = self.params['miniCode']
			
 
				+            self.trace_id = self.params['traceId']
			
 
				+            return None
			
 
				+        except Exception as e:
			
 
				+            response = {
			
 
				+                "status": "fail",
			
 
				+                "code": 1,
			
 
				+                "message": str(e),
			
 
				+                "info": "params check error"
			
 
				+            }
			
 
				+            return response
			
 
				+
			
 
				+    def choose_minigram(self):
			
 
				+        """
			
 
				+        分配小程序卡片
			
 
				+        :return:
			
 
				+        """
			
 
				+        try:
			
 
				+            minigram = minigram_map.get(self.business_type).get(self.mini_code)
			
 
				+            response = {
			
 
				+                "programAvatar": minigram['avatar'],
			
 
				+                "programId": minigram['id'],
			
 
				+                "programName": minigram['name'],
			
 
				+                "trace_id": self.trace_id
			
 
				+            }
			
 
				+        except Exception as e:
			
 
				+            response = {
			
 
				+                "error": "invalid params",
			
 
				+                "msg": str(e)
			
 
				+            }
			
 
				+        return response
			
 
				+
			
 
				+    async def deal(self):
			
 
				+        """
			
 
				+        :return:
			
 
				+        """
			
 
				+        return self.check_params() if self.check_params() else self.choose_minigram()
			
--- a/server/api/record.py
+++ b/server/api/record.py
@@ -0,0 +1,129 @@
 
				+import time
			
 
				+
			
 
				+from uuid import uuid4
			
 
				+
			
 
				+from applications.functions.log import logging
			
 
				+
			
 
				+
			
 
				+class Record(object):
			
 
				+    """
			
 
				+    搜索接口处理逻辑
			
 
				+    """
			
 
				+
			
 
				+    def __init__(self, params, mysql_client, config):
			
 
				+        self.flow_pool_level = None
			
 
				+        self.content_id = None
			
 
				+        self.account_name = None
			
 
				+        self.contents = None
			
 
				+        self.title = None
			
 
				+        self.gh_id = None
			
 
				+        self.params = params
			
 
				+        self.mysql_client = mysql_client
			
 
				+        self.article_videos = config.articleVideos
			
 
				+        self.article_text = config.articleText
			
 
				+        self.trace_id = "search-{}-{}".format(str(uuid4()), str(int(time.time())))
			
 
				+
			
 
				+    def checkParams(self):
			
 
				+        """
			
 
				+        检查请求params
			
 
				+        :return:
			
 
				+        """
			
 
				+        try:
			
 
				+            self.gh_id = self.params['ghId']
			
 
				+            self.title = self.params['title'].split("@@")[-1].replace("'", "")
			
 
				+            self.contents = self.params['content'].replace("'", "")
			
 
				+            self.account_name = self.params['accountName'].replace("'", "")
			
 
				+            self.content_id = self.params['articleId']
			
 
				+            self.flow_pool_level = self.params['flowPoolLevelTag']
			
 
				+            logging(
			
 
				+                code="1001",
			
 
				+                info="搜索视频内容接口请求成功, 参数校验成功",
			
 
				+                port="title_to_search",
			
 
				+                trace_id=self.trace_id,
			
 
				+                data=self.params
			
 
				+            )
			
 
				+            return None
			
 
				+        except Exception as e:
			
 
				+            result = {
			
 
				+                "status": "fail",
			
 
				+                "code": 1,
			
 
				+                "message": str(e),
			
 
				+                "info": "params check error"
			
 
				+            }
			
 
				+            logging(
			
 
				+                code="4001",
			
 
				+                info="搜索视频内容接口请求成功, 参数校验失败",
			
 
				+                port="title_to_search",
			
 
				+                trace_id=self.trace_id,
			
 
				+                data=self.params
			
 
				+            )
			
 
				+            return result
			
 
				+
			
 
				+    async def inputIntoArticleVideos(self):
			
 
				+        """
			
 
				+        把数据插入待处理队列
			
 
				+        :return:
			
 
				+        """
			
 
				+        request_time = int(time.time())
			
 
				+        insert_sql = f"""
			
 
				+            INSERT INTO {self.article_videos}
			
 
				+                (trace_id, content_id, flow_pool_level, gh_id, account_name, request_timestamp)
			
 
				+            VALUES 
			
 
				+                (%s, %s, %s, %s, %s, %s);
			
 
				+            """
			
 
				+        await self.mysql_client.asyncInsert(
			
 
				+            sql=insert_sql,
			
 
				+            params=(
			
 
				+                self.trace_id,
			
 
				+                self.content_id,
			
 
				+                self.flow_pool_level,
			
 
				+                self.gh_id,
			
 
				+                self.account_name,
			
 
				+                request_time
			
 
				+            )
			
 
				+        )
			
 
				+        logging(
			
 
				+            code="1002",
			
 
				+            info="成功记录请求数据到mysql中",
			
 
				+            trace_id=self.trace_id
			
 
				+        )
			
 
				+
			
 
				+    async def inputIntoArticleText(self):
			
 
				+        """
			
 
				+
			
 
				+        :return:
			
 
				+        """
			
 
				+        insert_sql = f"""
			
 
				+        INSERT INTO {self.article_text} (content_id, article_title, article_text)
			
 
				+        values (%s, %s, %s);
			
 
				+        """
			
 
				+        try:
			
 
				+            await self.mysql_client.asyncInsert(
			
 
				+                sql=insert_sql,
			
 
				+                params=(
			
 
				+                    self.content_id,
			
 
				+                    self.title,
			
 
				+                    self.contents
			
 
				+                )
			
 
				+            )
			
 
				+        except Exception as e:
			
 
				+            print(e)
			
 
				+
			
 
				+    async def deal(self):
			
 
				+        """
			
 
				+        deal
			
 
				+        :return:
			
 
				+        """
			
 
				+        params_error = self.checkParams()
			
 
				+        if params_error:
			
 
				+            return params_error
			
 
				+        else:
			
 
				+            # 记录数据
			
 
				+            await self.inputIntoArticleVideos()
			
 
				+            await self.inputIntoArticleText()
			
 
				+            res = {
			
 
				+                "status": "success input to article queue",
			
 
				+                "code": 0,
			
 
				+                "traceId": self.trace_id
			
 
				+            }
			
 
				+            return res
			
--- a/server/api/response.py
+++ b/server/api/response.py
@@ -0,0 +1,242 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+"""
			
 
				+import json
			
 
				+import uuid
			
 
				+import time
			
 
				+import random
			
 
				+import hashlib
			
 
				+import urllib.parse
			
 
				+
			
 
				+from applications.functions.log import logging
			
 
				+
			
 
				+
			
 
				+class Response(object):
			
 
				+    """
			
 
				+    Response
			
 
				+    """
			
 
				+
			
 
				+    def __init__(self, params, mysql_client, config):
			
 
				+        """
			
 
				+        Response 接口
			
 
				+        """
			
 
				+        self.trace_id = None
			
 
				+        self.mini_program_type = None
			
 
				+        self.mysql_client = mysql_client
			
 
				+        self.params = params
			
 
				+        self.article_videos = config.articleVideos
			
 
				+        self.mini_map = json.loads(config.getConfigValue("miniMap"))
			
 
				+
			
 
				+    def checkParams(self):
			
 
				+        """
			
 
				+        请求参数校验
			
 
				+        :return:
			
 
				+        """
			
 
				+        try:
			
 
				+            self.mini_program_type = self.params['miniprogramUseType']
			
 
				+            self.trace_id = self.params['traceId']
			
 
				+            return None
			
 
				+        except Exception as e:
			
 
				+            return {
			
 
				+                "error": "params error",
			
 
				+                "msg": str(e),
			
 
				+                "info": self.params
			
 
				+            }
			
 
				+
			
 
				+    async def getVideosResult(self):
			
 
				+        """
			
 
				+        获取结果
			
 
				+        :return:
			
 
				+        """
			
 
				+        select_sql = f"""
			
 
				+        SELECT gh_id, content_status, response, process_times
			
 
				+        FROM {self.article_videos}
			
 
				+        WHERE trace_id = '{self.trace_id}';
			
 
				+        """
			
 
				+        info_tuple = await self.mysql_client.asyncSelect(select_sql)
			
 
				+        gh_id, content_status, response, process_times = info_tuple[0]
			
 
				+        return {
			
 
				+            "ghId": gh_id,
			
 
				+            "contentStatus": content_status,
			
 
				+            "response": json.loads(response),
			
 
				+            "processTimes": process_times
			
 
				+        }
			
 
				+
			
 
				+    def createGzhPath(self, video_id, shared_uid, gh_id):
			
 
				+        """
			
 
				+        :param gh_id: 公众号账号的gh_id
			
 
				+        :param video_id: 视频 id
			
 
				+        :param shared_uid: 分享 id
			
 
				+        """
			
 
				+
			
 
				+        def generate_source_id():
			
 
				+            """
			
 
				+            generate_source_id
			
 
				+            :return:
			
 
				+            """
			
 
				+            timestamp = str(int(time.time() * 1000))
			
 
				+            random_str = str(random.randint(1000, 9999))
			
 
				+            hash_input = f"{timestamp}-{random_str}"
			
 
				+            return hashlib.md5(hash_input.encode()).hexdigest()
			
 
				+
			
 
				+        root_share_id = str(uuid.uuid4())
			
 
				+        if self.mini_program_type == 2:
			
 
				+            source_id = (
			
 
				+                    "touliu_tencentGzhArticle_{}_".format(gh_id) + generate_source_id()
			
 
				+            )
			
 
				+        elif self.mini_program_type == 1:
			
 
				+            source_id = "longArticles_" + generate_source_id()
			
 
				+        elif self.mini_program_type == 3:
			
 
				+            source_id = "WeCom_" + generate_source_id()
			
 
				+        else:
			
 
				+            source_id = "Error mini_program_type {}".format(self.mini_program_type)
			
 
				+        url = f"pages/user-videos?id={video_id}&su={shared_uid}&fromGzh=1&rootShareId={root_share_id}&shareId={root_share_id}&rootSourceId={source_id}"
			
 
				+        # 自动把 root_share_id 加入到白名单
			
 
				+        # auto_white(root_share_id)
			
 
				+        return (
			
 
				+            root_share_id,
			
 
				+            source_id,
			
 
				+            f"pages/category?jumpPage={urllib.parse.quote(url, safe='')}",
			
 
				+        )
			
 
				+
			
 
				+    async def generateCard(self, index, gh_id, mini_id, item):
			
 
				+        """
			
 
				+        生成单个分享卡片
			
 
				+        :param item: 单个视频结果
			
 
				+        :param mini_id:  小程序 appType
			
 
				+        :param gh_id: 公众号 id
			
 
				+        :param index: 视频位置
			
 
				+        :return:
			
 
				+        """
			
 
				+        str_mini_id = str(mini_id)
			
 
				+        mini_info = self.mini_map[str_mini_id]
			
 
				+        avatar, app_id, app_name = mini_info['avatar'], mini_info['id'], mini_info['name']
			
 
				+        root_share_id, root_source_id, production_path = self.createGzhPath(
			
 
				+            video_id=item['videoId'],
			
 
				+            shared_uid=item['uid'],
			
 
				+            gh_id=gh_id
			
 
				+        )
			
 
				+        logging(
			
 
				+            code="1002",
			
 
				+            info="root_share_id --{}, productionPath -- {}".format(
			
 
				+                root_share_id, production_path
			
 
				+            ),
			
 
				+            function="process",
			
 
				+            trace_id=self.trace_id,
			
 
				+        )
			
 
				+        result = {
			
 
				+            "productionCover": item['videoCover'],
			
 
				+            "productionName": item['kimiTitle'],
			
 
				+            "programAvatar": avatar,
			
 
				+            "programId": app_id,
			
 
				+            "programName": app_name,
			
 
				+            "source": item['source'],
			
 
				+            "rootShareId": root_share_id,
			
 
				+            "productionPath": production_path,
			
 
				+            "videoUrl": item['videoPath'],
			
 
				+            "mini_id": mini_id,
			
 
				+            "paragraphPosition": index * 0.25
			
 
				+        }
			
 
				+        if index == 1:
			
 
				+            result['paragraphPosition'] = 0.01
			
 
				+        item['rootSourceId'] = root_source_id
			
 
				+        return result, item
			
 
				+
			
 
				+    async def generateCards(self, result):
			
 
				+        """
			
 
				+        生成返回卡片
			
 
				+        :return:
			
 
				+        """
			
 
				+        gh_id = result['ghId']
			
 
				+        response = result['response']
			
 
				+        match self.mini_program_type:
			
 
				+            case 1:
			
 
				+                L = []
			
 
				+                new_item_list = []
			
 
				+                for index, item in enumerate(response, 1):
			
 
				+                    random_num = random.randint(1, 10)
			
 
				+                    if random_num in [1, 2, 3, 4, 5, 6]:
			
 
				+                        mini_id = 25
			
 
				+                    elif random_num in [7, 8]:
			
 
				+                        mini_id = 29
			
 
				+                    else:
			
 
				+                        mini_id = 31
			
 
				+                    card, new_item = await self.generateCard(index, gh_id, mini_id, item)
			
 
				+                    L.append(card)
			
 
				+                    new_item_list.append(new_item)
			
 
				+                return L, new_item_list
			
 
				+            case 2:
			
 
				+                L = []
			
 
				+                new_item_list = []
			
 
				+                for index, item in enumerate(response, 1):
			
 
				+                    card, new_item = await self.generateCard(index, gh_id, 33, item)
			
 
				+                    L.append(card)
			
 
				+                    new_item_list.append(new_item)
			
 
				+                return L, new_item_list
			
 
				+            case 3:
			
 
				+                L = []
			
 
				+                new_item_list = []
			
 
				+                for index, item in enumerate(response, 1):
			
 
				+                    card, new_item = await self.generateCard(index, gh_id, 27, item)
			
 
				+                    L.append(card)
			
 
				+                    new_item_list.append(card)
			
 
				+                return L, new_item_list
			
 
				+
			
 
				+    async def job(self):
			
 
				+        """
			
 
				+        执行方法
			
 
				+        :return:
			
 
				+        """
			
 
				+        response = await self.getVideosResult()
			
 
				+        status_code = response.get('contentStatus')
			
 
				+        process_times = response.get('processTimes')
			
 
				+        match status_code:
			
 
				+            case 0:
			
 
				+                if process_times > 3:
			
 
				+                    result = {
			
 
				+                        "traceId": self.trace_id,
			
 
				+                        "code": 0,
			
 
				+                        "error": "匹配失败，处理超过 3 次"
			
 
				+                    }
			
 
				+                else:
			
 
				+                    result = {
			
 
				+                        "traceId": self.trace_id,
			
 
				+                        "code": 0,
			
 
				+                        "Message": "该请求还没处理"
			
 
				+                    }
			
 
				+                return result
			
 
				+            case 1:
			
 
				+                return {
			
 
				+                    "traceId": self.trace_id,
			
 
				+                    "code": 1,
			
 
				+                    "Message": "该请求正在处理中"
			
 
				+                }
			
 
				+            case 2:
			
 
				+                card_list, new_items = await self.generateCards(result=response)
			
 
				+                update_sql = f"""
			
 
				+                UPDATE {self.article_videos}
			
 
				+                SET response = %s, success_status = %s
			
 
				+                WHERE trace_id = %s;
			
 
				+                """
			
 
				+                await self.mysql_client.asyncInsert(
			
 
				+                    sql=update_sql,
			
 
				+                    params=(json.dumps(new_items, ensure_ascii=False), 1, self.trace_id)
			
 
				+                )
			
 
				+                return {"traceId": self.trace_id, "miniprogramList": card_list}
			
 
				+            case 3:
			
 
				+                return {
			
 
				+                    "traceId": self.trace_id,
			
 
				+                    "code": 3,
			
 
				+                    "error": "匹配失败，超过三次"
			
 
				+                }
			
 
				+
			
 
				+    async def deal(self):
			
 
				+        """
			
 
				+        api process starts from here
			
 
				+        :return:
			
 
				+        """
			
 
				+        params_error = self.checkParams()
			
 
				+        if params_error:
			
 
				+            return params_error
			
 
				+        else:
			
 
				+            return await self.job()
			
--- a/applications/routes.py
+++ b/applications/routes.py
@@ -3,12 +3,12 @@
 
				 """
			
 
				 from quart import Blueprint, jsonify, request
			
 
				 
			
 
				-from applications.deal import Response, Record, Minigram, GetOffVideos
			
 
				+from server.api import Response, Record, Minigram, GetOffVideos
			
 
				 
			
 
				-my_blueprint = Blueprint('LongArticles', __name__)
			
 
				+my_blueprint = Blueprint('LongArticlesMatchServer', __name__)
			
 
				 
			
 
				 
			
 
				-def Routes(mysql_client):
			
 
				+def Routes(mysql_client, config):
			
 
				     """
			
 
				     路由代码
			
 
				     """
			
@@ -24,11 +24,11 @@ def Routes(mysql_client):
 
				     @my_blueprint.route('/search_videos', methods=['POST'])
			
 
				     async def search_videos_from_the_web():
			
 
				         """
			
 
				-        从web 搜索视频并且存储到票圈的视频库中
			
 
				+        record Data
			
 
				         :return:
			
 
				         """
			
 
				         params = await request.get_json()
			
 
				-        SD = Record(params=params, mysql_client=mysql_client)
			
 
				+        SD = Record(params=params, mysql_client=mysql_client, config=config)
			
 
				         result = await SD.deal()
			
 
				         return jsonify(result)
			
 
				 
			
@@ -39,9 +39,11 @@ def Routes(mysql_client):
 
				         :return:
			
 
				         """
			
 
				         data = await request.get_json()
			
 
				-        trace_id = data['traceId']
			
 
				-        minigram_type = data['miniprogramUseType']
			
 
				-        RD = Response(trace_id=trace_id, mini_program_type=minigram_type, mysql_client=mysql_client)
			
 
				+        RD = Response(
			
 
				+            params=data,
			
 
				+            mysql_client=mysql_client,
			
 
				+            config=config
			
 
				+        )
			
 
				         response = await RD.deal()
			
 
				         return jsonify(response)
			
 
				 
			
@@ -63,7 +65,7 @@ def Routes(mysql_client):
 
				         :return:
			
 
				         """
			
 
				         data = await request.get_json()
			
 
				-        GOV = GetOffVideos(params=data, mysql_client=mysql_client)
			
 
				+        GOV = GetOffVideos(params=data, mysql_client=mysql_client, config=config)
			
 
				         response = await GOV.deal()
			
 
				         return jsonify(response)
			
 
				 
			
--- a/spiderTask.py
+++ b/spiderTask.py
@@ -0,0 +1,29 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+"""
			
 
				+import time
			
 
				+import datetime
			
 
				+import asyncio
			
 
				+
			
 
				+from tasks.spider_task import spiderTask
			
 
				+from applications.db import TaskMySQLClient
			
 
				+
			
 
				+
			
 
				+async def main():
			
 
				+    """
			
 
				+    main job
			
 
				+    :return:
			
 
				+    """
			
 
				+    TMC = TaskMySQLClient()
			
 
				+    await TMC.init_pool()
			
 
				+    PD = spiderTask(TMC)
			
 
				+    await PD.deal()
			
 
				+
			
 
				+
			
 
				+if __name__ == '__main__':
			
 
				+    while True:
			
 
				+        asyncio.run(main())
			
 
				+        now_str = datetime.datetime.now().__str__()
			
 
				+        print("{}    请求执行完成， 等待60s".format(now_str))
			
 
				+        time.sleep(60)
			
 
				+
			
--- a/static/config.py
+++ b/static/config.py
@@ -1,993 +0,0 @@
 
				-"""
			
 
				-@author: luojunhui
			
 
				-"""
			
 
				-
			
 
				-gh_id_dict = {
			
 
				-    "gh_008ef23062ee": {
			
 
				-        "uid": 71582074,
			
 
				-        "nick_name": "北至"
			
 
				-    },
			
 
				-    "gh_01a417472fdd": {
			
 
				-        "uid": 72459350,
			
 
				-        "nick_name": "婪"
			
 
				-    },
			
 
				-    "gh_01f8afd03366": {
			
 
				-        "uid": 69637520,
			
 
				-        "nick_name": "非亲非故"
			
 
				-    },
			
 
				-    "gh_036ab9bb685a": {
			
 
				-        "uid": 72088957,
			
 
				-        "nick_name": "不知春秋"
			
 
				-    },
			
 
				-    "gh_0394dd7e37e2": {
			
 
				-        "uid": 73723034,
			
 
				-        "nick_name": "上瘾"
			
 
				-    },
			
 
				-    "gh_03d32e83122f": {
			
 
				-        "uid": 71881045,
			
 
				-        "nick_name": "安抚"
			
 
				-    },
			
 
				-    "gh_03d45c260115": {
			
 
				-        "uid": 72385751,
			
 
				-        "nick_name": "少女提到战情场"
			
 
				-    },
			
 
				-    "gh_058e41145a0c": {
			
 
				-        "uid": 69637476,
			
 
				-        "nick_name": "甜腻梦话"
			
 
				-    },
			
 
				-    "gh_080bb43aa0dc": {
			
 
				-        "uid": 70731106,
			
 
				-        "nick_name": "那一树的嫣红"
			
 
				-    },
			
 
				-    "gh_084a485e859a": {
			
 
				-        "uid": 69637472,
			
 
				-        "nick_name": "梦星月"
			
 
				-    },
			
 
				-    "gh_0921c03402cd": {
			
 
				-        "uid": 69637531,
			
 
				-        "nick_name": "你的女友"
			
 
				-    },
			
 
				-    "gh_0b29b081f237": {
			
 
				-        "uid": 72088986,
			
 
				-        "nick_name": "顾然"
			
 
				-    },
			
 
				-    "gh_0bedf49a6a7e": {
			
 
				-        "uid": 72088983,
			
 
				-        "nick_name": "少女酒馆"
			
 
				-    },
			
 
				-    "gh_0c89e11f8bf3": {
			
 
				-        "uid": 69637508,
			
 
				-        "nick_name": "粟米"
			
 
				-    },
			
 
				-    "gh_0d8a65926cdf": {
			
 
				-        "uid": 71353811,
			
 
				-        "nick_name": "寻歡猫"
			
 
				-    },
			
 
				-    "gh_0dea45f2342a": {
			
 
				-        "uid": 72088958,
			
 
				-        "nick_name": "抚琴浅唱入君心"
			
 
				-    },
			
 
				-    "gh_0e4fd9e88386": {
			
 
				-        "uid": 71881046,
			
 
				-        "nick_name": "白玖逸"
			
 
				-    },
			
 
				-    "gh_156c66ac3e37": {
			
 
				-        "uid": 73858591,
			
 
				-        "nick_name": "微醉阳光"
			
 
				-    },
			
 
				-    "gh_1686250f15b6": {
			
 
				-        "uid": 72385753,
			
 
				-        "nick_name": "遥西江月"
			
 
				-    },
			
 
				-    "gh_171cec079b2a": {
			
 
				-        "uid": 69637501,
			
 
				-        "nick_name": "海上"
			
 
				-    },
			
 
				-    "gh_183d80deffb8": {
			
 
				-        "uid": 69637491,
			
 
				-        "nick_name": "论趣"
			
 
				-    },
			
 
				-    "gh_18e87b85e90c": {
			
 
				-        "uid": 72459372,
			
 
				-        "nick_name": "想你成瘾"
			
 
				-    },
			
 
				-    "gh_192c9cf58b13": {
			
 
				-        "uid": 70731102,
			
 
				-        "nick_name": "久亿"
			
 
				-    },
			
 
				-    "gh_199f74839fb3": {
			
 
				-        "uid": 72770994,
			
 
				-        "nick_name": "殇"
			
 
				-    },
			
 
				-    "gh_19daa341c8f9": {
			
 
				-        "uid": 71353816,
			
 
				-        "nick_name": "美"
			
 
				-    },
			
 
				-    "gh_1b27dd1beeca": {
			
 
				-        "uid": 71021080,
			
 
				-        "nick_name": "聚散常迷"
			
 
				-    },
			
 
				-    "gh_1c7e15e6ac9e": {
			
 
				-        "uid": 72088971,
			
 
				-        "nick_name": "我在等你"
			
 
				-    },
			
 
				-    "gh_1d10403eb554": {
			
 
				-        "uid": 71353815,
			
 
				-        "nick_name": "听闻那年"
			
 
				-    },
			
 
				-    "gh_1d887d61088c": {
			
 
				-        "uid": 71021081,
			
 
				-        "nick_name": "明月不知沟渠心"
			
 
				-    },
			
 
				-    "gh_1e83780cc5a8": {
			
 
				-        "uid": 71353810,
			
 
				-        "nick_name": "眉眼"
			
 
				-    },
			
 
				-    "gh_1ee2e1b39ccf": {
			
 
				-        "uid": 69637473,
			
 
				-        "nick_name": "纵有疾风起"
			
 
				-    },
			
 
				-    "gh_2046389c46d3": {
			
 
				-        "uid": 72459359,
			
 
				-        "nick_name": "北街九命猫南巷七秒鱼"
			
 
				-    },
			
 
				-    "gh_2111a67800ba": {
			
 
				-        "uid": 74162341,
			
 
				-        "nick_name": "夜半呻吟"
			
 
				-    },
			
 
				-    "gh_234ef02cdee5": {
			
 
				-        "uid": 69637513,
			
 
				-        "nick_name": "夹逼"
			
 
				-    },
			
 
				-    "gh_2370907fc8d6": {
			
 
				-        "uid": 71051365,
			
 
				-        "nick_name": "吹长笛"
			
 
				-    },
			
 
				-    "gh_243829b5ff02": {
			
 
				-        "uid": 74162336,
			
 
				-        "nick_name": "难做"
			
 
				-    },
			
 
				-    "gh_24aa1e4bf177": {
			
 
				-        "uid": 71353820,
			
 
				-        "nick_name": "翁思"
			
 
				-    },
			
 
				-    "gh_25c925cf5d8a": {
			
 
				-        "uid": 74162347,
			
 
				-        "nick_name": "谦谦公子"
			
 
				-    },
			
 
				-    "gh_26a307578776": {
			
 
				-        "uid": 69637490,
			
 
				-        "nick_name": "最宝贝的宝贝"
			
 
				-    },
			
 
				-    "gh_29074b51f2b7": {
			
 
				-        "uid": 69637530,
			
 
				-        "nick_name": "沉舸"
			
 
				-    },
			
 
				-    "gh_291ec369f017": {
			
 
				-        "uid": 74162334,
			
 
				-        "nick_name": "执炬逆风"
			
 
				-    },
			
 
				-    "gh_2abee512312a": {
			
 
				-        "uid": 70731103,
			
 
				-        "nick_name": "舍我"
			
 
				-    },
			
 
				-    "gh_2b8c6aa035ae": {
			
 
				-        "uid": 69637470,
			
 
				-        "nick_name": "懶得取名"
			
 
				-    },
			
 
				-    "gh_2e0c4609839f": {
			
 
				-        "uid": 74162332,
			
 
				-        "nick_name": "神君"
			
 
				-    },
			
 
				-    "gh_2e615fa75ffb": {
			
 
				-        "uid": 72683739,
			
 
				-        "nick_name": "空巢老人家"
			
 
				-    },
			
 
				-    "gh_2fde0fd0ad79": {
			
 
				-        "uid": 74162335,
			
 
				-        "nick_name": "城之"
			
 
				-    },
			
 
				-    "gh_30816d8adb52": {
			
 
				-        "uid": 71616016,
			
 
				-        "nick_name": "鹤绝"
			
 
				-    },
			
 
				-    "gh_3365a6f8b17f": {
			
 
				-        "uid": 72459349,
			
 
				-        "nick_name": "最好不过明天见"
			
 
				-    },
			
 
				-    "gh_34318194fd0e": {
			
 
				-        "uid": 69637517,
			
 
				-        "nick_name": "徒四壁"
			
 
				-    },
			
 
				-    "gh_37b084e62f1c": {
			
 
				-        "uid": 72459374,
			
 
				-        "nick_name": "讨人厌"
			
 
				-    },
			
 
				-    "gh_3845af6945d0": {
			
 
				-        "uid": 69637545,
			
 
				-        "nick_name": "秋水娉婷"
			
 
				-    },
			
 
				-    "gh_39218d3a3ec1": {
			
 
				-        "uid": 74162342,
			
 
				-        "nick_name": "人生如梦"
			
 
				-    },
			
 
				-    "gh_3ac6d7208961": {
			
 
				-        "uid": 69637497,
			
 
				-        "nick_name": "小熊的少女梦"
			
 
				-    },
			
 
				-    "gh_3c7d38636846": {
			
 
				-        "uid": 69637519,
			
 
				-        "nick_name": "油腻腻"
			
 
				-    },
			
 
				-    "gh_3ce2fa1956ea": {
			
 
				-        "uid": 74162320,
			
 
				-        "nick_name": "疑心病"
			
 
				-    },
			
 
				-    "gh_3df10391639c": {
			
 
				-        "uid": 69637541,
			
 
				-        "nick_name": "六郎娇面"
			
 
				-    },
			
 
				-    "gh_3e91f0624545": {
			
 
				-        "uid": 71616018,
			
 
				-        "nick_name": "青衫故人"
			
 
				-    },
			
 
				-    "gh_3ed305b5817f": {
			
 
				-        "uid": 71021082,
			
 
				-        "nick_name": "醉色染红颜"
			
 
				-    },
			
 
				-    "gh_3f4e2c890272": {
			
 
				-        "uid": 73858595,
			
 
				-        "nick_name": "海棠"
			
 
				-    },
			
 
				-    "gh_40a0ad154478": {
			
 
				-        "uid": 69637516,
			
 
				-        "nick_name": "禁止"
			
 
				-    },
			
 
				-    "gh_40a2ead40083": {
			
 
				-        "uid": 72459348,
			
 
				-        "nick_name": "两袖"
			
 
				-    },
			
 
				-    "gh_40fa65a44aa1": {
			
 
				-        "uid": 72558479,
			
 
				-        "nick_name": "南七夏"
			
 
				-    },
			
 
				-    "gh_424c8eeabced": {
			
 
				-        "uid": 69637522,
			
 
				-        "nick_name": "认命"
			
 
				-    },
			
 
				-    "gh_44127c197525": {
			
 
				-        "uid": 74162321,
			
 
				-        "nick_name": "青昧"
			
 
				-    },
			
 
				-    "gh_442a2c336dd8": {
			
 
				-        "uid": 72459352,
			
 
				-        "nick_name": "彻夜"
			
 
				-    },
			
 
				-    "gh_4568b5a7e2fe": {
			
 
				-        "uid": 69637482,
			
 
				-        "nick_name": "香腮"
			
 
				-    },
			
 
				-    "gh_45beb952dc74": {
			
 
				-        "uid": 69637488,
			
 
				-        "nick_name": "毋庸"
			
 
				-    },
			
 
				-    "gh_46879953339f": {
			
 
				-        "uid": 73723019,
			
 
				-        "nick_name": "天生童真"
			
 
				-    },
			
 
				-    "gh_484de412b0ef": {
			
 
				-        "uid": 69637481,
			
 
				-        "nick_name": "婪"
			
 
				-    },
			
 
				-    "gh_4a05bb40ab9b": {
			
 
				-        "uid": 72459370,
			
 
				-        "nick_name": "忧欢"
			
 
				-    },
			
 
				-    "gh_4af3ce7f9a85": {
			
 
				-        "uid": 72459373,
			
 
				-        "nick_name": "相衬"
			
 
				-    },
			
 
				-    "gh_4c058673c07e": {
			
 
				-        "uid": 69637474,
			
 
				-        "nick_name": "影帝"
			
 
				-    },
			
 
				-    "gh_4c21daadd79f": {
			
 
				-        "uid": 74162330,
			
 
				-        "nick_name": "想被宠一次"
			
 
				-    },
			
 
				-    "gh_4f6bfd731ac8": {
			
 
				-        "uid": 74162328,
			
 
				-        "nick_name": "浅梦"
			
 
				-    },
			
 
				-    "gh_50a7969695f6": {
			
 
				-        "uid": 73723024,
			
 
				-        "nick_name": "日日思君"
			
 
				-    },
			
 
				-    "gh_50c78060c5f2": {
			
 
				-        "uid": 72088980,
			
 
				-        "nick_name": "在乎"
			
 
				-    },
			
 
				-    "gh_5198e38df4c0": {
			
 
				-        "uid": 74162331,
			
 
				-        "nick_name": "饮长风"
			
 
				-    },
			
 
				-    "gh_51e4ad40466d": {
			
 
				-        "uid": 71616015,
			
 
				-        "nick_name": "吃甜"
			
 
				-    },
			
 
				-    "gh_531881b6d1ad": {
			
 
				-        "uid": 74162346,
			
 
				-        "nick_name": "如同昨日"
			
 
				-    },
			
 
				-    "gh_538f78f9d3aa": {
			
 
				-        "uid": 69637478,
			
 
				-        "nick_name": "伤痕"
			
 
				-    },
			
 
				-    "gh_53cb7afbb2df": {
			
 
				-        "uid": 72459360,
			
 
				-        "nick_name": "卷子泛滥成灾"
			
 
				-    },
			
 
				-    "gh_55866e76fc28": {
			
 
				-        "uid": 74162343,
			
 
				-        "nick_name": "少走感情路"
			
 
				-    },
			
 
				-    "gh_56a6765df869": {
			
 
				-        "uid": 69637514,
			
 
				-        "nick_name": "风月"
			
 
				-    },
			
 
				-    "gh_56ca3dae948c": {
			
 
				-        "uid": 69637538,
			
 
				-        "nick_name": "留下太多回忆"
			
 
				-    },
			
 
				-    "gh_57573f01b2ee": {
			
 
				-        "uid": 71582075,
			
 
				-        "nick_name": "醉色染红颜"
			
 
				-    },
			
 
				-    "gh_5765f834684c": {
			
 
				-        "uid": 74162324,
			
 
				-        "nick_name": "一笑百媚生"
			
 
				-    },
			
 
				-    "gh_57c9e8babea7": {
			
 
				-        "uid": 72683735,
			
 
				-        "nick_name": "离去"
			
 
				-    },
			
 
				-    "gh_5887a9154605": {
			
 
				-        "uid": 71353814,
			
 
				-        "nick_name": "寄许"
			
 
				-    },
			
 
				-    "gh_58d75d978f31": {
			
 
				-        "uid": 72047581,
			
 
				-        "nick_name": "经历风雨"
			
 
				-    },
			
 
				-    "gh_58fa9df7733a": {
			
 
				-        "uid": 73858593,
			
 
				-        "nick_name": "一身宠爱"
			
 
				-    },
			
 
				-    "gh_59b9f8ef99a4": {
			
 
				-        "uid": 71051360,
			
 
				-        "nick_name": "小編最可愛"
			
 
				-    },
			
 
				-    "gh_5ae65db96cb7": {
			
 
				-        "uid": 70731108,
			
 
				-        "nick_name": "喘声娇息"
			
 
				-    },
			
 
				-    "gh_5c841d031d42": {
			
 
				-        "uid": 72459356,
			
 
				-        "nick_name": "香肩"
			
 
				-    },
			
 
				-    "gh_5d68fee2093f": {
			
 
				-        "uid": 72088974,
			
 
				-        "nick_name": "足够体面"
			
 
				-    },
			
 
				-    "gh_5e1464b76ff6": {
			
 
				-        "uid": 74162323,
			
 
				-        "nick_name": "不走为尽"
			
 
				-    },
			
 
				-    "gh_5e543853d8f0": {
			
 
				-        "uid": 69637543,
			
 
				-        "nick_name": "不知春秋"
			
 
				-    },
			
 
				-    "gh_5ff48e9fb9ef": {
			
 
				-        "uid": 69637494,
			
 
				-        "nick_name": "寻她找他"
			
 
				-    },
			
 
				-    "gh_6503fd75c35e": {
			
 
				-        "uid": 72459358,
			
 
				-        "nick_name": "一口甜"
			
 
				-    },
			
 
				-    "gh_660afe87b6fd": {
			
 
				-        "uid": 72385752,
			
 
				-        "nick_name": "青涩迷人"
			
 
				-    },
			
 
				-    "gh_671f460c856c": {
			
 
				-        "uid": 69637523,
			
 
				-        "nick_name": "绝不改悔"
			
 
				-    },
			
 
				-    "gh_67776b73f896": {
			
 
				-        "uid": 73723032,
			
 
				-        "nick_name": "风过长街"
			
 
				-    },
			
 
				-    "gh_68e7fdc09fe4": {
			
 
				-        "uid": 71371653,
			
 
				-        "nick_name": "红尘客"
			
 
				-    },
			
 
				-    "gh_69f4300b4cda": {
			
 
				-        "uid": 72459366,
			
 
				-        "nick_name": "仙气儿"
			
 
				-    },
			
 
				-    "gh_6b7c2a257263": {
			
 
				-        "uid": 69637528,
			
 
				-        "nick_name": "奶牙"
			
 
				-    },
			
 
				-    "gh_6cfd1132df94": {
			
 
				-        "uid": 70731104,
			
 
				-        "nick_name": "中指灵活"
			
 
				-    },
			
 
				-    "gh_6d205db62f04": {
			
 
				-        "uid": 69637509,
			
 
				-        "nick_name": "怕羞"
			
 
				-    },
			
 
				-    "gh_6d3aa9d13402": {
			
 
				-        "uid": 72683738,
			
 
				-        "nick_name": "四月的荒原"
			
 
				-    },
			
 
				-    "gh_6d9f36e3a7be": {
			
 
				-        "uid": 69637498,
			
 
				-        "nick_name": "望长安"
			
 
				-    },
			
 
				-    "gh_6da12d2660ba": {
			
 
				-        "uid": 72088985,
			
 
				-        "nick_name": "你妈biu"
			
 
				-    },
			
 
				-    "gh_6e75b9dcde6b": {
			
 
				-        "uid": 72770995,
			
 
				-        "nick_name": "宠儿"
			
 
				-    },
			
 
				-    "gh_6f5221bf1801": {
			
 
				-        "uid": 72459351,
			
 
				-        "nick_name": "顾词"
			
 
				-    },
			
 
				-    "gh_6ff82851890a": {
			
 
				-        "uid": 72088976,
			
 
				-        "nick_name": "世俗"
			
 
				-    },
			
 
				-    "gh_7208b813f16d": {
			
 
				-        "uid": 74162329,
			
 
				-        "nick_name": "数流年"
			
 
				-    },
			
 
				-    "gh_72bace6b3059": {
			
 
				-        "uid": 70731109,
			
 
				-        "nick_name": "万物生息"
			
 
				-    },
			
 
				-    "gh_73be0287bb94": {
			
 
				-        "uid": 69637537,
			
 
				-        "nick_name": "戏剧"
			
 
				-    },
			
 
				-    "gh_744cb16f6e16": {
			
 
				-        "uid": 69637505,
			
 
				-        "nick_name": "反駁"
			
 
				-    },
			
 
				-    "gh_749271f1ccd5": {
			
 
				-        "uid": 72125026,
			
 
				-        "nick_name": "天下第一"
			
 
				-    },
			
 
				-    "gh_759ace9d4567": {
			
 
				-        "uid": 71353812,
			
 
				-        "nick_name": "青丝与白猫"
			
 
				-    },
			
 
				-    "gh_77f36c109fb1": {
			
 
				-        "uid": 71569299,
			
 
				-        "nick_name": "轻盈"
			
 
				-    },
			
 
				-    "gh_78640efc49bf": {
			
 
				-        "uid": 73723020,
			
 
				-        "nick_name": "打更人"
			
 
				-    },
			
 
				-    "gh_789a40fe7935": {
			
 
				-        "uid": 71616017,
			
 
				-        "nick_name": "杀手也动情"
			
 
				-    },
			
 
				-    "gh_7adb9417f845": {
			
 
				-        "uid": 72088960,
			
 
				-        "nick_name": "南音雨阁"
			
 
				-    },
			
 
				-    "gh_7b4a5f86d68c": {
			
 
				-        "uid": 69637477,
			
 
				-        "nick_name": "我很想你"
			
 
				-    },
			
 
				-    "gh_7bca1c99aea0": {
			
 
				-        "uid": 69637511,
			
 
				-        "nick_name": "从小就很傲"
			
 
				-    },
			
 
				-    "gh_7c66e0dbd2cf": {
			
 
				-        "uid": 72125025,
			
 
				-        "nick_name": "烟波明灭"
			
 
				-    },
			
 
				-    "gh_7e5818b2dd83": {
			
 
				-        "uid": 69637532,
			
 
				-        "nick_name": "二八佳人"
			
 
				-    },
			
 
				-    "gh_7f5075624a50": {
			
 
				-        "uid": 70731113,
			
 
				-        "nick_name": "浮現"
			
 
				-    },
			
 
				-    "gh_845f84745a80": {
			
 
				-        "uid": 74162327,
			
 
				-        "nick_name": "可鄙"
			
 
				-    },
			
 
				-    "gh_87df74d068d5": {
			
 
				-        "uid": 72459347,
			
 
				-        "nick_name": "教养"
			
 
				-    },
			
 
				-    "gh_89d00dca4896": {
			
 
				-        "uid": 72088978,
			
 
				-        "nick_name": "知己"
			
 
				-    },
			
 
				-    "gh_89ef4798d3ea": {
			
 
				-        "uid": 69637533,
			
 
				-        "nick_name": "彼岸花"
			
 
				-    },
			
 
				-    "gh_8a783ca03d5e": {
			
 
				-        "uid": 72459353,
			
 
				-        "nick_name": "菁华浮梦"
			
 
				-    },
			
 
				-    "gh_8eaa863bc40e": {
			
 
				-        "uid": 71353813,
			
 
				-        "nick_name": "花费时间"
			
 
				-    },
			
 
				-    "gh_8f9bd3d100d3": {
			
 
				-        "uid": 72459357,
			
 
				-        "nick_name": "浮念"
			
 
				-    },
			
 
				-    "gh_901b0d722749": {
			
 
				-        "uid": 69637518,
			
 
				-        "nick_name": "深情不为我"
			
 
				-    },
			
 
				-    "gh_9161517e5676": {
			
 
				-        "uid": 69637495,
			
 
				-        "nick_name": "折磨"
			
 
				-    },
			
 
				-    "gh_91abdbc32d5f": {
			
 
				-        "uid": 71353822,
			
 
				-        "nick_name": "一往情深"
			
 
				-    },
			
 
				-    "gh_92da3c574f82": {
			
 
				-        "uid": 73723018,
			
 
				-        "nick_name": "蝶无需花恋"
			
 
				-    },
			
 
				-    "gh_93e00e187787": {
			
 
				-        "uid": 69637504,
			
 
				-        "nick_name": "理会"
			
 
				-    },
			
 
				-    "gh_947785cd2d97": {
			
 
				-        "uid": 73723022,
			
 
				-        "nick_name": "含笑"
			
 
				-    },
			
 
				-    "gh_949bf0195759": {
			
 
				-        "uid": 72088981,
			
 
				-        "nick_name": "解脱"
			
 
				-    },
			
 
				-    "gh_95ed5ecf9363": {
			
 
				-        "uid": 71881047,
			
 
				-        "nick_name": "路途"
			
 
				-    },
			
 
				-    "gh_969f5ea5fee1": {
			
 
				-        "uid": 71582077,
			
 
				-        "nick_name": "仁至义尽"
			
 
				-    },
			
 
				-    "gh_97034d655595": {
			
 
				-        "uid": 72459363,
			
 
				-        "nick_name": "萌懂"
			
 
				-    },
			
 
				-    "gh_970460d9ccec": {
			
 
				-        "uid": 71881048,
			
 
				-        "nick_name": "青丝"
			
 
				-    },
			
 
				-    "gh_9743cdc25c97": {
			
 
				-        "uid": 72459368,
			
 
				-        "nick_name": "一刀两断"
			
 
				-    },
			
 
				-    "gh_9782c8a85bce": {
			
 
				-        "uid": 72047582,
			
 
				-        "nick_name": "尢物少女"
			
 
				-    },
			
 
				-    "gh_9877c8541764": {
			
 
				-        "uid": 69637506,
			
 
				-        "nick_name": "我沿着悲伤"
			
 
				-    },
			
 
				-    "gh_98a84818284c": {
			
 
				-        "uid": 72088972,
			
 
				-        "nick_name": "就是昏君"
			
 
				-    },
			
 
				-    "gh_98ec0ffe69b3": {
			
 
				-        "uid": 72683736,
			
 
				-        "nick_name": "苦衷"
			
 
				-    },
			
 
				-    "gh_9904c57b243e": {
			
 
				-        "uid": 72088965,
			
 
				-        "nick_name": "意中人"
			
 
				-    },
			
 
				-    "gh_9a1e71e3460d": {
			
 
				-        "uid": 72459355,
			
 
				-        "nick_name": "多少画"
			
 
				-    },
			
 
				-    "gh_9cf3b7ff486b": {
			
 
				-        "uid": 69637492,
			
 
				-        "nick_name": "hoit"
			
 
				-    },
			
 
				-    "gh_9e559b3b94ca": {
			
 
				-        "uid": 69637471,
			
 
				-        "nick_name": "我与你相遇"
			
 
				-    },
			
 
				-    "gh_9ee24345c6ce": {
			
 
				-        "uid": 71353818,
			
 
				-        "nick_name": "爱隔山河"
			
 
				-    },
			
 
				-    "gh_9eef14ad6c16": {
			
 
				-        "uid": 70731110,
			
 
				-        "nick_name": "抱一抱"
			
 
				-    },
			
 
				-    "gh_9f8dc5b0c74e": {
			
 
				-        "uid": 69637496,
			
 
				-        "nick_name": "港口"
			
 
				-    },
			
 
				-    "gh_a172a6bf7dc5": {
			
 
				-        "uid": 72088963,
			
 
				-        "nick_name": "Thorns"
			
 
				-    },
			
 
				-    "gh_a182cfc94dad": {
			
 
				-        "uid": 69637539,
			
 
				-        "nick_name": "四海八荒"
			
 
				-    },
			
 
				-    "gh_a1b5a2142e11": {
			
 
				-        "uid": 72088970,
			
 
				-        "nick_name": "唯壹的執著"
			
 
				-    },
			
 
				-    "gh_a221d1a952aa": {
			
 
				-        "uid": 73858592,
			
 
				-        "nick_name": "凉薄少年葬空城"
			
 
				-    },
			
 
				-    "gh_a2901d34f75b": {
			
 
				-        "uid": 69637535,
			
 
				-        "nick_name": "听腻了谎话"
			
 
				-    },
			
 
				-    "gh_a29af5b297b1": {
			
 
				-        "uid": 74162338,
			
 
				-        "nick_name": "凑巧"
			
 
				-    },
			
 
				-    "gh_a307072c04b9": {
			
 
				-        "uid": 69637521,
			
 
				-        "nick_name": "踏步"
			
 
				-    },
			
 
				-    "gh_a57a534ec05c": {
			
 
				-        "uid": 72459364,
			
 
				-        "nick_name": "想和你同床"
			
 
				-    },
			
 
				-    "gh_a5c534db075f": {
			
 
				-        "uid": 74162333,
			
 
				-        "nick_name": "养猪仙人"
			
 
				-    },
			
 
				-    "gh_a5e71438865e": {
			
 
				-        "uid": 72088977,
			
 
				-        "nick_name": "同类"
			
 
				-    },
			
 
				-    "gh_a6351b447819": {
			
 
				-        "uid": 69637540,
			
 
				-        "nick_name": "七猫酒馆"
			
 
				-    },
			
 
				-    "gh_abc6794e6996": {
			
 
				-        "uid": 73723021,
			
 
				-        "nick_name": "娇娘"
			
 
				-    },
			
 
				-    "gh_abd3aef4debe": {
			
 
				-        "uid": 72088956,
			
 
				-        "nick_name": "弱鸡"
			
 
				-    },
			
 
				-    "gh_ac43e43b253b": {
			
 
				-        "uid": 69637499,
			
 
				-        "nick_name": "一厢情愿"
			
 
				-    },
			
 
				-    "gh_ac43eb24376d": {
			
 
				-        "uid": 71582078,
			
 
				-        "nick_name": "亏心者"
			
 
				-    },
			
 
				-    "gh_ad7b26ee9e17": {
			
 
				-        "uid": 71353809,
			
 
				-        "nick_name": "最宝贝的宝贝"
			
 
				-    },
			
 
				-    "gh_adca24a8f429": {
			
 
				-        "uid": 69637483,
			
 
				-        "nick_name": "对你何止一句喜欢"
			
 
				-    },
			
 
				-    "gh_aed298be263a": {
			
 
				-        "uid": 73723029,
			
 
				-        "nick_name": "毒瘤"
			
 
				-    },
			
 
				-    "gh_af559c13a06e": {
			
 
				-        "uid": 73723031,
			
 
				-        "nick_name": "气质"
			
 
				-    },
			
 
				-    "gh_b15de7c99912": {
			
 
				-        "uid": 69637536,
			
 
				-        "nick_name": "糖炒板栗"
			
 
				-    },
			
 
				-    "gh_b181786a6c8c": {
			
 
				-        "uid": 72385754,
			
 
				-        "nick_name": "暴露人性"
			
 
				-    },
			
 
				-    "gh_b24476d5090c": {
			
 
				-        "uid": 72088967,
			
 
				-        "nick_name": "挽救"
			
 
				-    },
			
 
				-    "gh_b32125c73861": {
			
 
				-        "uid": 69637493,
			
 
				-        "nick_name": "发尾"
			
 
				-    },
			
 
				-    "gh_b3f26b9dccbd": {
			
 
				-        "uid": 72125024,
			
 
				-        "nick_name": "苍天"
			
 
				-    },
			
 
				-    "gh_b3ffc1ca3a04": {
			
 
				-        "uid": 69637546,
			
 
				-        "nick_name": "主宰你心"
			
 
				-    },
			
 
				-    "gh_b676b7ad9b74": {
			
 
				-        "uid": 71021086,
			
 
				-        "nick_name": "枕畔红冰薄"
			
 
				-    },
			
 
				-    "gh_b6f2c5332c72": {
			
 
				-        "uid": 71021088,
			
 
				-        "nick_name": "斗篷"
			
 
				-    },
			
 
				-    "gh_b721056f294a": {
			
 
				-        "uid": 72459371,
			
 
				-        "nick_name": "些许几多"
			
 
				-    },
			
 
				-    "gh_b7f7144a96c5": {
			
 
				-        "uid": 72088962,
			
 
				-        "nick_name": "纵情荒唐"
			
 
				-    },
			
 
				-    "gh_b8baac4296cb": {
			
 
				-        "uid": 69637489,
			
 
				-        "nick_name": "生性"
			
 
				-    },
			
 
				-    "gh_b9b99173ff8a": {
			
 
				-        "uid": 69637524,
			
 
				-        "nick_name": "养一只月亮"
			
 
				-    },
			
 
				-    "gh_ba6e1e4f2de0": {
			
 
				-        "uid": 71353817,
			
 
				-        "nick_name": "余欢"
			
 
				-    },
			
 
				-    "gh_bd57b6978e06": {
			
 
				-        "uid": 69637527,
			
 
				-        "nick_name": "厌遇"
			
 
				-    },
			
 
				-    "gh_be505c7d28ac": {
			
 
				-        "uid": 71353823,
			
 
				-        "nick_name": "遥远的她"
			
 
				-    },
			
 
				-    "gh_be8c29139989": {
			
 
				-        "uid": 69637502,
			
 
				-        "nick_name": "不负"
			
 
				-    },
			
 
				-    "gh_bfe5b705324a": {
			
 
				-        "uid": 69637529,
			
 
				-        "nick_name": "乐极"
			
 
				-    },
			
 
				-    "gh_bfea052b5baa": {
			
 
				-        "uid": 72683733,
			
 
				-        "nick_name": "手背"
			
 
				-    },
			
 
				-    "gh_bff0bcb0694a": {
			
 
				-        "uid": 69637534,
			
 
				-        "nick_name": "简迷离"
			
 
				-    },
			
 
				-    "gh_c484cea5ce0b": {
			
 
				-        "uid": 72088968,
			
 
				-        "nick_name": "猫咚"
			
 
				-    },
			
 
				-    "gh_c5cdf60d9ab4": {
			
 
				-        "uid": 70731111,
			
 
				-        "nick_name": "定酌"
			
 
				-    },
			
 
				-    "gh_c69776baf2cd": {
			
 
				-        "uid": 69637512,
			
 
				-        "nick_name": "骄纵"
			
 
				-    },
			
 
				-    "gh_c794770120dc": {
			
 
				-        "uid": 71353819,
			
 
				-        "nick_name": "以笑相迎"
			
 
				-    },
			
 
				-    "gh_c7c9929bdfc4": {
			
 
				-        "uid": 72088969,
			
 
				-        "nick_name": "草莓酸奶"
			
 
				-    },
			
 
				-    "gh_c91b42649690": {
			
 
				-        "uid": 69637503,
			
 
				-        "nick_name": "荟萃"
			
 
				-    },
			
 
				-    "gh_cd82bb10dd98": {
			
 
				-        "uid": 72459354,
			
 
				-        "nick_name": "著迷動心"
			
 
				-    },
			
 
				-    "gh_d2cc901deca7": {
			
 
				-        "uid": 69637487,
			
 
				-        "nick_name": "恶意调笑"
			
 
				-    },
			
 
				-    "gh_d367454ca4d7": {
			
 
				-        "uid": 72088961,
			
 
				-        "nick_name": "不负虚设"
			
 
				-    },
			
 
				-    "gh_d49df5e974ca": {
			
 
				-        "uid": 70731107,
			
 
				-        "nick_name": "没你"
			
 
				-    },
			
 
				-    "gh_d4dffc34ac39": {
			
 
				-        "uid": 70744072,
			
 
				-        "nick_name": "驯课"
			
 
				-    },
			
 
				-    "gh_d5f935d0d1f2": {
			
 
				-        "uid": 69637500,
			
 
				-        "nick_name": "青少年哪吒"
			
 
				-    },
			
 
				-    "gh_d8c215687f02": {
			
 
				-        "uid": 73723033,
			
 
				-        "nick_name": "看淡"
			
 
				-    },
			
 
				-    "gh_d9de0e9b70e9": {
			
 
				-        "uid": 72088973,
			
 
				-        "nick_name": "枝头月"
			
 
				-    },
			
 
				-    "gh_da2732f4518b": {
			
 
				-        "uid": 74162340,
			
 
				-        "nick_name": "小城管小商贩"
			
 
				-    },
			
 
				-    "gh_da44c409ec0f": {
			
 
				-        "uid": 73723025,
			
 
				-        "nick_name": "红眼"
			
 
				-    },
			
 
				-    "gh_da76772d8d15": {
			
 
				-        "uid": 69637526,
			
 
				-        "nick_name": "独揽风月"
			
 
				-    },
			
 
				-    "gh_dd4c857bbb36": {
			
 
				-        "uid": 71021083,
			
 
				-        "nick_name": "过分着迷"
			
 
				-    },
			
 
				-    "gh_ddafea4bcc29": {
			
 
				-        "uid": 72410372,
			
 
				-        "nick_name": "枯燥"
			
 
				-    },
			
 
				-    "gh_ddf6ec0104d0": {
			
 
				-        "uid": 73858596,
			
 
				-        "nick_name": "诗情"
			
 
				-    },
			
 
				-    "gh_de2c9fefe715": {
			
 
				-        "uid": 72088982,
			
 
				-        "nick_name": "旧心"
			
 
				-    },
			
 
				-    "gh_de9f9ebc976b": {
			
 
				-        "uid": 69637475,
			
 
				-        "nick_name": "剑出鞘恩怨了"
			
 
				-    },
			
 
				-    "gh_e0eb490115f5": {
			
 
				-        "uid": 69637486,
			
 
				-        "nick_name": "赋别"
			
 
				-    },
			
 
				-    "gh_e24da99dc899": {
			
 
				-        "uid": 69637484,
			
 
				-        "nick_name": "恋雨夏季"
			
 
				-    },
			
 
				-    "gh_e2576b7181c6": {
			
 
				-        "uid": 69637515,
			
 
				-        "nick_name": "满天星"
			
 
				-    },
			
 
				-    "gh_e3a8e14013cd": {
			
 
				-        "uid": 73723030,
			
 
				-        "nick_name": "城堡"
			
 
				-    },
			
 
				-    "gh_e4506a7ce46f": {
			
 
				-        "uid": 74162322,
			
 
				-        "nick_name": "肥球"
			
 
				-    },
			
 
				-    "gh_e56ddf195d91": {
			
 
				-        "uid": 74162345,
			
 
				-        "nick_name": "煽情"
			
 
				-    },
			
 
				-    "gh_e6be5a12e83c": {
			
 
				-        "uid": 74162348,
			
 
				-        "nick_name": "争霸"
			
 
				-    },
			
 
				-    "gh_e75dbdc73d80": {
			
 
				-        "uid": 69637542,
			
 
				-        "nick_name": "情战"
			
 
				-    },
			
 
				-    "gh_e9d819f9e147": {
			
 
				-        "uid": 69637525,
			
 
				-        "nick_name": "与卿"
			
 
				-    },
			
 
				-    "gh_eb1f9880beb7": {
			
 
				-        "uid": 73723026,
			
 
				-        "nick_name": "清辰"
			
 
				-    },
			
 
				-    "gh_ebbba8a46bbc": {
			
 
				-        "uid": 74162319,
			
 
				-        "nick_name": "朝筠"
			
 
				-    },
			
 
				-    "gh_ede868a2e656": {
			
 
				-        "uid": 73858594,
			
 
				-        "nick_name": "晚安"
			
 
				-    },
			
 
				-    "gh_ee78360d06f5": {
			
 
				-        "uid": 71021089,
			
 
				-        "nick_name": "思绪"
			
 
				-    },
			
 
				-    "gh_efaf7da157f5": {
			
 
				-        "uid": 69637547,
			
 
				-        "nick_name": "心野性子浪"
			
 
				-    },
			
 
				-    "gh_efd90dcf48ac": {
			
 
				-        "uid": 74162316,
			
 
				-        "nick_name": "动心"
			
 
				-    },
			
 
				-    "gh_f1122b34f1f3": {
			
 
				-        "uid": 74162337,
			
 
				-        "nick_name": "该怎样"
			
 
				-    },
			
 
				-    "gh_f25b5fb01977": {
			
 
				-        "uid": 70731105,
			
 
				-        "nick_name": "山色空濛"
			
 
				-    },
			
 
				-    "gh_f2bc589c78eb": {
			
 
				-        "uid": 73723028,
			
 
				-        "nick_name": "與妳穿過風"
			
 
				-    },
			
 
				-    "gh_f321695e3983": {
			
 
				-        "uid": 72459375,
			
 
				-        "nick_name": "阁"
			
 
				-    },
			
 
				-    "gh_f4594783f5b8": {
			
 
				-        "uid": 69637544,
			
 
				-        "nick_name": "自缚"
			
 
				-    },
			
 
				-    "gh_f74ca3104604": {
			
 
				-        "uid": 74162325,
			
 
				-        "nick_name": "鬼面書生"
			
 
				-    },
			
 
				-    "gh_f902cea89e48": {
			
 
				-        "uid": 71021085,
			
 
				-        "nick_name": "晚春的树"
			
 
				-    },
			
 
				-    "gh_fa0b85528a93": {
			
 
				-        "uid": 72459365,
			
 
				-        "nick_name": "永不言弃"
			
 
				-    },
			
 
				-    "gh_fb8031aca805": {
			
 
				-        "uid": 72088959,
			
 
				-        "nick_name": "惊醒"
			
 
				-    },
			
 
				-    "gh_fe6ef3a65a48": {
			
 
				-        "uid": 69637480,
			
 
				-        "nick_name": "风间"
			
 
				-    },
			
 
				-    "gh_ff487cb5dab3": {
			
 
				-        "uid": 70744071,
			
 
				-        "nick_name": "决然"
			
 
				-    }
			
 
				-}
			
 
				-
			
 
				-
			
 
				-# prod
			
 
				-db_article = "long_articles_video"
			
 
				-db_video = "article_match_videos"
			
 
				-
			
 
				-# dev
			
 
				-# db_article = "long_articles_video_dev"
			
 
				-# db_video = "article_match_videos_dev"
			
 
				-
			
 
				-# spider coroutines
			
 
				-spider_coroutines = 10
			
 
				-
			
 
				-# mysql coroutines
			
 
				-mysql_coroutines = 100
			
--- a/static/logo.png
+++ b/static/logo.png
--- a/static/official_accounts
+++ b/static/official_accounts
@@ -1,3 +0,0 @@
 
				-天天美好祝福生活
			
 
				-wx0b7d95eb293b783b
			
 
				-https://rescdn.yishihui.com/0temp/ttmhzfsh.png
			
--- a/tasks/__init__.py
+++ b/tasks/__init__.py
@@ -2,7 +2,8 @@
 
				 @author: luojunhui
			
 
				 定时任务
			
 
				 """
			
 
				-from .task1 import MatchTask1
			
 
				-from .task2 import MatchTask2
			
 
				-from .task3 import MatchTask3
			
 
				-from .task4 import MatchTask4
			
 
				+from .etl_task import AsyncETL
			
 
				+from .kimi_task import KimiTask
			
 
				+from .spider_task import spiderTask
			
 
				+from .publish_task import publishTask
			
 
				+from .history_task import historyContentIdTask
			
--- a/tasks/chadui.py
+++ b/tasks/chadui.py
@@ -1,150 +0,0 @@
 
				-"""
			
 
				-@author: luojunhui
			
 
				-"""
			
 
				-import asyncio
			
 
				-
			
 
				-from static.config import db_article, db_video
			
 
				-from applications.functions.log import logging
			
 
				-from static.config import mysql_coroutines
			
 
				-
			
 
				-
			
 
				-class MatchTask5(object):
			
 
				-    """
			
 
				-    定时执行任务
			
 
				-    """
			
 
				-
			
 
				-    def __init__(self, mysql_client):
			
 
				-        """
			
 
				-        :param mysql_client:
			
 
				-        """
			
 
				-        self.mysql_client = mysql_client
			
 
				-
			
 
				-    async def get_task(self):
			
 
				-        """
			
 
				-        获取任务
			
 
				-        :return:
			
 
				-        """
			
 
				-        select_sql = f"""
			
 
				-            SELECT trace_id, content_id, gh_id, article_title, article_text, content_status, process_times
			
 
				-            FROM {db_article} 
			
 
				-            WHERE content_status = 0 and process_times <= 5 and account_name = '万事如意一家子'
			
 
				-            ORDER BY request_time_stamp
			
 
				-            DESC
			
 
				-            LIMIT {mysql_coroutines};
			
 
				-        """
			
 
				-        task_list = await self.mysql_client.async_select(sql=select_sql)
			
 
				-        task_obj_list = [
			
 
				-            {
			
 
				-                "trace_id": item[0],
			
 
				-                "content_id": item[1],
			
 
				-                "gh_id": item[2],
			
 
				-                "title": item[3],
			
 
				-                "text": item[4],
			
 
				-                "content_status": item[5],
			
 
				-                "process_times": item[6]
			
 
				-            } for item in task_list
			
 
				-        ]
			
 
				-        print("本次任务获取到 {} 条视频".format(len(task_obj_list)))
			
 
				-        # logging(
			
 
				-        #     code="9001",
			
 
				-        #     info="本次任务获取到 {} 条视频".format(len(task_obj_list)),
			
 
				-        #     data=task_obj_list
			
 
				-        # )
			
 
				-        return task_obj_list
			
 
				-
			
 
				-    async def get_history_videos(self, content_id):
			
 
				-        """
			
 
				-        check whether the contents videos exists
			
 
				-        :param content_id:
			
 
				-        :return:
			
 
				-        """
			
 
				-        select_sql = f"""
			
 
				-            SELECT video_id
			
 
				-            FROM {db_video}
			
 
				-            where content_id = '{content_id}' and video_status = 1 order by request_time DESC;
			
 
				-        """
			
 
				-        content_videos = await self.mysql_client.async_select(select_sql)
			
 
				-        videos = [vid for vid in content_videos]
			
 
				-        print(len(videos))
			
 
				-        if len(videos) >= 3:
			
 
				-            return videos
			
 
				-        else:
			
 
				-            return None
			
 
				-
			
 
				-    async def use_exists_contents_videos(self, video_id_list, params):
			
 
				-        """
			
 
				-        使用已经存在的视频id
			
 
				-        :return:
			
 
				-        """
			
 
				-        trace_id = params['trace_id']
			
 
				-        content_id = params['content_id']
			
 
				-        select_sql = f"""
			
 
				-            SELECT kimi_title
			
 
				-            FROM {db_article}
			
 
				-            WHERE content_id = '{content_id}' and kimi_title is not null limit 1;
			
 
				-        """
			
 
				-        info = await self.mysql_client.async_select(sql=select_sql)
			
 
				-        kimi_title = info[0]
			
 
				-        update_sql = f"""
			
 
				-            UPDATE {db_article}
			
 
				-            SET 
			
 
				-                kimi_title=%s,
			
 
				-                recall_video_id1=%s, 
			
 
				-                recall_video_id2=%s, 
			
 
				-                recall_video_id3=%s,
			
 
				-                content_status=%s,
			
 
				-                process_times = %s
			
 
				-            WHERE  trace_id = %s
			
 
				-        """
			
 
				-        vid1, vid2, vid3 = video_id_list[0], video_id_list[1], video_id_list[2]
			
 
				-        await self.mysql_client.async_insert(
			
 
				-            sql=update_sql,
			
 
				-            params=(
			
 
				-                kimi_title,
			
 
				-                video_id_list[0],
			
 
				-                "NULL" if vid2 is None else vid2,
			
 
				-                "NULL" if vid3 is None else vid3,
			
 
				-                2,
			
 
				-                int(params['process_times']) + 1,
			
 
				-                trace_id
			
 
				-            )
			
 
				-        )
			
 
				-        logging(
			
 
				-            code="9002",
			
 
				-            info="已从历史文章更新，文章id： {}".format(content_id),
			
 
				-            trace_id=trace_id
			
 
				-        )
			
 
				-
			
 
				-    async def process_task(self, params):
			
 
				-        """
			
 
				-        异步执行
			
 
				-        :param params:
			
 
				-        :return:
			
 
				-        """
			
 
				-        content_id = params['content_id']
			
 
				-        print(content_id)
			
 
				-        # 判断该篇文章是否存在未下架的视频，且判断是否有3条， 如果没有三条，则启动新抓取任务，后续优化点
			
 
				-        video_id_list = await self.get_history_videos(content_id=content_id)
			
 
				-        print(video_id_list)
			
 
				-        if video_id_list:
			
 
				-            # 说明已经存在了结果, 将该条记录下的video_id拿出来
			
 
				-            print("存在历史文章")
			
 
				-            await self.use_exists_contents_videos(video_id_list=video_id_list, params=params)
			
 
				-        else:
			
 
				-            pass
			
 
				-
			
 
				-    async def deal(self):
			
 
				-        """
			
 
				-        处理
			
 
				-        :return:
			
 
				-        """
			
 
				-        task_list = await self.get_task()
			
 
				-        print(len(task_list))
			
 
				-        if task_list:
			
 
				-            tasks = [self.process_task(params) for params in task_list]
			
 
				-            await asyncio.gather(*tasks)
			
 
				-        else:
			
 
				-            logging(
			
 
				-                code="9008",
			
 
				-                info="没有要处理的请求"
			
 
				-            )
			
--- a/tasks/etl_task.py
+++ b/tasks/etl_task.py
@@ -0,0 +1,300 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+"""
			
 
				+import os
			
 
				+
			
 
				+import oss2
			
 
				+import aiohttp
			
 
				+import aiofiles
			
 
				+import asyncio
			
 
				+from hashlib import md5
			
 
				+from uuid import uuid4
			
 
				+
			
 
				+import requests
			
 
				+from fake_useragent import FakeUserAgent
			
 
				+from applications.config import Config
			
 
				+
			
 
				+
			
 
				+async def downloadCover(file_path, platform, cover_url):
			
 
				+    """
			
 
				+    下载视频封面
			
 
				+    :param platform:
			
 
				+    :param cover_url:
			
 
				+    :param file_path:
			
 
				+    :return:
			
 
				+    """
			
 
				+    headers = requestHeader(platform=platform, url=cover_url, download_type="cover")
			
 
				+    response = requests.get(url=cover_url, headers=headers)
			
 
				+    if b"<html>" in response.content:
			
 
				+        return None
			
 
				+    elif response.status_code != 200:
			
 
				+        return None
			
 
				+    else:
			
 
				+        with open(file_path, "wb") as f:
			
 
				+            f.write(response.content)
			
 
				+        return file_path
			
 
				+
			
 
				+
			
 
				+def requestHeader(platform, url, download_type="video"):
			
 
				+    """
			
 
				+    请求头
			
 
				+    :return:
			
 
				+    """
			
 
				+    if platform == "xg_search":
			
 
				+        if "v9-xg-web-pc.ixigua.com" in url:
			
 
				+            headers = {
			
 
				+                "Accept": "*/*",
			
 
				+                "Accept-Language": "zh-CN,zh;q=0.9",
			
 
				+                "Host": "v9-xg-web-pc.ixigua.com",
			
 
				+                "User-Agent": FakeUserAgent().chrome,
			
 
				+                "Origin": "https://www.ixigua.com/",
			
 
				+                "Referer": "https://www.ixigua.com/"
			
 
				+            }
			
 
				+        elif "v3-xg-web-pc.ixigua.com" in url:
			
 
				+            headers = {
			
 
				+                "Accept": "*/*",
			
 
				+                "Accept-Language": "zh-CN,zh;q=0.9",
			
 
				+                "Host": "v3-xg-web-pc.ixigua.com",
			
 
				+                "User-Agent": FakeUserAgent().chrome,
			
 
				+                "Origin": "https://www.ixigua.com/",
			
 
				+                "Referer": "https://www.ixigua.com/"
			
 
				+            }
			
 
				+        elif download_type == "cover":
			
 
				+            headers = {
			
 
				+                'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7',
			
 
				+                'Accept-Language': 'en,zh;q=0.9,zh-CN;q=0.8',
			
 
				+                'Cache-Control': 'max-age=0',
			
 
				+                'Proxy-Connection': 'keep-alive',
			
 
				+                'Upgrade-Insecure-Requests': '1',
			
 
				+                'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/125.0.0.0 Safari/537.36'
			
 
				+            }
			
 
				+        else:
			
 
				+            headers = {
			
 
				+                "Accept": "*/*",
			
 
				+                "Accept-Language": "zh-CN,zh;q=0.9",
			
 
				+                "Host": "v3-xg-web-pc.ixigua.com",
			
 
				+                "User-Agent": FakeUserAgent().chrome,
			
 
				+                "Origin": "https://www.ixigua.com/",
			
 
				+                "Referer": "https://www.ixigua.com/"
			
 
				+            }
			
 
				+    elif platform == "baidu_search":
			
 
				+        headers = {
			
 
				+            "Accept": "*/*",
			
 
				+            "Accept-Language": "zh-CN,zh;q=0.9",
			
 
				+            "User-Agent": FakeUserAgent().chrome,
			
 
				+        }
			
 
				+    elif platform == "wx_search":
			
 
				+        headers = {
			
 
				+            "Accept": "*/*",
			
 
				+            "Accept-Language": "zh-CN,zh;q=0.9",
			
 
				+            "User-Agent": FakeUserAgent().chrome,
			
 
				+            "Origin": "https://mp.weixin.qq.com",
			
 
				+            "Referer": "https://mp.weixin.qq.com"
			
 
				+        }
			
 
				+    elif platform == "dy_search":
			
 
				+        headers = {
			
 
				+            'accept': '*/*',
			
 
				+            'accept-language': 'en,zh;q=0.9,zh-CN;q=0.8',
			
 
				+            'priority': 'i',
			
 
				+            'range': 'bytes=0-',
			
 
				+            'referer': 'https://v11-coldf.douyinvod.com/',
			
 
				+            'user-agent': FakeUserAgent().chrome
			
 
				+        }
			
 
				+    else:
			
 
				+        headers = {}
			
 
				+    return headers
			
 
				+
			
 
				+
			
 
				+async def downloadVideo(file_path, platform, video_url, download_type="video"):
			
 
				+    """
			
 
				+    :param download_type:
			
 
				+    :param video_url:
			
 
				+    :param platform:
			
 
				+    :param file_path:
			
 
				+    :return:
			
 
				+    """
			
 
				+    headers = requestHeader(platform=platform, url=video_url, download_type=download_type)
			
 
				+    if os.path.exists(file_path):
			
 
				+        file_size = os.path.getsize(file_path)
			
 
				+        headers["Range"] = f"bytes={file_size}-"
			
 
				+    else:
			
 
				+        file_size = 0
			
 
				+    async with aiohttp.ClientSession() as session:
			
 
				+        async with session.get(video_url, headers=headers) as response:
			
 
				+            if response.status in [200, 206]:
			
 
				+                if file_size > 0:
			
 
				+                    async with aiofiles.open(file_path, "ab+") as f:
			
 
				+                        # 以1MB为单位分块下载
			
 
				+                        async for chunk in response.content.iter_chunked(1024 * 1024):
			
 
				+                            await f.write(chunk)
			
 
				+                else:
			
 
				+                    async with aiofiles.open(file_path, "wb") as f:
			
 
				+                        # 以1MB为单位分块下载
			
 
				+                        async for chunk in response.content.iter_chunked(1024 * 1024):
			
 
				+                            await f.write(chunk)
			
 
				+
			
 
				+            else:
			
 
				+                print(response.status)
			
 
				+    return file_path
			
 
				+
			
 
				+
			
 
				+def generateVideoPath(platform, video_id):
			
 
				+    """
			
 
				+    通过视频信息生成唯一视频地址
			
 
				+    :return:
			
 
				+    """
			
 
				+    index = "{}-{}-{}".format(platform, video_id, uuid4())
			
 
				+    index = md5(index.encode()).hexdigest()
			
 
				+    file_name = "{}.mp4".format(index)
			
 
				+    cover_name = "{}.png".format(index)
			
 
				+    file_path = os.path.join(os.getcwd(), "static", file_name)
			
 
				+    cover_path = os.path.join(os.getcwd(), "static", cover_name)
			
 
				+    return file_path, cover_path
			
 
				+
			
 
				+
			
 
				+async def uploadToOss(local_video_path, download_type):
			
 
				+    """
			
 
				+    把视频上传到 oss
			
 
				+    :return:
			
 
				+    """
			
 
				+    oss_video_key = "long_articles/{}/".format(download_type) + str(uuid4())
			
 
				+    access_key_id = "LTAIP6x1l3DXfSxm"
			
 
				+    access_key_secret = "KbTaM9ars4OX3PMS6Xm7rtxGr1FLon"
			
 
				+    endpoint = "oss-cn-hangzhou.aliyuncs.com"
			
 
				+    bucket_name = "art-pubbucket"
			
 
				+    bucket = oss2.Bucket(
			
 
				+        oss2.Auth(access_key_id, access_key_secret), endpoint, bucket_name
			
 
				+    )
			
 
				+    bucket.put_object_from_file(key=oss_video_key, filename=local_video_path)
			
 
				+    return oss_video_key
			
 
				+
			
 
				+
			
 
				+class AsyncETL(object):
			
 
				+    """
			
 
				+    视频下载功能
			
 
				+    """
			
 
				+
			
 
				+    def __init__(self, mysql_client):
			
 
				+        # self.proxy = {
			
 
				+        #     "http://": "http://t17772369458618:5zqcjkmy@q796.kdltps.com:15818/",
			
 
				+        #     "https://": "http://t17772369458618:5zqcjkmy@q796.kdltps.com:15818/",
			
 
				+        # }
			
 
				+        self.max_retry = 5
			
 
				+        self.mysql_client = mysql_client
			
 
				+        self.article_crawler_videos = Config().articleCrawlerVideos
			
 
				+
			
 
				+    async def getTasks(self):
			
 
				+        """
			
 
				+        获取视频 id
			
 
				+        :return:
			
 
				+        """
			
 
				+        select_sql = f"""
			
 
				+        SELECT id, out_video_id, platform, video_title, video_url, cover_url, user_id
			
 
				+        FROM {self.article_crawler_videos}
			
 
				+        WHERE download_status = 0
			
 
				+        ORDER BY id
			
 
				+        LIMIT 10;
			
 
				+        """
			
 
				+        result = await self.mysql_client.asyncSelect(select_sql)
			
 
				+        if result:
			
 
				+            tasks = [
			
 
				+                {
			
 
				+                    "id": line[0],
			
 
				+                    "video_id": line[1],
			
 
				+                    "platform": line[2],
			
 
				+                    "video_title": line[3],
			
 
				+                    "video_url": line[4],
			
 
				+                    "cover_url": line[5],
			
 
				+                    "user_id": line[6]
			
 
				+                }
			
 
				+                for line in result
			
 
				+            ]
			
 
				+            return tasks
			
 
				+        else:
			
 
				+            return []
			
 
				+
			
 
				+    async def processTask(self, params):
			
 
				+        """
			
 
				+        处理 task
			
 
				+        :return:
			
 
				+        {
			
 
				+                    "id": line[0],
			
 
				+                    "video_id": line[1],
			
 
				+                    "platform": line[2],
			
 
				+                    "video_title": line[3],
			
 
				+                    "video_url": line[4],
			
 
				+                    "cover_url": line[5],
			
 
				+                    "user_id": line[6]
			
 
				+                }
			
 
				+        """
			
 
				+        update_sql_0 = f"""
			
 
				+                    UPDATE {self.article_crawler_videos}
			
 
				+                    SET download_status = %s
			
 
				+                    WHERE id = %s;
			
 
				+                    """
			
 
				+        await self.mysql_client.asyncInsert(
			
 
				+            sql=update_sql_0,
			
 
				+            params=(1, params['id'])
			
 
				+        )
			
 
				+        try:
			
 
				+            local_video_path, local_cover_path = generateVideoPath(params['platform'], params['video_id'])
			
 
				+            # download videos
			
 
				+            file_path = await downloadVideo(
			
 
				+                file_path=local_video_path,
			
 
				+                platform=params['platform'],
			
 
				+                video_url=params['video_url']
			
 
				+            )
			
 
				+            # download cover
			
 
				+            cover_path = await downloadCover(
			
 
				+                file_path=local_cover_path,
			
 
				+                platform=params['platform'],
			
 
				+                cover_url=params['cover_url']
			
 
				+            )
			
 
				+            oss_video = await uploadToOss(
			
 
				+                local_video_path=file_path,
			
 
				+                download_type="video"
			
 
				+            )
			
 
				+            if cover_path:
			
 
				+                oss_cover = await uploadToOss(
			
 
				+                    local_video_path=cover_path,
			
 
				+                    download_type="image"
			
 
				+                )
			
 
				+            else:
			
 
				+                oss_cover = None
			
 
				+            update_sql = f"""
			
 
				+            UPDATE {self.article_crawler_videos}
			
 
				+            SET video_oss_path = %s, cover_oss_path = %s, download_status = %s
			
 
				+            WHERE id = %s;
			
 
				+            """
			
 
				+            await self.mysql_client.asyncInsert(
			
 
				+                sql=update_sql,
			
 
				+                params=(
			
 
				+                    oss_video,
			
 
				+                    oss_cover,
			
 
				+                    2,
			
 
				+                    params['id']
			
 
				+                )
			
 
				+            )
			
 
				+        except Exception as e:
			
 
				+            print("failed", e)
			
 
				+            update_sql = f"""
			
 
				+            UPDATE {self.article_crawler_videos}
			
 
				+            SET download_status = %s
			
 
				+            WHERE id = %s;
			
 
				+            """
			
 
				+            await self.mysql_client.asyncInsert(
			
 
				+                sql=update_sql,
			
 
				+                params=(3, params['id'])
			
 
				+            )
			
 
				+
			
 
				+    async def deal(self):
			
 
				+        """
			
 
				+        ETL Deal Task
			
 
				+        :return:
			
 
				+        """
			
 
				+        task_list = await self.getTasks()
			
 
				+        if task_list:
			
 
				+            tasks = [self.processTask(params) for params in task_list]
			
 
				+            await asyncio.gather(*tasks)
			
 
				+        else:
			
 
				+            print("No spider tasks")
			
--- a/tasks/history_task.py
+++ b/tasks/history_task.py
@@ -0,0 +1,215 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+"""
			
 
				+import json
			
 
				+import time
			
 
				+import asyncio
			
 
				+
			
 
				+from applications.config import Config
			
 
				+from applications.functions.log import logging
			
 
				+from applications.functions.pqFunctions import publishToPQ
			
 
				+
			
 
				+
			
 
				+class historyContentIdTask(object):
			
 
				+    """
			
 
				+    处理已经匹配过小程序的文章
			
 
				+    """
			
 
				+
			
 
				+    def __init__(self, mysql_client):
			
 
				+        """
			
 
				+        :param mysql_client:
			
 
				+        """
			
 
				+        self.mysql_client = mysql_client
			
 
				+        self.article_text = Config().articleText
			
 
				+        self.article_video = Config().articleVideos
			
 
				+        self.article_crawler_video = Config().articleCrawlerVideos
			
 
				+        self.history_coroutines = Config().getConfigValue("historyArticleCoroutines")
			
 
				+
			
 
				+    async def getTaskList(self):
			
 
				+        """
			
 
				+        获取任务
			
 
				+        :return:
			
 
				+        """
			
 
				+        select_sql1 = f"""
			
 
				+            SELECT 
			
 
				+                ART.trace_id, 
			
 
				+                ART.content_id, 
			
 
				+                ART.flow_pool_level, 
			
 
				+                ART.gh_id,
			
 
				+                ART.process_times
			
 
				+            FROM {self.article_video} ART
			
 
				+            JOIN (
			
 
				+                select content_id, count(1) as cnt 
			
 
				+                from {self.article_crawler_video}
			
 
				+                where download_status = 2
			
 
				+                group by content_id
			
 
				+            ) VID on ART.content_id = VID.content_id and VID.cnt >= 3
			
 
				+            WHERE ART.content_status = 0 and ART.process_times <= 3
			
 
				+            ORDER BY request_timestamp
			
 
				+            LIMIT {self.history_coroutines};
			
 
				+        """
			
 
				+        tasks = await self.mysql_client.asyncSelect(sql=select_sql1)
			
 
				+        task_obj_list = [
			
 
				+            {
			
 
				+                "trace_id": item[0],
			
 
				+                "content_id": item[1],
			
 
				+                "flow_pool_level": item[2],
			
 
				+                "gh_id": item[3],
			
 
				+                "process_times": item[4]
			
 
				+            } for item in tasks
			
 
				+        ]
			
 
				+        logging(
			
 
				+            code="9001",
			
 
				+            info="本次任务获取到 {} 条视频".format(len(task_obj_list)),
			
 
				+            data=task_obj_list
			
 
				+        )
			
 
				+        return task_obj_list
			
 
				+
			
 
				+    async def getVideoList(self, content_id):
			
 
				+        """
			
 
				+        content_id
			
 
				+        :return:
			
 
				+        """
			
 
				+        sql = f"""
			
 
				+        SELECT platform, play_count, like_count, video_oss_path, cover_oss_path, user_id
			
 
				+        FROM {self.article_crawler_video}
			
 
				+        WHERE content_id = '{content_id}' and download_status = 2;
			
 
				+        """
			
 
				+        res_tuple = await self.mysql_client.asyncSelect(sql)
			
 
				+        if len(res_tuple) >= 3:
			
 
				+            return [
			
 
				+                {
			
 
				+                    "platform": i[0],
			
 
				+                    "play_count": i[1],
			
 
				+                    "like_count": i[2],
			
 
				+                    "video_oss_path": i[3],
			
 
				+                    "cover_oss_path": i[4],
			
 
				+                    "uid": i[5]
			
 
				+                }
			
 
				+                for i in res_tuple]
			
 
				+        else:
			
 
				+            return []
			
 
				+
			
 
				+    async def getKimiTitle(self, content_id):
			
 
				+        """
			
 
				+        获取 kimiTitle
			
 
				+        :param content_id:
			
 
				+        :return:
			
 
				+        """
			
 
				+        select_sql = f"""
			
 
				+        select kimi_title from {self.article_text} where content_id = '{content_id}';
			
 
				+        """
			
 
				+        res_tuple = await self.mysql_client.asyncSelect(select_sql)
			
 
				+        if res_tuple:
			
 
				+            return res_tuple[0][0]
			
 
				+        else:
			
 
				+            return False
			
 
				+
			
 
				+    async def publishVideosToPq(self, trace_id, flow_pool_level, kimi_title, gh_id, download_videos, process_times):
			
 
				+        """
			
 
				+        发布至 pq
			
 
				+        :param process_times:
			
 
				+        :param trace_id:
			
 
				+        :param download_videos: 已下载的视频---> list [{}, {}, {}.... ]
			
 
				+        :param gh_id: 公众号 id ---> str
			
 
				+        :param kimi_title: kimi 标题 ---> str
			
 
				+        :param flow_pool_level: 流量池层级 ---> str
			
 
				+        :return:
			
 
				+        """
			
 
				+        video_list = download_videos[:3]
			
 
				+        match flow_pool_level:
			
 
				+            case "autoArticlePoolLevel4":
			
 
				+                print("冷启层")
			
 
				+                video_list = []
			
 
				+            case "autoArticlePoolLevel3":
			
 
				+                print("暂时未知层")
			
 
				+                video_list = []
			
 
				+            case "autoArticlePoolLevel2":
			
 
				+                print("次条层")
			
 
				+                video_list = []
			
 
				+            case "autoArticlePoolLevel1":
			
 
				+                print("头条层")
			
 
				+                video_list = []
			
 
				+        L = []
			
 
				+        for video_obj in video_list:
			
 
				+            params = {
			
 
				+                "videoPath": video_obj['video_oss_path'],
			
 
				+                "uid": video_obj['uid'],
			
 
				+                "title": kimi_title
			
 
				+            }
			
 
				+            response = await publishToPQ(params)
			
 
				+            # time.sleep(2)
			
 
				+            obj = {
			
 
				+                "uid": video_obj['uid'],
			
 
				+                "source": video_obj['platform'],
			
 
				+                "kimiTitle": kimi_title,
			
 
				+                "videoId": response['data']['id'],
			
 
				+                "videoCover": response['data']['shareImgPath'],
			
 
				+                "videoPath": response['data']['videoPath'],
			
 
				+                "videoOss": video_obj['video_oss_path'].split("/")[-1]
			
 
				+            }
			
 
				+            L.append(obj)
			
 
				+        update_sql = f"""
			
 
				+           UPDATE {self.article_video}
			
 
				+           SET content_status = %s, response = %s, process_times = %s
			
 
				+           WHERE trace_id = %s;
			
 
				+           """
			
 
				+        await self.mysql_client.asyncInsert(
			
 
				+            sql=update_sql,
			
 
				+            params=(2, json.dumps(L, ensure_ascii=False), process_times + 1, trace_id)
			
 
				+        )
			
 
				+
			
 
				+    async def processTask(self, params):
			
 
				+        """
			
 
				+        异步执行
			
 
				+        :param params:
			
 
				+        :return:
			
 
				+        """
			
 
				+        content_id = params['content_id']
			
 
				+        trace_id = params['trace_id']
			
 
				+        flow_pool_level = params['flow_pool_level'],
			
 
				+        gh_id = params['gh_id']
			
 
				+        process_times = params['process_times']
			
 
				+        # 判断该篇文章是否存在未下架的视频，且判断是否有3条， 如果没有三条，则启动新抓取任务，后续优化点
			
 
				+        download_videos = await self.getVideoList(content_id=content_id)
			
 
				+        if download_videos:
			
 
				+            # 把状态修改为 4
			
 
				+            update_sql = f"""
			
 
				+            UPDATE {self.article_video}
			
 
				+            SET content_status = %s 
			
 
				+            WHERE trace_id = %s;
			
 
				+            """
			
 
				+            await self.mysql_client.asyncInsert(
			
 
				+                sql=update_sql,
			
 
				+                params=(4, trace_id)
			
 
				+            )
			
 
				+
			
 
				+            kimi_title = await self.getKimiTitle(content_id)
			
 
				+            if kimi_title:
			
 
				+                await self.publishVideosToPq(
			
 
				+                    flow_pool_level=flow_pool_level,
			
 
				+                    kimi_title=kimi_title,
			
 
				+                    gh_id=gh_id,
			
 
				+                    trace_id=trace_id,
			
 
				+                    download_videos=download_videos,
			
 
				+                    process_times=process_times
			
 
				+                )
			
 
				+            else:
			
 
				+                print("Kimi title 生成失败---后续加报警")
			
 
				+        else:
			
 
				+            pass
			
 
				+
			
 
				+    async def deal(self):
			
 
				+        """
			
 
				+        处理
			
 
				+        :return:
			
 
				+        """
			
 
				+        task_list = await self.getTaskList()
			
 
				+        if task_list:
			
 
				+            tasks = [self.processTask(params) for params in task_list]
			
 
				+            await asyncio.gather(*tasks)
			
 
				+        else:
			
 
				+            logging(
			
 
				+                code="9008",
			
 
				+                info="没有要处理的请求"
			
 
				+            )
			
--- a/tasks/kimi_task.py
+++ b/tasks/kimi_task.py
@@ -0,0 +1,98 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+"""
			
 
				+import json
			
 
				+import asyncio
			
 
				+from applications.functions.kimi import KimiServer
			
 
				+from applications.functions.log import logging
			
 
				+from applications.config import Config
			
 
				+
			
 
				+
			
 
				+class KimiTask(object):
			
 
				+    """
			
 
				+    KIMI task
			
 
				+    """
			
 
				+
			
 
				+    def __init__(self, mysql_client):
			
 
				+        """
			
 
				+
			
 
				+        :param mysql_client:
			
 
				+        """
			
 
				+        self.mysql_client = mysql_client
			
 
				+        self.config = Config()
			
 
				+
			
 
				+    async def getTasks(self):
			
 
				+        """
			
 
				+        获取 tasks
			
 
				+        :return:
			
 
				+        """
			
 
				+        sql = f"""
			
 
				+        SELECT content_id, article_title, article_text
			
 
				+        FROM {self.config.articleText}
			
 
				+        WHERE kimi_status = 0
			
 
				+        limit 5;
			
 
				+        """
			
 
				+        content_list = await self.mysql_client.asyncSelect(sql)
			
 
				+        if content_list:
			
 
				+            task_list = [
			
 
				+                {
			
 
				+                    "contentId": i[0],
			
 
				+                    "articleTitle": i[1],
			
 
				+                    "articleText": i[2]
			
 
				+                } for i in content_list
			
 
				+            ]
			
 
				+            return task_list
			
 
				+        else:
			
 
				+            return []
			
 
				+
			
 
				+    async def processTask(self, params):
			
 
				+        """
			
 
				+        do something
			
 
				+        :return:
			
 
				+        """
			
 
				+        K = KimiServer()
			
 
				+        try:
			
 
				+            kimi_info = await K.search_kimi_schedule(params=params)
			
 
				+            kimi_title = kimi_info['k_title']
			
 
				+            content_title = kimi_info['content_title'].replace("'", "").replace('"', "")
			
 
				+            content_keys = json.dumps(kimi_info['content_keys'], ensure_ascii=False)
			
 
				+            update_kimi_sql = f"""
			
 
				+            UPDATE {self.config.articleText} 
			
 
				+            SET
			
 
				+                kimi_title = %s,
			
 
				+                kimi_summary = %s,
			
 
				+                kimi_keys = %s,
			
 
				+                kimi_status = %s
			
 
				+            WHERE content_id = %s;
			
 
				+                                    """
			
 
				+            await self.mysql_client.asyncInsert(
			
 
				+                sql=update_kimi_sql,
			
 
				+                params=(kimi_title, content_title, content_keys, 1, params['contentId'])
			
 
				+            )
			
 
				+        except Exception as e:
			
 
				+            update_kimi_sql = f"""
			
 
				+            UPDATE {self.config.articleText}
			
 
				+            SET
			
 
				+                kimi_status = %s 
			
 
				+            WHERE content_id = %s
			
 
				+            """
			
 
				+            await self.mysql_client.asyncInsert(
			
 
				+                sql=update_kimi_sql,
			
 
				+                params=(2, params['contentId'])
			
 
				+            )
			
 
				+            print("kimi error--{}".format(e))
			
 
				+
			
 
				+    async def deal(self):
			
 
				+        """
			
 
				+        deal function
			
 
				+        :return:
			
 
				+        """
			
 
				+        task_list = await self.getTasks()
			
 
				+        if task_list:
			
 
				+            tasks = [self.processTask(params) for params in task_list]
			
 
				+            await asyncio.gather(*tasks)
			
 
				+        else:
			
 
				+            logging(
			
 
				+                code="9008",
			
 
				+                info="没有要处理的 kimi 任务"
			
 
				+            )
			
--- a/tasks/publish_task.py
+++ b/tasks/publish_task.py
@@ -0,0 +1,186 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+发布到 pq 获取视频 id
			
 
				+"""
			
 
				+import asyncio
			
 
				+import json
			
 
				+import time
			
 
				+
			
 
				+from applications.config import Config
			
 
				+from applications.functions.log import logging
			
 
				+from applications.functions.pqFunctions import publishToPQ
			
 
				+
			
 
				+
			
 
				+class publishTask(object):
			
 
				+    """
			
 
				+    在 match_videos 表中， 获取 content_status = 1 的 content_id
			
 
				+    用  content_id 在 crawler_videos 表， 查询 download_status为 2 的视频，表示该 content_id 已经匹配完的视频
			
 
				+    通过 流量池tag  逻辑
			
 
				+    把 crawler_videos 中的视频路径发布至 pq， 获得 videoId
			
 
				+    match_videos表将 content_status 修改为 2，response中记录 videoId && ossName等信息
			
 
				+    """
			
 
				+
			
 
				+    def __init__(self, mysql_client):
			
 
				+        self.mysql_client = mysql_client
			
 
				+        self.article_video = Config().articleVideos
			
 
				+        self.article_text = Config().articleText
			
 
				+        self.article_crawler_video = Config().articleCrawlerVideos
			
 
				+
			
 
				+    async def getTasks(self):
			
 
				+        """
			
 
				+        获取 task
			
 
				+        :return:
			
 
				+        """
			
 
				+        select_sql = f"""
			
 
				+        SELECT trace_id, content_id, flow_pool_level, gh_id
			
 
				+        FROM {self.article_video} 
			
 
				+        WHERE content_status = 1
			
 
				+        limit 10;
			
 
				+        """
			
 
				+        tasks = await self.mysql_client.asyncSelect(select_sql)
			
 
				+        if tasks:
			
 
				+            return [
			
 
				+                {
			
 
				+                    "trace_id": i[0],
			
 
				+                    "content_id": i[1],
			
 
				+                    "flow_pool_level": i[2],
			
 
				+                    "gh_id": i[3]
			
 
				+                }
			
 
				+                for i in tasks
			
 
				+            ]
			
 
				+        else:
			
 
				+            return []
			
 
				+
			
 
				+    async def getVideoList(self, content_id):
			
 
				+        """
			
 
				+        content_id
			
 
				+        :return:
			
 
				+        """
			
 
				+        sql = f"""
			
 
				+        SELECT platform, play_count, like_count, video_oss_path, cover_oss_path, user_id
			
 
				+        FROM {self.article_crawler_video}
			
 
				+        WHERE content_id = '{content_id}' and download_status = 2;
			
 
				+        """
			
 
				+        res_tuple = await self.mysql_client.asyncSelect(sql)
			
 
				+        if len(res_tuple) >= 3:
			
 
				+            return [
			
 
				+                {
			
 
				+                    "platform": i[0],
			
 
				+                    "play_count": i[1],
			
 
				+                    "like_count": i[2],
			
 
				+                    "video_oss_path": i[3],
			
 
				+                    "cover_oss_path": i[4],
			
 
				+                    "uid": i[5]
			
 
				+                }
			
 
				+                for i in res_tuple]
			
 
				+        else:
			
 
				+            return []
			
 
				+
			
 
				+    async def getKimiTitle(self, content_id):
			
 
				+        """
			
 
				+        获取 kimiTitle
			
 
				+        :param content_id:
			
 
				+        :return:
			
 
				+        """
			
 
				+        select_sql = f"""
			
 
				+        select kimi_title from {self.article_text} where content_id = '{content_id}';
			
 
				+        """
			
 
				+        res_tuple = await self.mysql_client.asyncSelect(select_sql)
			
 
				+        if res_tuple:
			
 
				+            return res_tuple[0][0]
			
 
				+        else:
			
 
				+            return False
			
 
				+
			
 
				+    async def publishVideosToPq(self, trace_id, flow_pool_level, kimi_title, gh_id, download_videos):
			
 
				+        """
			
 
				+        发布至 pq
			
 
				+        :param trace_id:
			
 
				+        :param download_videos: 已下载的视频---> list [{}, {}, {}.... ]
			
 
				+        :param gh_id: 公众号 id ---> str
			
 
				+        :param kimi_title: kimi 标题 ---> str
			
 
				+        :param flow_pool_level: 流量池层级 ---> str
			
 
				+        :return:
			
 
				+        """
			
 
				+        video_list = download_videos[:3]
			
 
				+        match flow_pool_level:
			
 
				+            case "autoArticlePoolLevel4":
			
 
				+                print("冷启层")
			
 
				+                video_list = []
			
 
				+            case "autoArticlePoolLevel3":
			
 
				+                print("暂时未知层")
			
 
				+                video_list = []
			
 
				+            case "autoArticlePoolLevel2":
			
 
				+                print("次条层")
			
 
				+                video_list = []
			
 
				+            case "autoArticlePoolLevel1":
			
 
				+                print("头条层")
			
 
				+                video_list = []
			
 
				+        L = []
			
 
				+        for video_obj in video_list:
			
 
				+            params = {
			
 
				+                "videoPath": video_obj['video_oss_path'],
			
 
				+                "uid": video_obj['uid'],
			
 
				+                "title": kimi_title
			
 
				+            }
			
 
				+            response = await publishToPQ(params)
			
 
				+            print(response)
			
 
				+            time.sleep(2)
			
 
				+            obj = {
			
 
				+                "uid": video_obj['uid'],
			
 
				+                "source": video_obj['platform'],
			
 
				+                "kimiTitle": kimi_title,
			
 
				+                "videoId": response['data']['id'],
			
 
				+                "videoCover": response['data']['shareImgPath'],
			
 
				+                "videoPath": response['data']['videoPath'],
			
 
				+                "videoOss": video_obj['video_oss_path'].split("/")[-1]
			
 
				+            }
			
 
				+            L.append(obj)
			
 
				+        update_sql = f"""
			
 
				+        UPDATE {self.article_video}
			
 
				+        SET content_status = %s, response = %s
			
 
				+        WHERE trace_id = %s;
			
 
				+        """
			
 
				+        await self.mysql_client.asyncInsert(
			
 
				+            sql=update_sql,
			
 
				+            params=(2, json.dumps(L, ensure_ascii=False), trace_id)
			
 
				+        )
			
 
				+
			
 
				+    async def processTask(self, params):
			
 
				+        """
			
 
				+        处理任务
			
 
				+        :return:
			
 
				+        """
			
 
				+        gh_id = params['gh_id']
			
 
				+        flow_pool_level = params['flow_pool_level']
			
 
				+        content_id = params['content_id']
			
 
				+        trace_id = params['trace_id']
			
 
				+        download_videos = await self.getVideoList(content_id)
			
 
				+        if download_videos:
			
 
				+            kimi_title = await self.getKimiTitle(content_id)
			
 
				+            if kimi_title:
			
 
				+                await self.publishVideosToPq(
			
 
				+                    flow_pool_level=flow_pool_level,
			
 
				+                    kimi_title=kimi_title,
			
 
				+                    gh_id=gh_id,
			
 
				+                    trace_id=trace_id,
			
 
				+                    download_videos=download_videos
			
 
				+                )
			
 
				+            else:
			
 
				+                print("Kimi title 生成失败---后续加报警")
			
 
				+        else:
			
 
				+            print("该 content_id还未下载完成")
			
 
				+
			
 
				+    async def deal(self):
			
 
				+        """
			
 
				+        function
			
 
				+        :return:
			
 
				+        """
			
 
				+        task_list = await self.getTasks()
			
 
				+        if task_list:
			
 
				+            tasks = [self.processTask(params) for params in task_list]
			
 
				+            await asyncio.gather(*tasks)
			
 
				+        else:
			
 
				+            logging(
			
 
				+                code="9008",
			
 
				+                info="没有要处理的请求"
			
 
				+            )
			
--- a/tasks/spider_task.py
+++ b/tasks/spider_task.py
@@ -0,0 +1,244 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+"""
			
 
				+import asyncio
			
 
				+import json
			
 
				+
			
 
				+from applications.config import Config
			
 
				+from applications.functions.log import logging
			
 
				+from applications.spider import searchVideos
			
 
				+
			
 
				+
			
 
				+class spiderTask(object):
			
 
				+    """
			
 
				+    定时执行任务
			
 
				+    """
			
 
				+    C = Config()
			
 
				+
			
 
				+    def __init__(self, mysql_client):
			
 
				+        """
			
 
				+        :param mysql_client:
			
 
				+        """
			
 
				+        self.mysql_client = mysql_client
			
 
				+        self.article_video = self.C.articleVideos
			
 
				+        self.article_text = self.C.articleText
			
 
				+        self.article_video_crawler = self.C.articleCrawlerVideos
			
 
				+        self.spider_coroutines = self.C.getConfigValue("spiderCoroutines")
			
 
				+        self.gh_id_map = json.loads(self.C.getConfigValue("accountMap"))
			
 
				+
			
 
				+    async def getTask(self):
			
 
				+        """
			
 
				+        获取任务
			
 
				+        :return:
			
 
				+        """
			
 
				+        select_sql = f"""
			
 
				+            SELECT trace_id, content_id, gh_id, process_times
			
 
				+            FROM {self.article_video}
			
 
				+            WHERE content_status = 0 and process_times <= 3
			
 
				+            GROUP BY content_id
			
 
				+            LIMIT {self.spider_coroutines};
			
 
				+        """
			
 
				+        content_id_tuple = await self.mysql_client.asyncSelect(select_sql)
			
 
				+        if content_id_tuple:
			
 
				+            content_id_list = [i for i in list(content_id_tuple)]
			
 
				+            task_obj_list = [
			
 
				+                {
			
 
				+                    "trace_id": item[0],
			
 
				+                    "content_id": item[1],
			
 
				+                    "gh_id": item[2],
			
 
				+                    "process_times": item[3]
			
 
				+                } for item in content_id_list
			
 
				+            ]
			
 
				+            logging(
			
 
				+                code="9001",
			
 
				+                info="本次任务获取到 {} 条视频".format(len(task_obj_list)),
			
 
				+                data=task_obj_list
			
 
				+            )
			
 
				+            return task_obj_list
			
 
				+        else:
			
 
				+            return []
			
 
				+
			
 
				+    async def getHistoryVideos(self, content_id):
			
 
				+        """
			
 
				+        check whether the contents videos exists
			
 
				+        :param content_id:
			
 
				+        :return:
			
 
				+        """
			
 
				+        select_sql = f"""
			
 
				+            SELECT count(1)
			
 
				+            FROM {self.article_video_crawler}
			
 
				+            where content_id = '{content_id}' and download_status = 2;
			
 
				+        """
			
 
				+        content_videos = await self.mysql_client.asyncSelect(select_sql)
			
 
				+        videos_count = content_videos[0][0]
			
 
				+        if videos_count >= 3:
			
 
				+            return True
			
 
				+        else:
			
 
				+            return False
			
 
				+
			
 
				+    async def judgeContentProcessing(self, content_id):
			
 
				+        """
			
 
				+        判断该content_id是否在处理中
			
 
				+        :param content_id:
			
 
				+        :return:
			
 
				+        """
			
 
				+        select_sql = f"""
			
 
				+                       SELECT trace_id, content_status
			
 
				+                       FROM {self.article_video}
			
 
				+                       WHERE content_id = '{content_id}'
			
 
				+                       ORDER BY id DESC;
			
 
				+                   """
			
 
				+        result = await self.mysql_client.asyncSelect(select_sql)
			
 
				+        if result:
			
 
				+            for item in result:
			
 
				+                trace_id, content_status = item
			
 
				+                if content_status == 1:
			
 
				+                    return False
			
 
				+            return True
			
 
				+        else:
			
 
				+            return True
			
 
				+
			
 
				+    async def getKimiResult(self, content_id):
			
 
				+        """
			
 
				+        通过 content_id 获取kimi info
			
 
				+        :return:
			
 
				+        """
			
 
				+        select_sql = f"""
			
 
				+        select article_title, kimi_title, kimi_summary, kimi_keys, kimi_status
			
 
				+        from {self.article_text}
			
 
				+        where content_id = '{content_id}';
			
 
				+        """
			
 
				+        response = await self.mysql_client.asyncSelect(select_sql)
			
 
				+        if response:
			
 
				+            article_detail = response[0]
			
 
				+            if article_detail[4] == 1:
			
 
				+                result = {
			
 
				+                    "oriTitle": article_detail[0],
			
 
				+                    "kimiTitle": article_detail[1],
			
 
				+                    "kimiSummary": article_detail[2],
			
 
				+                    "kimiKeys": json.loads(article_detail[3]),
			
 
				+                    "kimiStatus": article_detail[4]
			
 
				+                }
			
 
				+            else:
			
 
				+                result = {
			
 
				+                    "kimiStatus": article_detail[4]
			
 
				+                }
			
 
				+            return result
			
 
				+        else:
			
 
				+            return
			
 
				+
			
 
				+    async def startProcess(self, params):
			
 
				+        """
			
 
				+        开始处理
			
 
				+        :param params:
			
 
				+        :return:
			
 
				+        """
			
 
				+        # 更新文章contentId为1， 说明该文章正在处理中
			
 
				+        kimi_result = await self.getKimiResult(content_id=params['content_id'])
			
 
				+        kimi_status = kimi_result['kimiStatus']
			
 
				+        match kimi_status:
			
 
				+            case 1:
			
 
				+                update_process_times_sql = f"""
			
 
				+                            UPDATE {self.article_video}
			
 
				+                            SET process_times = %s, content_status = %s
			
 
				+                            WHERE trace_id = %s;
			
 
				+                            """
			
 
				+                await self.mysql_client.asyncInsert(
			
 
				+                    sql=update_process_times_sql,
			
 
				+                    params=(
			
 
				+                        params['process_times'] + 1,
			
 
				+                        1,
			
 
				+                        params['trace_id']
			
 
				+                    )
			
 
				+                )
			
 
				+                try:
			
 
				+                    await searchVideos(
			
 
				+                        info={
			
 
				+                            "oriTitle": kimi_result['oriTitle'],
			
 
				+                            "kimiSummary": kimi_result['kimiSummary'],
			
 
				+                            "kimiKeys": kimi_result['kimiKeys'],
			
 
				+                            "traceId": params['trace_id'],
			
 
				+                            "ghId": params['gh_id'],
			
 
				+                            "contentId": params['content_id'],
			
 
				+                            "spider": self.article_video_crawler
			
 
				+                        },
			
 
				+                        ghIdMap=self.gh_id_map,
			
 
				+                        dbClient=self.mysql_client
			
 
				+                    )
			
 
				+                except Exception as e:
			
 
				+                    roll_back_status = f"""
			
 
				+                    UPDATE {self.article_video}
			
 
				+                    SET content_status = %s
			
 
				+                    WHERE trace_id = %s;
			
 
				+                    """
			
 
				+                    await self.mysql_client.asyncInsert(
			
 
				+                        sql=roll_back_status,
			
 
				+                        params=(
			
 
				+                            0,
			
 
				+                            params['trace_id']
			
 
				+                        )
			
 
				+                    )
			
 
				+                    print("处理失败，回退状态为 0")
			
 
				+            case 2:
			
 
				+                update_process_times_sql = f"""
			
 
				+                            UPDATE {self.article_video}
			
 
				+                            SET process_times = %s, content_status = %s
			
 
				+                            WHERE trace_id = %s;
			
 
				+                            """
			
 
				+                await self.mysql_client.asyncInsert(
			
 
				+                    sql=update_process_times_sql,
			
 
				+                    params=(
			
 
				+                        params['process_times'] + 1,
			
 
				+                        3,
			
 
				+                        params['trace_id']
			
 
				+                    )
			
 
				+                )
			
 
				+            case 0:
			
 
				+                print("kimi not ready")
			
 
				+
			
 
				+    async def processTask(self, params):
			
 
				+        """
			
 
				+        异步执行
			
 
				+        :param params:
			
 
				+        :return:
			
 
				+        """
			
 
				+        content_id = params['content_id']
			
 
				+        trace_id = params['trace_id']
			
 
				+        video_id_list = await self.getHistoryVideos(content_id=content_id)
			
 
				+        if video_id_list:
			
 
				+            # 说明已经存在了结果, 将该条记录下的video_id拿出来
			
 
				+            logging(
			
 
				+                code="9001",
			
 
				+                info="存在历史文章",
			
 
				+                trace_id=trace_id
			
 
				+            )
			
 
				+        else:
			
 
				+            flag = await self.judgeContentProcessing(content_id)
			
 
				+            if flag:
			
 
				+                logging(
			
 
				+                    code="9004",
			
 
				+                    info="无正在处理的文章ID， 开始处理",
			
 
				+                    trace_id=trace_id
			
 
				+                )
			
 
				+                await self.startProcess(params=params)
			
 
				+            else:
			
 
				+                logging(
			
 
				+                    code="9003",
			
 
				+                    info="该文章ID正在请求--文章ID {}".format(content_id),
			
 
				+                    trace_id=trace_id
			
 
				+                )
			
 
				+
			
 
				+    async def deal(self):
			
 
				+        """
			
 
				+        处理
			
 
				+        :return:
			
 
				+        """
			
 
				+        task_list = await self.getTask()
			
 
				+        if task_list:
			
 
				+            tasks = [self.processTask(params) for params in task_list]
			
 
				+            await asyncio.gather(*tasks)
			
 
				+        else:
			
 
				+            logging(
			
 
				+                code="9008",
			
 
				+                info="爬虫池没有要处理的请求"
			
 
				+            )
			
--- a/tasks/task1.py
+++ b/tasks/task1.py
@@ -1,347 +0,0 @@
 
				-"""
			
 
				-@author: luojunhui
			
 
				-"""
			
 
				-import asyncio
			
 
				-
			
 
				-from static.config import db_article, db_video
			
 
				-from applications.schedule import search_videos
			
 
				-from applications.functions.log import logging
			
 
				-from static.config import spider_coroutines
			
 
				-
			
 
				-
			
 
				-class MatchTask1(object):
			
 
				-    """
			
 
				-    定时执行任务
			
 
				-    """
			
 
				-
			
 
				-    def __init__(self, mysql_client):
			
 
				-        """
			
 
				-        :param mysql_client:
			
 
				-        """
			
 
				-        self.mysql_client = mysql_client
			
 
				-
			
 
				-    async def get_task(self):
			
 
				-        """
			
 
				-        获取任务
			
 
				-        :return:
			
 
				-        """
			
 
				-        select_sql1 = f"""
			
 
				-            SELECT DISTINCT (content_id)       
			
 
				-            FROM {db_article} 
			
 
				-            WHERE content_status = 0 and process_times <= 3
			
 
				-            ORDER BY request_time_stamp
			
 
				-            ASC
			
 
				-            LIMIT {spider_coroutines};
			
 
				-        """
			
 
				-        content_ids = await self.mysql_client.async_select(select_sql1)
			
 
				-        cil = []
			
 
				-        for content_id in content_ids:
			
 
				-            cil.append(content_id[0])
			
 
				-        content_ids_tuple = str(cil).replace("[", "(").replace("]", ")")
			
 
				-        if len(content_ids_tuple) > 3:
			
 
				-            select_sql = f"""
			
 
				-                SELECT trace_id, content_id, gh_id, article_title, article_text, content_status, process_times
			
 
				-                FROM {db_article} 
			
 
				-                WHERE content_id in {content_ids_tuple} and process_times <= 3 
			
 
				-                ORDER BY request_time_stamp
			
 
				-                ASC;
			
 
				-            """
			
 
				-            task_list = await self.mysql_client.async_select(sql=select_sql)
			
 
				-            task_obj_list = [
			
 
				-                {
			
 
				-                    "trace_id": item[0],
			
 
				-                    "content_id": item[1],
			
 
				-                    "gh_id": item[2],
			
 
				-                    "title": item[3],
			
 
				-                    "text": item[4],
			
 
				-                    "content_status": item[5],
			
 
				-                    "process_times": item[6]
			
 
				-                } for item in task_list
			
 
				-            ]
			
 
				-            logging(
			
 
				-                code="9001",
			
 
				-                info="本次任务获取到 {} 条视频".format(len(task_obj_list)),
			
 
				-                data=task_obj_list
			
 
				-            )
			
 
				-            return task_obj_list
			
 
				-        else:
			
 
				-            return []
			
 
				-
			
 
				-    async def get_history_videos(self, content_id):
			
 
				-        """
			
 
				-        check whether the contents videos exists
			
 
				-        :param content_id:
			
 
				-        :return:
			
 
				-        """
			
 
				-        select_sql = f"""
			
 
				-            SELECT video_id
			
 
				-            FROM {db_video}
			
 
				-            where content_id = '{content_id}' and video_status = 1 order by request_time DESC;
			
 
				-        """
			
 
				-        content_videos = await self.mysql_client.async_select(select_sql)
			
 
				-        videos = [vid for vid in content_videos]
			
 
				-        if len(videos) >= 3:
			
 
				-            return videos
			
 
				-        else:
			
 
				-            return None
			
 
				-
			
 
				-    async def judge_content_processing(self, content_id):
			
 
				-        """
			
 
				-        判断该content_id是否在处理中
			
 
				-        :param content_id:
			
 
				-        :return:
			
 
				-        """
			
 
				-        select_sql = f"""
			
 
				-                       SELECT trace_id, content_status
			
 
				-                       FROM {db_article}
			
 
				-                       WHERE content_id = '{content_id}'
			
 
				-                       ORDER BY id DESC;
			
 
				-                   """
			
 
				-        result = await self.mysql_client.async_select(select_sql)
			
 
				-        if result:
			
 
				-            for item in result:
			
 
				-                trace_id, content_status = item
			
 
				-                if content_status == 1:
			
 
				-                    return False
			
 
				-            return True
			
 
				-        else:
			
 
				-            return True
			
 
				-
			
 
				-    async def use_exists_contents_videos(self, video_id_list, params):
			
 
				-        """
			
 
				-        使用已经存在的视频id
			
 
				-        :return:
			
 
				-        """
			
 
				-        trace_id = params['trace_id']
			
 
				-        content_id = params['content_id']
			
 
				-        select_sql = f"""
			
 
				-            SELECT kimi_title
			
 
				-            FROM {db_article}
			
 
				-            WHERE content_id = '{content_id}' and kimi_title is not null limit 1;
			
 
				-        """
			
 
				-        info = await self.mysql_client.async_select(sql=select_sql)
			
 
				-        kimi_title = info[0]
			
 
				-        update_sql = f"""
			
 
				-            UPDATE {db_article}
			
 
				-            SET 
			
 
				-                kimi_title=%s,
			
 
				-                recall_video_id1=%s, 
			
 
				-                recall_video_id2=%s, 
			
 
				-                recall_video_id3=%s,
			
 
				-                content_status=%s,
			
 
				-                process_times = %s
			
 
				-            WHERE  trace_id = %s
			
 
				-        """
			
 
				-        vid1, vid2, vid3 = video_id_list[0], video_id_list[1], video_id_list[2]
			
 
				-        await self.mysql_client.async_insert(
			
 
				-            sql=update_sql,
			
 
				-            params=(
			
 
				-                kimi_title,
			
 
				-                video_id_list[0],
			
 
				-                "NULL" if vid2 is None else vid2,
			
 
				-                "NULL" if vid3 is None else vid3,
			
 
				-                2,
			
 
				-                int(params['process_times']) + 1,
			
 
				-                trace_id
			
 
				-            )
			
 
				-        )
			
 
				-        logging(
			
 
				-            code="9002",
			
 
				-            info="已从历史文章更新，文章id： {}".format(content_id),
			
 
				-            trace_id=trace_id
			
 
				-        )
			
 
				-
			
 
				-    async def start_process(self, params):
			
 
				-        """
			
 
				-        开始处理
			
 
				-        :param params:
			
 
				-        :return:
			
 
				-        """
			
 
				-        # 更新文章contentId为1， 说明该文章正在处理中
			
 
				-        update_sql = f"""
			
 
				-            UPDATE {db_article}
			
 
				-            SET 
			
 
				-                content_status = %s
			
 
				-            WHERE 
			
 
				-                trace_id = %s;
			
 
				-        """
			
 
				-        await self.mysql_client.async_insert(
			
 
				-            sql=update_sql,
			
 
				-            params=(
			
 
				-                1, params['trace_id']
			
 
				-            )
			
 
				-        )
			
 
				-        try:
			
 
				-            video_count = await search_videos(
			
 
				-                params={
			
 
				-                    "title": params['title'],
			
 
				-                    "content": params['text'],
			
 
				-                    "trace_id": params['trace_id'],
			
 
				-                    "content_id": params['content_id']
			
 
				-                },
			
 
				-                trace_id=params['trace_id'],
			
 
				-                gh_id=params['gh_id'],
			
 
				-                mysql_client=self.mysql_client
			
 
				-            )
			
 
				-            select_sql = f"""
			
 
				-                SELECT video_id
			
 
				-                FROM {db_video}
			
 
				-                WHERE content_id = '{params['content_id']}'
			
 
				-            """
			
 
				-            result = await self.mysql_client.async_select(sql=select_sql)
			
 
				-            vid1, vid2, vid3 = result[0], result[1], result[2]
			
 
				-            if vid1 or vid2 or vid3:
			
 
				-                update_sql2 = f"""
			
 
				-                    UPDATE {db_article}
			
 
				-                    SET
			
 
				-                        recall_video_id1 = %s,
			
 
				-                        recall_video_id2 = %s,
			
 
				-                        recall_video_id3 = %s,
			
 
				-                        content_status = %s,
			
 
				-                        process_times = %s
			
 
				-                        WHERE trace_id = %s;
			
 
				-                """
			
 
				-                await self.mysql_client.async_insert(
			
 
				-                    sql=update_sql2,
			
 
				-                    params=(
			
 
				-                        vid1 if vid1 else "NULL",
			
 
				-                        vid2 if vid2 else "NULL",
			
 
				-                        vid3 if vid3 else "NULL",
			
 
				-                        2,
			
 
				-                        {int(params['process_times']) + 1},
			
 
				-                        params['trace_id']
			
 
				-                    )
			
 
				-                )
			
 
				-                logging(
			
 
				-                    code="9008",
			
 
				-                    info="视频搜索成功， 状态修改为2",
			
 
				-                    trace_id=params['trace_id']
			
 
				-                )
			
 
				-            else:
			
 
				-                if int(params['process_times']) < 3:
			
 
				-                    update_sql3 = f"""
			
 
				-                        UPDATE {db_article}
			
 
				-                        SET 
			
 
				-                           content_status = %s,
			
 
				-                           process_times = %s
			
 
				-                        WHERE trace_id = %s;
			
 
				-                                    """
			
 
				-                    await self.mysql_client.async_insert(
			
 
				-                        sql=update_sql3,
			
 
				-                        params=(0, int(params['process_times']) + 1, params['trace_id'])
			
 
				-                    )
			
 
				-                    logging(
			
 
				-                        code="9018",
			
 
				-                        info="视频搜索失败，回退状态为0",
			
 
				-                        trace_id=params['trace_id']
			
 
				-                    )
			
 
				-                else:
			
 
				-                    update_sql3 = f"""
			
 
				-                        UPDATE {db_article}
			
 
				-                        SET 
			
 
				-                           content_status = %s,
			
 
				-                           process_times = %s
			
 
				-                        WHERE trace_id = %s;
			
 
				-                                    """
			
 
				-                    await self.mysql_client.async_insert(
			
 
				-                        sql=update_sql3,
			
 
				-                        params=(3, int(params['process_times']) + 1, params['trace_id'])
			
 
				-                    )
			
 
				-                    logging(
			
 
				-                        code="9019",
			
 
				-                        info="视频多次搜索失败，状态修改为3",
			
 
				-                        trace_id=params['trace_id']
			
 
				-                    )
			
 
				-        except Exception as e:
			
 
				-            if int(params['process_times']) < 3:
			
 
				-                logging(
			
 
				-                    code="9018",
			
 
				-                    info="{}异常错误:{}， 回退状态为0".format(params['trace_id'], e),
			
 
				-                    trace_id=params['trace_id']
			
 
				-                )
			
 
				-                update_sql4 = f"""
			
 
				-                    UPDATE {db_article}
			
 
				-                    SET
			
 
				-                       content_status = %s,
			
 
				-                       process_times = %s
			
 
				-                    WHERE trace_id = %s;
			
 
				-                """
			
 
				-                await self.mysql_client.async_insert(
			
 
				-                    sql=update_sql4,
			
 
				-                    params=(0, int(params['process_times']) + 1, params['trace_id'])
			
 
				-                )
			
 
				-            else:
			
 
				-                logging(
			
 
				-                    code="9019",
			
 
				-                    info="{}异常错误:{}, 状态修改为3".format(params['trace_id'], e),
			
 
				-                    trace_id=params['trace_id']
			
 
				-                )
			
 
				-                update_sql4 = f"""
			
 
				-                                    UPDATE {db_article}
			
 
				-                                    SET
			
 
				-                                       content_status = %s,
			
 
				-                                       process_times = %s
			
 
				-                                    WHERE trace_id = %s;
			
 
				-                                """
			
 
				-                await self.mysql_client.async_insert(
			
 
				-                    sql=update_sql4,
			
 
				-                    params=(3, int(params['process_times']) + 1, params['trace_id'])
			
 
				-                )
			
 
				-
			
 
				-    async def process_task(self, params):
			
 
				-        """
			
 
				-        异步执行
			
 
				-        :param params:
			
 
				-        :return:
			
 
				-        """
			
 
				-        content_id = params['content_id']
			
 
				-        trace_id = params['trace_id']
			
 
				-        # 判断该篇文章是否存在未下架的视频，且判断是否有3条， 如果没有三条，则启动新抓取任务，后续优化点
			
 
				-        video_id_list = await self.get_history_videos(content_id=content_id)
			
 
				-        if video_id_list:
			
 
				-            # 说明已经存在了结果, 将该条记录下的video_id拿出来
			
 
				-            logging(
			
 
				-                code="9001",
			
 
				-                info="存在历史文章",
			
 
				-                trace_id=trace_id
			
 
				-            )
			
 
				-            # await self.use_exists_contents_videos(video_id_list=video_id_list, params=params)
			
 
				-        else:
			
 
				-            flag = await self.judge_content_processing(content_id)
			
 
				-            if flag:
			
 
				-                logging(
			
 
				-                    code="9004",
			
 
				-                    info="无正在处理的文章ID， 开始处理",
			
 
				-                    trace_id=trace_id
			
 
				-                )
			
 
				-                await self.start_process(params=params)
			
 
				-            else:
			
 
				-                logging(
			
 
				-                    code="9003",
			
 
				-                    info="该文章ID正在请求--文章ID {}".format(content_id),
			
 
				-                    trace_id=trace_id
			
 
				-                )
			
 
				-
			
 
				-    async def deal(self):
			
 
				-        """
			
 
				-        处理
			
 
				-        :return:
			
 
				-        """
			
 
				-        task_list = await self.get_task()
			
 
				-        task_dict = {}
			
 
				-        for task in task_list:
			
 
				-            key = task['content_id']
			
 
				-            task_dict[key] = task
			
 
				-        process_list = []
			
 
				-        for item in task_dict:
			
 
				-            process_list.append(task_dict[item])
			
 
				-        if process_list:
			
 
				-            # for task in task_list:
			
 
				-            #     await self.process_task(task)
			
 
				-            tasks = [self.process_task(params) for params in process_list]
			
 
				-            await asyncio.gather(*tasks)
			
 
				-        else:
			
 
				-            logging(
			
 
				-                code="9008",
			
 
				-                info="没有要处理的请求"
			
 
				-            )
			
--- a/test_code/SPIDER/baidu.py
+++ b/test_code/SPIDER/baidu.py
@@ -0,0 +1,132 @@
 
				+"""
			
 
				+@author: luojunhui
			
 
				+好看视频搜索爬虫
			
 
				+"""
			
 
				+import json
			
 
				+import time
			
 
				+import base64
			
 
				+import hashlib
			
 
				+import requests
			
 
				+import urllib.parse
			
 
				+from uuid import uuid4
			
 
				+from fake_useragent import FakeUserAgent
			
 
				+
			
 
				+from applications.functions.common import sensitive_flag
			
 
				+
			
 
				+
			
 
				+def tunnel_proxies():
			
 
				+    """
			
 
				+    快代理
			
 
				+    :return:
			
 
				+    """
			
 
				+    # 隧道域名:端口号
			
 
				+    tunnel = "l901.kdltps.com:15818"
			
 
				+
			
 
				+    # 用户名密码方式
			
 
				+    username = "t11983523373311"
			
 
				+    password = "mtuhdr2z"
			
 
				+    proxies = {
			
 
				+        "http": "http://%(user)s:%(pwd)s@%(proxy)s/" % {"user": username, "pwd": password, "proxy": tunnel},
			
 
				+        "https": "http://%(user)s:%(pwd)s@%(proxy)s/" % {"user": username, "pwd": password, "proxy": tunnel}
			
 
				+    }
			
 
				+    return proxies
			
 
				+
			
 
				+
			
 
				+def get_video_detail(video_id):
			
 
				+    """
			
 
				+    获取好看视频的视频链接
			
 
				+    :param video_id:
			
 
				+    :return:
			
 
				+    """
			
 
				+    url = "https://haokan.baidu.com/v"
			
 
				+    params = {
			
 
				+        'vid': video_id,
			
 
				+        '_format': 'json'
			
 
				+    }
			
 
				+
			
 
				+    base_64_string = base64.b64encode(str(uuid4()).encode()).decode()
			
 
				+    headers = {
			
 
				+        'Accept': '*/*',
			
 
				+        'cookie': "BIDUPSID={}".format(base_64_string),
			
 
				+        'Accept-Language': 'en,zh;q=0.9,zh-CN;q=0.8',
			
 
				+        'Cache-Control': 'no-cache',
			
 
				+        'Connection': 'keep-alive',
			
 
				+        'Content-Type': 'application/x-www-form-urlencoded',
			
 
				+        'Referer': 'https://haokan.baidu.com',
			
 
				+        'User-Agent': FakeUserAgent().chrome,
			
 
				+    }
			
 
				+    response = requests.request(
			
 
				+        "GET",
			
 
				+        url,
			
 
				+        headers=headers,
			
 
				+        params=params,
			
 
				+        proxies=tunnel_proxies()
			
 
				+    ).json()
			
 
				+    time.sleep(2)
			
 
				+    return response['data']['apiData']['curVideoMeta']
			
 
				+
			
 
				+
			
 
				+def hksp_search(key, sensitive_words, trace_id):
			
 
				+    """
			
 
				+    好看视频搜索爬虫
			
 
				+    """
			
 
				+    timestamp_seconds = time.time()
			
 
				+    timestamp_milliseconds = int(timestamp_seconds * 1000)
			
 
				+    url = 'https://haokan.baidu.com/haokan/ui-search/pc/search/video'
			
 
				+    # 定义请求的参数
			
 
				+    strings = "{}_{}_{}_{}_{}".format(1, urllib.parse.quote(key), 10, timestamp_milliseconds, 1)
			
 
				+    sign = hashlib.md5(strings.encode()).hexdigest()
			
 
				+    params = {
			
 
				+        'pn': 1,
			
 
				+        'rn': 10,
			
 
				+        'type': 'video',
			
 
				+        'query': key,
			
 
				+        'sign': sign,
			
 
				+        'version': 1,
			
 
				+        'timestamp': timestamp_milliseconds
			
 
				+    }
			
 
				+    # 定义请求头
			
 
				+    base_64_string = base64.b64encode(str(uuid4()).encode()).decode()
			
 
				+    headers = {
			
 
				+        'authority': 'haokan.baidu.com',
			
 
				+        'accept': '*/*',
			
 
				+        'accept-language': 'zh,en;q=0.9,zh-CN;q=0.8',
			
 
				+        'cookie': "BIDUPSID={}".format(base_64_string),
			
 
				+        'user-agent': FakeUserAgent().chrome,
			
 
				+        'x-requested-with': 'xmlhttprequest',
			
 
				+    }
			
 
				+    # 发送GET请求
			
 
				+    try:
			
 
				+        response = requests.get(
			
 
				+            url,
			
 
				+            headers=headers,
			
 
				+            params=params,
			
 
				+            proxies=tunnel_proxies(),
			
 
				+            timeout=120
			
 
				+        ).json()
			
 
				+        data_list = response['data']['list']
			
 
				+        L = []
			
 
				+        for data in data_list:
			
 
				+            try:
			
 
				+                video_id = data['vid']
			
 
				+                title = data['title']
			
 
				+                duration = int(data['duration'].split(":")[0]) * 60 + int(data['duration'].split(":")[1])
			
 
				+                if sensitive_flag(sensitive_words, title) and int(duration) <= 300:
			
 
				+                    res = get_video_detail(video_id)
			
 
				+                    L.append(res)
			
 
				+                    return L
			
 
				+                else:
			
 
				+                    continue
			
 
				+            except Exception as e:
			
 
				+                pass
			
 
				+
			
 
				+        return L
			
 
				+    except Exception as e:
			
 
				+        print(e)
			
 
				+        return []
			
 
				+
			
 
				+
			
 
				+if __name__ == '__main__':
			
 
				+    res = hksp_search("90岁上海大爷征婚", sensitive_words=[], trace_id="testId")
			
 
				+    for item in res:
			
 
				+        print(json.dumps(item, ensure_ascii=False, indent=4))