publish_single_video_pool_videos.py 3.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112
  1. import datetime
  2. from pymysql.cursors import DictCursor
  3. from applications import bot, aiditApi
  4. from applications.db import DatabaseConnector
  5. from config import long_articles_config
  6. generate_plan_map = {
  7. "gzh": "20250320072903157918565",
  8. "sph": "20250320111354709330323",
  9. "toutiao": "20250320111012643367248",
  10. "hksp": "20250320111324346478697",
  11. }
  12. platform_name_map = {
  13. "gzh": "公众号",
  14. "sph": "视频号",
  15. "toutiao": "头条号",
  16. "hksp": "好看视频",
  17. }
  18. class PublishSingleVideoPoolVideos:
  19. def __init__(self):
  20. self.db_client = DatabaseConnector(db_config=long_articles_config)
  21. self.db_client.connect()
  22. def get_task_list(self, platform:str) -> list[dict]:
  23. match platform:
  24. case "sph":
  25. task_count = 218
  26. case "gzh":
  27. task_count = 201
  28. case "toutiao":
  29. task_count = 411
  30. case "hksp":
  31. task_count = 165
  32. case _:
  33. return []
  34. fetch_query = f"""
  35. select id, content_trace_id, pq_vid
  36. from single_video_transform_queue
  37. where status = 0 and platform = '{platform}'
  38. order by score desc
  39. """
  40. fetch_response = self.db_client.fetch(query=fetch_query, cursor_type=DictCursor)
  41. return fetch_response
  42. def update_tasks_status(self,
  43. task_id_tuple: tuple,
  44. ori_status: int,
  45. new_status: int)-> int:
  46. update_query = f"""
  47. update single_video_transform_queue
  48. set status = %s
  49. where id in %s and status = %s;
  50. """
  51. affected_rows = self.db_client.save(
  52. query=update_query,
  53. params=(new_status, task_id_tuple, ori_status)
  54. )
  55. return affected_rows
  56. def deal(self):
  57. """
  58. entrance of this class
  59. """
  60. platform_list = ["sph", "gzh", "toutiao", "hksp"]
  61. for platform in platform_list:
  62. task_list = self.get_task_list(platform)
  63. task_id_tuple = tuple([task['id'] for task in task_list])
  64. vid_list = [task['pq_vid'] for task in task_list]
  65. if vid_list:
  66. # create video crawler plan
  67. plan_name = f"{platform_name_map[platform]}-历史数据-视频数量: {len(vid_list)}"
  68. crawler_plan_response = aiditApi.auto_create_single_video_crawler_task(
  69. plan_name=plan_name,
  70. plan_tag="单视频供给冷启动",
  71. video_id_list=vid_list,
  72. )
  73. crawler_plan_id = crawler_plan_response["data"]["id"]
  74. crawler_plan_name = crawler_plan_response["data"]["name"]
  75. # update status
  76. self.update_tasks_status(
  77. task_id_tuple=task_id_tuple,
  78. ori_status=0,
  79. new_status=1,
  80. )
  81. # bind crawler plan to generate plan
  82. crawler_task_list = [
  83. {
  84. "contentType": 1,
  85. "inputSourceModal": 4,
  86. "inputSourceChannel": 10,
  87. "inputSourceType": 2,
  88. "inputSourceValue": crawler_plan_id,
  89. "inputSourceSubType": None,
  90. "fieldName": None,
  91. "inputSourceLabel": "原始帖子-视频-票圈小程序-内容添加计划-{}".format(crawler_plan_name),
  92. }
  93. ]
  94. generate_plan_id = generate_plan_map[platform]
  95. aiditApi.bind_crawler_task_to_generate_task(
  96. crawler_task_list=crawler_task_list,
  97. generate_task_id=generate_plan_id,
  98. )
  99. if __name__ == '__main__':
  100. task = PublishSingleVideoPoolVideos()
  101. task.deal()