publish_single_video_pool_videos.py 3.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107
  1. import datetime
  2. from pymysql.cursors import DictCursor
  3. from applications import bot, aiditApi
  4. from applications.db import DatabaseConnector
  5. from config import long_articles_config
  6. generate_plan_map = {
  7. "gzh": "20250320072903157918565",
  8. "sph": "20250320111354709330323",
  9. "toutiao": "20250320111012643367248",
  10. "hksp": "20250320111324346478697",
  11. }
  12. platform_name_map = {
  13. "gzh": "公众号",
  14. "sph": "视频号",
  15. "toutiao": "头条号",
  16. "hksp": "好看视频",
  17. }
  18. class PublishSingleVideoPoolVideos:
  19. def __init__(self):
  20. self.db_client = DatabaseConnector(db_config=long_articles_config)
  21. self.db_client.connect()
  22. def get_task_list(self, platform:str) -> list[dict]:
  23. match platform:
  24. case "sph":
  25. task_count = 218
  26. case "gzh":
  27. task_count = 201
  28. case "toutiao":
  29. task_count = 411
  30. case "hksp":
  31. task_count = 165
  32. case _:
  33. return []
  34. fetch_query = f"""
  35. select id, content_trace_id, pq_vid
  36. from single_video_transform_queue
  37. where status = 0 and platform = '{platform}'
  38. order by score desc
  39. limit 2000
  40. """
  41. fetch_response = self.db_client.fetch(query=fetch_query, cursor_type=DictCursor)
  42. return fetch_response
  43. def update_tasks_status(self,
  44. task_id_tuple: tuple,
  45. ori_status: int,
  46. new_status: int)-> int:
  47. update_query = f"""
  48. update single_video_transform_queue
  49. set status = %s
  50. where id in %s and status = %s;
  51. """
  52. affected_rows = self.db_client.save(
  53. query=update_query,
  54. params=(new_status, task_id_tuple, ori_status)
  55. )
  56. return affected_rows
    def deal(self):
        """
        Entry point of this class.

        For each platform ("sph", "gzh", "toutiao", "hksp"), in that order:

        1. fetch the pending rows via ``get_task_list``;
        2. if any were found, create a crawler plan holding their ``pq_vid``
           values;
        3. move those rows from status 0 to status 1;
        4. bind the new crawler plan to the platform's generate plan taken
           from ``generate_plan_map``.

        Platforms with no pending rows are skipped by the ``if vid_list`` check.
        """
        platform_list = ["sph", "gzh", "toutiao", "hksp"]
        for platform in platform_list:
            task_list = self.get_task_list(platform)
            # ids drive the status update; pq_vid values go into the crawler plan
            task_id_tuple = tuple([task['id'] for task in task_list])
            vid_list = [task['pq_vid'] for task in task_list]
            if vid_list:
                # create video crawler plan
                # plan name: <platform display name>-<today's date>-视频数量: <count>
                plan_name = f"{platform_name_map[platform]}-{datetime.datetime.today().strftime('%Y-%m-%d')}-视频数量: {len(vid_list)}"
                crawler_plan_response = aiditApi.auto_create_single_video_crawler_task(
                    plan_name=plan_name,
                    plan_tag="单视频供给冷启动",
                    video_id_list=vid_list,
                )
                # assumes the response is a mapping with data.id and data.name;
                # any other shape raises here, before any row is updated
                # -- TODO confirm what the API returns on failure
                crawler_plan_id = crawler_plan_response["data"]["id"]
                crawler_plan_name = crawler_plan_response["data"]["name"]

                # update status
                # presumably 0 = pending and 1 = published -- confirm against the table schema
                # NOTE(review): rows are flipped before the bind call below, so
                # a failed bind leaves them at status 1 without a bound plan
                self.update_tasks_status(
                    task_id_tuple=task_id_tuple,
                    ori_status=0,
                    new_status=1,
                )

                # bind crawler plan to generate plan
                # the numeric fields are fixed codes expected by the API;
                # their meaning is not visible in this file
                crawler_task_list = [
                    {
                        "contentType": 1,
                        "inputSourceModal": 4,
                        "inputSourceChannel": 10,
                        "inputSourceType": 2,
                        "inputSourceValue": crawler_plan_id,
                        "inputSourceSubType": None,
                        "fieldName": None,
                        "inputSourceLabel": "原始帖子-视频-票圈小程序-内容添加计划-{}".format(crawler_plan_name),
                    }
                ]
                generate_plan_id = generate_plan_map[platform]
                aiditApi.bind_crawler_task_to_generate_task(
                    crawler_task_list=crawler_task_list,
                    generate_task_id=generate_plan_id,
                )