schedule.py 3.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128
  1. """
  2. 定时任务相关数据库操作
  3. demand_content: 原始检索内容库
  4. demand_find_task: 执行记录表,通过 demand_content_id 关联
  5. """
  6. import logging
  7. from typing import Any, Dict, Optional
  8. from .connection import get_connection
  # Module-level logger shared by every helper in this file.
  logger = logging.getLogger(__name__)
  # Status codes (kept in sync with the demand_find_task table).
  STATUS_PENDING = 0  # waiting to be executed
  STATUS_RUNNING = 1  # currently executing
  STATUS_SUCCESS = 2  # finished successfully
  STATUS_FAILED = 3  # finished with a failure
  def get_next_unprocessed_demand() -> Optional[Dict[str, Any]]:
      """
      Fetch the unprocessed demand_content row with the smallest id.

      A demand_content row counts as unprocessed when demand_find_task holds no
      record for its id whose status is pending (0), running (1) or success (2).
      Rows with no task at all, or with only failed tasks, are therefore eligible.

      NOTE(review): ordering is by dc.id, not by a creation timestamp; this
      presumably equals "earliest created" only if ids are assigned
      monotonically -- confirm against the schema.

      Returns:
          {"demand_content_id": int, "query": str} (query is dc.name), or None
          when no row qualifies. Assumes the cursor yields rows that dict()
          can convert -- TODO confirm the cursor class used by get_connection().

      Raises:
          Exception: any error from connecting or querying is logged and
          re-raised unchanged.
      """
      query = """
          SELECT dc.id AS demand_content_id,
                 dc.name AS query
          FROM demand_content dc
          WHERE NOT EXISTS (
              SELECT 1 FROM demand_find_task t
              WHERE t.demand_content_id = dc.id AND t.status IN (%s, %s, %s)
          )
          ORDER BY dc.id ASC
          LIMIT 1
      """
      connection = None
      try:
          connection = get_connection()
          with connection.cursor() as cursor:
              # Any task in one of these states marks the demand as already handled.
              blocking_statuses = (STATUS_PENDING, STATUS_RUNNING, STATUS_SUCCESS)
              cursor.execute(query, blocking_statuses)
              record = cursor.fetchone()
              if not record:
                  return None
              return dict(record)
      except Exception as e:
          # logger.exception logs at ERROR level with the traceback attached.
          logger.exception(f"get_next_unprocessed_demand 失败: {e}")
          raise
      finally:
          # Always release the connection, whether the query succeeded or not.
          if connection:
              connection.close()
  def create_task_record(demand_content_id: int, trace_id: str = "", status: int = STATUS_PENDING) -> None:
      """
      Insert one new row into demand_find_task.

      trace_id may be left as the empty string at creation time; it is filled
      in later through update_task_on_complete once the task has finished.

      Args:
          demand_content_id: id of the demand_content row the task belongs to.
          trace_id: trace identifier of the run, or "" as a placeholder.
          status: initial status code; defaults to STATUS_PENDING.

      Raises:
          Exception: any error from connecting, inserting or committing is
          logged and re-raised unchanged.
      """
      sql = """
          INSERT INTO demand_find_task (trace_id, demand_content_id, status)
          VALUES (%s, %s, %s)
      """
      conn = None
      try:
          conn = get_connection()
          with conn.cursor() as cur:
              cur.execute(sql, (trace_id, demand_content_id, status))
          # DB-API connections roll back uncommitted work on close(), so commit
          # explicitly; this is a harmless no-op if the connection autocommits.
          conn.commit()
          logger.info(f"创建任务记录: demand_content_id={demand_content_id}")
      except Exception as e:
          logger.error(f"create_task_record 失败: {e}", exc_info=True)
          raise
      finally:
          # Always release the connection, whether the insert succeeded or not.
          if conn:
              conn.close()
  def update_task_on_complete(demand_content_id: int, trace_id: str, status: int) -> None:
      """
      Fill in trace_id and status on the placeholder task row(s) of a demand.

      Only rows whose trace_id is still the empty string (the placeholder
      written at creation time) are matched; every such row for the given
      demand_content_id is updated.

      Args:
          demand_content_id: id of the demand_content row the task belongs to.
          trace_id: trace identifier to store on the row.
          status: final status code to store on the row.

      Raises:
          Exception: any error from connecting, updating or committing is
          logged and re-raised unchanged.
      """
      sql = """
          UPDATE demand_find_task
          SET trace_id = %s, status = %s
          WHERE demand_content_id = %s AND trace_id = ''
      """
      conn = None
      try:
          conn = get_connection()
          with conn.cursor() as cur:
              cur.execute(sql, (trace_id, status, demand_content_id))
          # DB-API connections roll back uncommitted work on close(), so commit
          # explicitly; this is a harmless no-op if the connection autocommits.
          conn.commit()
          logger.info(f"更新任务完成: demand_content_id={demand_content_id}, trace_id={trace_id}, status={status}")
      except Exception as e:
          logger.error(f"update_task_on_complete 失败: {e}", exc_info=True)
          raise
      finally:
          # Always release the connection, whether the update succeeded or not.
          if conn:
              conn.close()
  def update_task_status(trace_id: str, demand_content_id: int, status: int) -> None:
      """
      Set the status of the demand_find_task row(s) matching trace_id and demand_content_id.

      trace_id may be the empty string (the task has not returned yet), in
      which case the placeholder row(s) of demand_content_id are the ones
      matched.

      Args:
          trace_id: trace identifier of the row, or "" for the placeholder.
          demand_content_id: id of the demand_content row the task belongs to.
          status: new status code to store.

      Raises:
          Exception: any error from connecting, updating or committing is
          logged and re-raised unchanged.
      """
      sql = """
          UPDATE demand_find_task
          SET status = %s
          WHERE trace_id = %s AND demand_content_id = %s
      """
      conn = None
      try:
          conn = get_connection()
          with conn.cursor() as cur:
              cur.execute(sql, (status, trace_id, demand_content_id))
          # DB-API connections roll back uncommitted work on close(), so commit
          # explicitly; this is a harmless no-op if the connection autocommits.
          conn.commit()
          logger.info(f"更新任务状态: trace_id={trace_id}, demand_content_id={demand_content_id}, status={status}")
      except Exception as e:
          logger.error(f"update_task_status 失败: {e}", exc_info=True)
          raise
      finally:
          # Always release the connection, whether the update succeeded or not.
          if conn:
              conn.close()