run_evaluate.py 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298
#!/usr/bin/env python
# -*- coding: utf-8 -*-
"""
Exercise the EvaluateWorkflow feature.

Creates test data and verifies that the evaluation workflow works.
"""
import json
import sys
from pathlib import Path

# Put the project root (the parent of this file's directory) at the front of
# sys.path; presumably this is what lets the ``src.*`` imports below resolve
# when the file is run directly as a script.
project_root = Path(__file__).parent.parent
sys.path.insert(0, str(project_root))

from src.models import get_db, DecodeVideo, DecodeStatus, EvaluateRecord, EvaluateStatus
from src.workflows.evaluate_workflow import EvaluateWorkflow
from src.utils.logger import get_logger

# Module-level logger shared by every function in this script.
logger = get_logger(__name__)
  17. def create_test_decode_video(task_id: int, video_id: str = "test_video_001") -> DecodeVideo:
  18. """创建测试用的 DecodeVideo 记录"""
  19. # 创建模拟的解构结果
  20. decode_result_v2 = {
  21. "视频信息": {
  22. "标题": "🔴退伍军人二次入伍的感人画面!若有战,召必回",
  23. "视频URL": "https://rescdn.yishihui.com/pipeline/video/f522fd33-1556-4928-ab5a-c5afdd3c9688.mp4",
  24. "正文": ""
  25. },
  26. "三点解构": {
  27. "灵感点": [
  28. {
  29. "候选编号": 1,
  30. "分类": "亲情告别",
  31. "灵感点": "父亲亲吻熟睡的婴儿",
  32. "描述": "视频开头,一位身着便装、背着行囊的男子,在即将离家前,深情地俯身亲吻床上熟睡的小婴儿,并温柔地为其盖好被子,眼中充满不舍。"
  33. }
  34. ],
  35. "目的点": {
  36. "perspective": "创作者视角",
  37. "purposes": [
  38. {
  39. "维度": {
  40. "一级分类": "个人",
  41. "二级分类": "分享"
  42. },
  43. "目的点": "展现军人告别与家人不舍的感人瞬间",
  44. "描述": "创作者通过剪辑多位军人在入伍或归队前与亲人进行告别的场景,着重刻画了军人坚毅与亲人依依不舍的复杂情感。"
  45. }
  46. ]
  47. },
  48. "关键点": {
  49. "key_points": [
  50. {
  51. "候选编号": 1,
  52. "维度大类": "实质",
  53. "维度细分": "元素",
  54. "关键点": "军人发型数字'2'",
  55. "描述": "军人头部的理发造型中,清晰可见数字'2',象征着'二次入伍'的身份。"
  56. }
  57. ]
  58. }
  59. },
  60. "选题理解": {
  61. "核心主题": "军人二次入伍与家人告别",
  62. "目标受众": "关注军人生活、家国情怀的观众",
  63. "情感基调": "感人、不舍、家国情怀"
  64. }
  65. }
  66. # 创建 DecodeVideo 记录
  67. decode_video = DecodeVideo.create(
  68. task_id=task_id,
  69. video_id=video_id,
  70. status=DecodeStatus.SUCCESS,
  71. decode_result_v2=json.dumps(decode_result_v2, ensure_ascii=False)
  72. )
  73. return decode_video
  74. def create_test_evaluate_record(evaluate_id: int, task_id: int) -> EvaluateRecord:
  75. """创建测试用的 EvaluateRecord 记录"""
  76. evaluate_record = EvaluateRecord.create(
  77. evaluate_id=evaluate_id,
  78. task_id=task_id,
  79. status=EvaluateStatus.PENDING
  80. )
  81. return evaluate_record
  82. def create_test_search_result() -> list:
  83. """创建测试用的待评估视频列表"""
  84. search_result = [
  85. {
  86. "video_id": "61626151",
  87. "video_url": "https://rescdn.yishihui.com/pipeline/video/f522fd33-1556-4928-ab5a-c5afdd3c9688.mp4",
  88. "title": "🔴退伍军人二次入伍的感人画面!若有战,召必回"
  89. },
  90. {
  91. "video_id": "61626152",
  92. "video_url": "https://rescdn.yishihui.com/pipeline/video/example1.mp4",
  93. "title": "军人告别家人的感人瞬间"
  94. },
  95. {
  96. "video_id": "61626153",
  97. "video_url": "https://rescdn.yishihui.com/pipeline/video/example2.mp4",
  98. "title": "二次入伍军人的家国情怀"
  99. },
  100. {
  101. "video_id": "61626154",
  102. "video_url": "https://rescdn.yishihui.com/pipeline/video/example3.mp4",
  103. "title": "美食制作教程:如何做红烧肉"
  104. },
  105. {
  106. "video_id": "61626155",
  107. "video_url": "https://rescdn.yishihui.com/pipeline/video/example4.mp4",
  108. "title": "旅行vlog:探索美丽的风景"
  109. }
  110. ]
  111. return search_result
  112. def setup_test_data(task_id: int, evaluate_id: int, video_id: str = "test_video_001"):
  113. """设置测试数据(创建数据库记录)"""
  114. logger.info("=== 开始设置测试数据 ===")
  115. db = next(get_db())
  116. try:
  117. # 检查是否已存在记录
  118. existing_decode = db.query(DecodeVideo).filter_by(task_id=task_id).first()
  119. if existing_decode:
  120. logger.info(f"DecodeVideo 记录已存在: task_id={task_id},将删除后重新创建")
  121. db.delete(existing_decode)
  122. db.commit()
  123. existing_evaluate = db.query(EvaluateRecord).filter_by(evaluate_id=evaluate_id).first()
  124. if existing_evaluate:
  125. logger.info(f"EvaluateRecord 记录已存在: evaluate_id={evaluate_id},将删除后重新创建")
  126. db.delete(existing_evaluate)
  127. db.commit()
  128. # 创建 DecodeVideo 记录
  129. decode_video = create_test_decode_video(task_id, video_id)
  130. db.add(decode_video)
  131. logger.info(f"✓ 创建 DecodeVideo 记录: task_id={task_id}, video_id={video_id}")
  132. # 创建 EvaluateRecord 记录
  133. evaluate_record = create_test_evaluate_record(evaluate_id, task_id)
  134. db.add(evaluate_record)
  135. logger.info(f"✓ 创建 EvaluateRecord 记录: evaluate_id={evaluate_id}, task_id={task_id}")
  136. db.commit()
  137. logger.info("✓ 测试数据设置完成")
  138. except Exception as e:
  139. logger.error(f"设置测试数据失败: {e}", exc_info=True)
  140. db.rollback()
  141. raise
  142. finally:
  143. db.close()
  144. def test_evaluate_workflow(task_id: int, evaluate_id: int):
  145. """测试评估工作流"""
  146. logger.info("=== 开始测试评估工作流 ===")
  147. # 创建待评估的视频列表
  148. search_result = create_test_search_result()
  149. logger.info(f"待评估视频数量: {len(search_result)}")
  150. # 准备输入数据
  151. input_data = {
  152. "task_id": task_id,
  153. "evaluate_id": evaluate_id,
  154. "search_result": search_result
  155. }
  156. logger.info(f"输入数据: task_id={task_id}, evaluate_id={evaluate_id}, search_result数量={len(search_result)}")
  157. # 创建并执行工作流
  158. try:
  159. workflow = EvaluateWorkflow(model_provider="google_genai")
  160. result = workflow.invoke(input_data)
  161. logger.info("=== 工作流执行结果 ===")
  162. logger.info(f"工作流状态: {result.get('workflow_status')}")
  163. if result.get("error"):
  164. logger.error(f"工作流执行错误: {result.get('error')}")
  165. return result
  166. evaluate_result = result.get("evaluate_result", [])
  167. logger.info(f"评估结果数量: {len(evaluate_result)}")
  168. # 打印评估结果详情
  169. if evaluate_result:
  170. logger.info("\n=== 评估结果详情 ===")
  171. for i, video in enumerate(evaluate_result, 1):
  172. logger.info(f"\n视频 {i}:")
  173. logger.info(f" video_id: {video.get('video_id')}")
  174. logger.info(f" title: {video.get('title')}")
  175. logger.info(f" relevance_score: {video.get('relevance_score', 'N/A')}")
  176. logger.info(f" is_selected: {video.get('is_selected', 'N/A')}")
  177. # 验证结果
  178. selected_count = sum(1 for v in evaluate_result if v.get("is_selected", False))
  179. logger.info(f"\n入选视频数量: {selected_count}/{len(evaluate_result)}")
  180. return result
  181. except Exception as e:
  182. logger.error(f"测试评估工作流失败: {e}", exc_info=True)
  183. raise
  184. def verify_database_result(evaluate_id: int):
  185. """验证数据库中的评估结果"""
  186. logger.info("=== 验证数据库结果 ===")
  187. db = next(get_db())
  188. try:
  189. evaluate_record = db.query(EvaluateRecord).filter_by(evaluate_id=evaluate_id).first()
  190. if not evaluate_record:
  191. logger.error(f"未找到 evaluate_id={evaluate_id} 的评估记录")
  192. return
  193. logger.info(f"评估记录状态: {EvaluateStatus.get_description(evaluate_record.status)}")
  194. logger.info(f"评估记录状态值: {evaluate_record.status}")
  195. if evaluate_record.evaluate_result:
  196. try:
  197. result_data = json.loads(evaluate_record.evaluate_result)
  198. logger.info(f"评估结果数量: {len(result_data) if isinstance(result_data, list) else 'N/A'}")
  199. logger.info(f"评估结果已保存到数据库")
  200. except json.JSONDecodeError as e:
  201. logger.error(f"解析评估结果失败: {e}")
  202. else:
  203. logger.warning("评估结果为空")
  204. except Exception as e:
  205. logger.error(f"验证数据库结果失败: {e}", exc_info=True)
  206. finally:
  207. db.close()
  208. def main():
  209. """主函数"""
  210. # 测试参数
  211. task_id = 999999 # 测试用的 task_id
  212. evaluate_id = 888888 # 测试用的 evaluate_id
  213. video_id = "test_video_001"
  214. try:
  215. # 1. 设置测试数据
  216. setup_test_data(task_id, evaluate_id, video_id)
  217. # 2. 执行评估工作流
  218. result = test_evaluate_workflow(task_id, evaluate_id)
  219. # 3. 验证数据库结果
  220. verify_database_result(evaluate_id)
  221. # 4. 总结
  222. logger.info("\n=== 测试总结 ===")
  223. if result.get("workflow_status") == "success":
  224. logger.info("✓ 评估工作流测试成功!")
  225. evaluate_result = result.get("evaluate_result", [])
  226. if evaluate_result:
  227. logger.info(f"✓ 成功评估 {len(evaluate_result)} 个视频")
  228. selected = [v for v in evaluate_result if v.get("is_selected", False)]
  229. logger.info(f"✓ 入选视频 {len(selected)} 个")
  230. else:
  231. logger.error("✗ 评估工作流测试失败")
  232. if result.get("error"):
  233. logger.error(f"错误信息: {result.get('error')}")
  234. except Exception as e:
  235. logger.error(f"测试执行失败: {e}", exc_info=True)
  236. sys.exit(1)
# Run the test flow only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()