run_graph_pipeline.sh 3.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141
  1. #!/bin/bash
  2. # 图谱构建与可视化流程(步骤5-9)
  3. #
  4. # 依赖前置步骤(1-4)已执行完成:
  5. # 1. extract_feature_categories.py
  6. # 2. extract_features_from_posts.py
  7. # 3. extract_current_posts.py
  8. # 4. match_inspiration_features.py
  9. #
  10. # 本脚本执行:
  11. # 1. filter_how_results.py - 过滤how解构结果
  12. # 2. build_persona_graph.py - 构建人设图谱
  13. # 3. build_post_graph.py - 构建帖子图谱
  14. # 4. visualization/build.py - 生成人设图谱可视化HTML
  15. #
  16. # 使用方式:
  17. # ./run_graph_pipeline.sh # 使用默认账号
  18. # ./run_graph_pipeline.sh 阿里多多酱 # 指定账号
  19. # ACCOUNT_NAME=xxx ./run_graph_pipeline.sh
  # Stop at the first command that exits with a non-zero status.
  set -o errexit

  # Absolute path of the directory that holds this script.
  SCRIPT_DIR=$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)

  # The project root sits two levels above the script directory. Move there
  # first and record the resulting absolute path, so that the relative paths
  # used by the rest of the script are resolved from the project root.
  cd "$SCRIPT_DIR/../.."
  PROJECT_ROOT=$(pwd)

  # ANSI colour sequences, stored with literal backslashes; they only become
  # escape characters when printed by something that interprets "\033".
  NC='\033[0m'
  RED='\033[0;31m'
  GREEN='\033[0;32m'
  YELLOW='\033[1;33m'
  BLUE='\033[0;34m'
  # Logging helpers. Each prints a single line made of a coloured tag followed
  # by the message. Only the colour variables (BLUE, GREEN, RED, YELLOW, NC)
  # go through %b, which expands their "\033" sequences; the message itself is
  # printed with %s so backslashes in caller-supplied text stay literal.
  #
  #   print_info MSG      -> "[INFO] MSG" on stdout
  #   print_success MSG   -> "[SUCCESS] MSG" on stdout
  #   print_error MSG     -> "[ERROR] MSG" on stderr (diagnostics stay out of
  #                          anything that captures stdout)
  #   print_step TAG MSG  -> "[TAG] MSG" on stdout
  print_info() { printf '%b[INFO]%b %s\n' "$BLUE" "$NC" "$1"; }
  print_success() { printf '%b[SUCCESS]%b %s\n' "$GREEN" "$NC" "$1"; }
  print_error() { printf '%b[ERROR]%b %s\n' "$RED" "$NC" "$1" >&2; }
  print_step() { printf '%b[%s]%b %s\n' "$YELLOW" "$1" "$NC" "$2"; }
  #######################################
  # Run a single pipeline stage and report whether it succeeded.
  # Arguments:
  #   $1 - step number shown in the progress label
  #   $2 - human-readable step name used in the progress and result messages
  #   $3 - file name of the Python script to run
  #   $4 - (optional) total number of steps shown in the label; defaults to 4
  #   $5 - (optional) directory containing the script, relative to the current
  #        working directory; defaults to script/data_processing
  # Outputs:
  #   Progress and result messages via print_step / print_success /
  #   print_error, plus whatever the Python script itself prints.
  # Returns:
  #   0 when the script exits successfully, 1 otherwise.
  #######################################
  run_step() {
    local step_num=$1
    local step_name=$2
    local script_name=$3
    local total_steps=${4:-4}
    local script_dir=${5:-script/data_processing}

    print_step "$step_num/$total_steps" "$step_name"

    if python "$script_dir/$script_name"; then
      print_success "$step_name 完成"
      echo ""
      return 0
    fi

    print_error "$step_name 失败"
    return 1
  }
  #######################################
  # Run the whole graph build and visualisation pipeline for one account.
  # Globals:
  #   PROJECT_ROOT (read, shown in the banner)
  #   ACCOUNT_NAME (exported with the given account before any stage runs)
  # Arguments:
  #   $1 - account name
  # Returns:
  #   1 as soon as any stage fails; stages after the failing one are skipped.
  #######################################
  process_account() {
    local account_name=$1
    local rule="=========================================="

    printf '%s\n' \
      "" \
      "$rule" \
      "图谱构建与可视化流程" \
      "账号: $account_name" \
      "项目: $PROJECT_ROOT" \
      "$rule" \
      ""

    # The stage scripts are started as child processes, so the account has to
    # be exported rather than just assigned.
    export ACCOUNT_NAME="$account_name"

    # Stages 1-3 all go through run_step, in this order. The legacy stages
    # (extract_nodes_and_edges.py, build_match_graph.py,
    # visualize_match_graph.py) are no longer needed and are not run.
    local -a stage_titles=(
      "过滤how解构结果"
      "构建人设图谱"
      "构建帖子图谱"
    )
    local -a stage_scripts=(
      "filter_how_results.py"
      "build_persona_graph.py"
      "build_post_graph.py"
    )
    local idx
    for idx in "${!stage_scripts[@]}"; do
      run_step "$((idx + 1))" "${stage_titles[idx]}" "${stage_scripts[idx]}" || return 1
    done

    # Stage 4 is launched directly because its script is under
    # script/visualization, not in the directory run_step uses.
    print_step "4/4" "生成人设图谱可视化"
    if ! python "script/visualization/build.py"; then
      print_error "生成人设图谱可视化 失败"
      return 1
    fi
    print_success "生成人设图谱可视化 完成"
    echo ""

    echo "$rule"
    print_success "图谱构建与可视化流程完成!"
    echo "$rule"
  }
  #######################################
  # Print the default account name stored in config/accounts.json.
  # The path is relative to the current working directory.
  # Outputs:
  #   stdout - the value of the "default_account" key, or an empty line when
  #            the key is absent, null or empty, the top-level JSON value is
  #            not an object, or the file cannot be read or parsed
  #   stderr - a one-line warning when the file cannot be read or parsed
  # Returns:
  #   0 in all of the cases above, so that a caller running under `set -e`
  #   can test for an empty result instead of being aborted by a traceback.
  #######################################
  get_default_account() {
    # The Python source is single-quoted for the shell and must start at
    # column 0, otherwise Python rejects it with an indentation error.
    python -c '
import json
import sys

try:
    # Read as UTF-8 explicitly: account names may be non-ASCII and the
    # locale default encoding is not guaranteed to handle them.
    with open("config/accounts.json", encoding="utf-8") as fh:
        config = json.load(fh)
except (OSError, ValueError) as exc:
    # ValueError covers both malformed JSON and undecodable bytes.
    print("warning: cannot read config/accounts.json: %s" % exc, file=sys.stderr)
    config = {}

account = config.get("default_account") if isinstance(config, dict) else None
# A JSON null must become an empty result, not the literal text "None".
print(account or "")
'
  }
  #######################################
  # Entry point: choose the account to process, then run the pipeline for it.
  # The account is taken from the first source that yields a non-empty value:
  #   1. the first command-line argument
  #   2. the ACCOUNT_NAME environment variable
  #   3. the default returned by get_default_account
  # Arguments:
  #   $1 - (optional) account name
  # Outputs:
  #   When no account can be determined: an error via print_error and a usage
  #   line on stderr.
  # Returns:
  #   The status of process_account; exits the script with status 1 when no
  #   account can be determined.
  #######################################
  main() {
    # ${...:-} keeps both lookups safe if the script is ever run with nounset.
    local account_name="${1:-}"

    if [[ -z "$account_name" ]]; then
      account_name="${ACCOUNT_NAME:-}"
    fi

    if [[ -z "$account_name" ]]; then
      # Under `set -e` a failing command substitution would abort the script
      # right here; treat a failed lookup as "no default" so the message
      # below is shown instead.
      account_name=$(get_default_account) || account_name=""
      if [[ -z "$account_name" ]]; then
        print_error "未指定账号,请通过参数或环境变量指定"
        echo "用法: $0 <账号名>" >&2
        exit 1
      fi
      print_info "使用默认账号: $account_name"
    fi

    process_account "$account_name"
  }
  117. main "$@"