| 1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312131313141315131613171318131913201321132213231324132513261327132813291330133113321333133413351336133713381339134013411342134313441345134613471348134913501351135213531354135513561357135813591360136113621363136413651366136713681369137013711372137313741375137613771378137913801381138213831384138513861387 |
- #!/usr/bin/env python3
- # -*- coding: utf-8 -*-
- """
- Stage6评估结果可视化工具
- 整合两层评估结果的交互式HTML页面
- """
- import json
- import os
- from datetime import datetime
- from typing import List, Dict, Any
- def load_data(json_path: str) -> List[Dict[str, Any]]:
- """加载JSON数据"""
- with open(json_path, 'r', encoding='utf-8') as f:
- return json.load(f)
- def calculate_statistics(data: List[Dict[str, Any]]) -> Dict[str, Any]:
- """计算统计数据(包括评估结果)"""
- total_features = len(data)
- total_search_words = 0
- total_notes = 0
- video_count = 0
- normal_count = 0
- # 评估统计
- total_evaluated_notes = 0
- total_filtered = 0
- match_complete = 0 # 8-10分
- match_similar = 0 # 6-7分
- match_weak = 0 # 5-6分
- match_none = 0 # ≤4分
- for feature in data:
- grouped_results = feature.get('组合评估结果_分组', [])
- for group in grouped_results:
- search_items = group.get('top10_searches', [])
- total_search_words += len(search_items)
- for search_item in search_items:
- search_result = search_item.get('search_result', {})
- notes = search_result.get('data', {}).get('data', [])
- total_notes += len(notes)
- # 统计视频/图文类型
- for note in notes:
- note_type = note.get('note_card', {}).get('type', '')
- if note_type == 'video':
- video_count += 1
- else:
- normal_count += 1
- # 统计评估结果
- evaluation = search_item.get('evaluation_with_filter')
- if evaluation:
- total_evaluated_notes += evaluation.get('total_notes', 0)
- total_filtered += evaluation.get('filtered_count', 0)
- stats = evaluation.get('statistics', {})
- match_complete += stats.get('完全匹配(8-10)', 0)
- match_similar += stats.get('相似匹配(6-7)', 0)
- match_weak += stats.get('弱相似(5-6)', 0)
- match_none += stats.get('无匹配(≤4)', 0)
- # 计算百分比
- total_remaining = total_evaluated_notes - total_filtered if total_evaluated_notes > 0 else 0
- return {
- 'total_features': total_features,
- 'total_search_words': total_search_words,
- 'total_notes': total_notes,
- 'video_count': video_count,
- 'normal_count': normal_count,
- 'video_percentage': round(video_count / total_notes * 100, 1) if total_notes > 0 else 0,
- 'normal_percentage': round(normal_count / total_notes * 100, 1) if total_notes > 0 else 0,
- # 评估统计
- 'total_evaluated': total_evaluated_notes,
- 'total_filtered': total_filtered,
- 'total_remaining': total_remaining,
- 'filter_rate': round(total_filtered / total_evaluated_notes * 100, 1) if total_evaluated_notes > 0 else 0,
- 'match_complete': match_complete,
- 'match_similar': match_similar,
- 'match_weak': match_weak,
- 'match_none': match_none,
- 'complete_rate': round(match_complete / total_remaining * 100, 1) if total_remaining > 0 else 0,
- 'similar_rate': round(match_similar / total_remaining * 100, 1) if total_remaining > 0 else 0,
- }
- def generate_html(data: List[Dict[str, Any]], stats: Dict[str, Any], output_path: str):
- """生成HTML可视化页面"""
- # 准备数据JSON(用于JavaScript)
- data_json = json.dumps(data, ensure_ascii=False, indent=2)
- html_content = f'''<!DOCTYPE html>
- <html lang="zh-CN">
- <head>
- <meta charset="UTF-8">
- <meta name="viewport" content="width=device-width, initial-scale=1.0">
- <title>Stage6 评估结果可视化</title>
- <style>
- * {{
- margin: 0;
- padding: 0;
- box-sizing: border-box;
- }}
- body {{
- font-family: -apple-system, BlinkMacSystemFont, "Segoe UI", Roboto, "Helvetica Neue", Arial, sans-serif;
- background: #f5f7fa;
- color: #333;
- overflow-x: hidden;
- }}
- /* 顶部统计面板 */
- .stats-panel {{
- background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
- color: white;
- padding: 20px;
- box-shadow: 0 2px 10px rgba(0,0,0,0.1);
- }}
- .stats-container {{
- max-width: 1400px;
- margin: 0 auto;
- }}
- .stats-row {{
- display: flex;
- justify-content: space-around;
- align-items: center;
- flex-wrap: wrap;
- gap: 15px;
- margin-bottom: 15px;
- }}
- .stats-row:last-child {{
- margin-bottom: 0;
- padding-top: 15px;
- border-top: 1px solid rgba(255,255,255,0.2);
- }}
- .stat-item {{
- text-align: center;
- }}
- .stat-value {{
- font-size: 28px;
- font-weight: bold;
- margin-bottom: 5px;
- }}
- .stat-label {{
- font-size: 12px;
- opacity: 0.9;
- }}
- .stat-item.small .stat-value {{
- font-size: 22px;
- }}
- /* 过滤控制面板 */
- .filter-panel {{
- background: white;
- max-width: 1400px;
- margin: 20px auto;
- padding: 15px 20px;
- border-radius: 8px;
- box-shadow: 0 2px 8px rgba(0,0,0,0.1);
- display: flex;
- align-items: center;
- gap: 20px;
- flex-wrap: wrap;
- }}
- .filter-label {{
- font-weight: 600;
- color: #374151;
- }}
- .filter-buttons {{
- display: flex;
- gap: 10px;
- flex-wrap: wrap;
- }}
- .filter-btn {{
- padding: 6px 12px;
- border: 2px solid #e5e7eb;
- background: white;
- border-radius: 6px;
- cursor: pointer;
- font-size: 13px;
- font-weight: 500;
- transition: all 0.2s;
- }}
- .filter-btn:hover {{
- border-color: #667eea;
- background: #f9fafb;
- }}
- .filter-btn.active {{
- border-color: #667eea;
- background: #667eea;
- color: white;
- }}
- .filter-btn.complete {{
- border-color: #10b981;
- }}
- .filter-btn.complete.active {{
- background: #10b981;
- border-color: #10b981;
- }}
- .filter-btn.similar {{
- border-color: #f59e0b;
- }}
- .filter-btn.similar.active {{
- background: #f59e0b;
- border-color: #f59e0b;
- }}
- .filter-btn.weak {{
- border-color: #f97316;
- }}
- .filter-btn.weak.active {{
- background: #f97316;
- border-color: #f97316;
- }}
- .filter-btn.none {{
- border-color: #ef4444;
- }}
- .filter-btn.none.active {{
- background: #ef4444;
- border-color: #ef4444;
- }}
- .filter-btn.filtered {{
- border-color: #6b7280;
- }}
- .filter-btn.filtered.active {{
- background: #6b7280;
- border-color: #6b7280;
- }}
- /* 主容器 */
- .main-container {{
- display: flex;
- max-width: 1400px;
- margin: 0 auto 20px;
- gap: 20px;
- padding: 0 20px;
- height: calc(100vh - 260px);
- }}
- /* 左侧导航 */
- .left-sidebar {{
- width: 30%;
- background: white;
- border-radius: 8px;
- box-shadow: 0 2px 8px rgba(0,0,0,0.1);
- overflow-y: auto;
- position: sticky;
- top: 20px;
- height: fit-content;
- max-height: calc(100vh - 280px);
- }}
- .feature-group {{
- border-bottom: 1px solid #e5e7eb;
- }}
- .feature-header {{
- padding: 15px 20px;
- background: #f9fafb;
- cursor: pointer;
- user-select: none;
- transition: background 0.2s;
- }}
- .feature-header:hover {{
- background: #f3f4f6;
- }}
- .feature-header.active {{
- background: #667eea;
- color: white;
- }}
- .feature-title {{
- font-size: 16px;
- font-weight: 600;
- margin-bottom: 5px;
- }}
- .feature-meta {{
- font-size: 12px;
- color: #6b7280;
- }}
- .feature-header.active .feature-meta {{
- color: rgba(255,255,255,0.8);
- }}
- .search-words-list {{
- display: none;
- padding: 0;
- }}
- .search-words-list.expanded {{
- display: block;
- }}
- /* Base word分组层 */
- .base-word-group {{
- border-bottom: 1px solid #f3f4f6;
- }}
- .base-word-header {{
- padding: 12px 20px 12px 30px;
- background: #fafbfc;
- cursor: pointer;
- user-select: none;
- transition: all 0.2s;
- border-left: 3px solid transparent;
- }}
- .base-word-header:hover {{
- background: #f3f4f6;
- border-left-color: #a78bfa;
- }}
- .base-word-header.active {{
- background: #f3f4f6;
- border-left-color: #7c3aed;
- }}
- .base-word-title {{
- font-size: 15px;
- font-weight: 600;
- color: #7c3aed;
- margin-bottom: 4px;
- }}
- .base-word-meta {{
- font-size: 11px;
- color: #6b7280;
- }}
- .base-word-desc {{
- padding: 8px 20px 8px 30px;
- background: #fefce8;
- font-size: 12px;
- color: #854d0e;
- line-height: 1.5;
- border-left: 3px solid #fbbf24;
- display: none;
- }}
- .base-word-desc.expanded {{
- display: block;
- }}
- .search-words-sublist {{
- display: none;
- }}
- .search-words-sublist.expanded {{
- display: block;
- }}
- .search-word-item {{
- padding: 12px 20px 12px 50px;
- cursor: pointer;
- border-left: 3px solid transparent;
- transition: all 0.2s;
- }}
- .search-word-item:hover {{
- background: #f9fafb;
- border-left-color: #667eea;
- }}
- .search-word-item.active {{
- background: #ede9fe;
- border-left-color: #7c3aed;
- }}
- .search-word-text {{
- font-size: 14px;
- font-weight: 500;
- color: #374151;
- margin-bottom: 4px;
- }}
- .search-word-score {{
- display: inline-block;
- padding: 2px 8px;
- border-radius: 12px;
- font-size: 11px;
- font-weight: 600;
- margin-left: 8px;
- }}
- .score-high {{
- background: #d1fae5;
- color: #065f46;
- }}
- .score-medium {{
- background: #fef3c7;
- color: #92400e;
- }}
- .score-low {{
- background: #fee2e2;
- color: #991b1b;
- }}
- /* 评估徽章 */
- .eval-badge {{
- display: inline-block;
- padding: 2px 6px;
- border-radius: 10px;
- font-size: 11px;
- font-weight: 600;
- margin-left: 6px;
- }}
- .eval-complete {{
- background: #d1fae5;
- color: #065f46;
- border: 1px solid #10b981;
- }}
- .eval-similar {{
- background: #fef3c7;
- color: #92400e;
- border: 1px solid #f59e0b;
- }}
- .eval-weak {{
- background: #fed7aa;
- color: #9a3412;
- border: 1px solid #f97316;
- }}
- .eval-none {{
- background: #fee2e2;
- color: #991b1b;
- border: 1px solid #ef4444;
- }}
- .eval-filtered {{
- background: #e5e7eb;
- color: #4b5563;
- border: 1px solid #6b7280;
- }}
- .search-word-eval {{
- font-size: 11px;
- color: #6b7280;
- margin-top: 4px;
- }}
- /* 右侧结果区 */
- .right-content {{
- flex: 1;
- overflow-y: auto;
- padding-bottom: 40px;
- }}
- .result-block {{
- background: white;
- border-radius: 8px;
- box-shadow: 0 2px 8px rgba(0,0,0,0.1);
- margin-bottom: 30px;
- padding: 20px;
- scroll-margin-top: 20px;
- }}
- .result-header {{
- margin-bottom: 20px;
- padding-bottom: 15px;
- border-bottom: 2px solid #e5e7eb;
- }}
- .result-title {{
- font-size: 20px;
- font-weight: 600;
- color: #111827;
- margin-bottom: 10px;
- }}
- .result-stats {{
- display: flex;
- gap: 10px;
- font-size: 12px;
- color: #6b7280;
- flex-wrap: wrap;
- }}
- .stat-badge {{
- background: #f3f4f6;
- padding: 4px 10px;
- border-radius: 4px;
- }}
- .stat-badge.eval {{
- font-weight: 600;
- }}
- .stat-badge.eval.complete {{
- background: #d1fae5;
- color: #065f46;
- }}
- .stat-badge.eval.similar {{
- background: #fef3c7;
- color: #92400e;
- }}
- .stat-badge.eval.weak {{
- background: #fed7aa;
- color: #9a3412;
- }}
- .stat-badge.eval.none {{
- background: #fee2e2;
- color: #991b1b;
- }}
- .stat-badge.eval.filtered {{
- background: #e5e7eb;
- color: #4b5563;
- }}
- /* 帖子网格 */
- .notes-grid {{
- display: grid;
- grid-template-columns: repeat(auto-fill, minmax(280px, 1fr));
- gap: 20px;
- }}
- .note-card {{
- border: 3px solid #e5e7eb;
- border-radius: 8px;
- overflow: hidden;
- cursor: pointer;
- transition: all 0.3s;
- background: white;
- }}
- .note-card:hover {{
- transform: translateY(-4px);
- box-shadow: 0 10px 25px rgba(0,0,0,0.15);
- }}
- /* 根据评估分数设置边框颜色 */
- .note-card.eval-complete {{
- border-color: #10b981;
- }}
- .note-card.eval-similar {{
- border-color: #f59e0b;
- }}
- .note-card.eval-weak {{
- border-color: #f97316;
- }}
- .note-card.eval-none {{
- border-color: #ef4444;
- }}
- .note-card.eval-filtered {{
- border-color: #6b7280;
- opacity: 0.6;
- }}
- /* 图片轮播 */
- .image-carousel {{
- position: relative;
- width: 100%;
- height: 280px;
- background: #f3f4f6;
- overflow: hidden;
- }}
- .carousel-images {{
- display: flex;
- height: 100%;
- transition: transform 0.3s ease;
- }}
- .carousel-image {{
- min-width: 100%;
- height: 100%;
- object-fit: cover;
- }}
- .carousel-btn {{
- position: absolute;
- top: 50%;
- transform: translateY(-50%);
- background: rgba(0,0,0,0.5);
- color: white;
- border: none;
- width: 32px;
- height: 32px;
- border-radius: 50%;
- cursor: pointer;
- font-size: 16px;
- display: none;
- align-items: center;
- justify-content: center;
- transition: background 0.2s;
- z-index: 10;
- }}
- .carousel-btn:hover {{
- background: rgba(0,0,0,0.7);
- }}
- .carousel-btn.prev {{
- left: 8px;
- }}
- .carousel-btn.next {{
- right: 8px;
- }}
- .note-card:hover .carousel-btn {{
- display: flex;
- }}
- .carousel-indicators {{
- position: absolute;
- bottom: 10px;
- left: 50%;
- transform: translateX(-50%);
- display: flex;
- gap: 6px;
- z-index: 10;
- }}
- .dot {{
- width: 8px;
- height: 8px;
- border-radius: 50%;
- background: rgba(255,255,255,0.5);
- cursor: pointer;
- transition: all 0.2s;
- }}
- .dot.active {{
- background: white;
- width: 24px;
- border-radius: 4px;
- }}
- .image-counter {{
- position: absolute;
- top: 10px;
- right: 10px;
- background: rgba(0,0,0,0.6);
- color: white;
- padding: 4px 8px;
- border-radius: 4px;
- font-size: 12px;
- z-index: 10;
- }}
- /* 帖子信息 */
- .note-info {{
- padding: 12px;
- }}
- .note-title {{
- font-size: 14px;
- font-weight: 500;
- color: #111827;
- margin-bottom: 8px;
- display: -webkit-box;
- -webkit-line-clamp: 2;
- -webkit-box-orient: vertical;
- overflow: hidden;
- line-height: 1.4;
- }}
- .note-meta {{
- display: flex;
- align-items: center;
- justify-content: space-between;
- font-size: 12px;
- color: #6b7280;
- margin-bottom: 8px;
- }}
- .note-type {{
- padding: 3px 8px;
- border-radius: 4px;
- font-weight: 500;
- }}
- .type-video {{
- background: #dbeafe;
- color: #1e40af;
- }}
- .type-normal {{
- background: #d1fae5;
- color: #065f46;
- }}
- .note-author {{
- display: flex;
- align-items: center;
- gap: 6px;
- }}
- .author-avatar {{
- width: 24px;
- height: 24px;
- border-radius: 50%;
- }}
- /* 评估信息 */
- .note-eval {{
- padding: 8px 12px;
- background: #f9fafb;
- border-top: 1px solid #e5e7eb;
- font-size: 12px;
- }}
- .note-eval-header {{
- display: flex;
- align-items: center;
- justify-content: space-between;
- cursor: pointer;
- user-select: none;
- }}
- .note-eval-score {{
- font-weight: 600;
- }}
- .note-eval-toggle {{
- color: #6b7280;
- font-size: 10px;
- }}
- .note-eval-details {{
- margin-top: 8px;
- padding-top: 8px;
- border-top: 1px solid #e5e7eb;
- display: none;
- line-height: 1.5;
- }}
- .note-eval-details.expanded {{
- display: block;
- }}
- .eval-detail-label {{
- font-weight: 600;
- color: #374151;
- margin-top: 6px;
- margin-bottom: 2px;
- }}
- .eval-detail-label:first-child {{
- margin-top: 0;
- }}
- .eval-detail-text {{
- color: #6b7280;
- }}
- /* 滚动条样式 */
- ::-webkit-scrollbar {{
- width: 8px;
- height: 8px;
- }}
- ::-webkit-scrollbar-track {{
- background: #f1f1f1;
- }}
- ::-webkit-scrollbar-thumb {{
- background: #888;
- border-radius: 4px;
- }}
- ::-webkit-scrollbar-thumb:hover {{
- background: #555;
- }}
- /* 隐藏类 */
- .hidden {{
- display: none !important;
- }}
- </style>
- </head>
- <body>
- <!-- 统计面板 -->
- <div class="stats-panel">
- <div class="stats-container">
- <div class="stats-row">
- <div class="stat-item">
- <div class="stat-value">📊 {stats['total_features']}</div>
- <div class="stat-label">原始特征数</div>
- </div>
- <div class="stat-item">
- <div class="stat-value">🔍 {stats['total_search_words']}</div>
- <div class="stat-label">搜索词数</div>
- </div>
- <div class="stat-item">
- <div class="stat-value">📝 {stats['total_notes']}</div>
- <div class="stat-label">帖子总数</div>
- </div>
- <div class="stat-item">
- <div class="stat-value">🎬 {stats['video_count']}</div>
- <div class="stat-label">视频类型 ({stats['video_percentage']}%)</div>
- </div>
- <div class="stat-item">
- <div class="stat-value">📷 {stats['normal_count']}</div>
- <div class="stat-label">图文类型 ({stats['normal_percentage']}%)</div>
- </div>
- </div>
- <div class="stats-row">
- <div class="stat-item small">
- <div class="stat-value">⚡ {stats['total_evaluated']}</div>
- <div class="stat-label">已评估</div>
- </div>
- <div class="stat-item small">
- <div class="stat-value">⚫ {stats['total_filtered']}</div>
- <div class="stat-label">已过滤 ({stats['filter_rate']}%)</div>
- </div>
- <div class="stat-item small">
- <div class="stat-value">🟢 {stats['match_complete']}</div>
- <div class="stat-label">完全匹配 ({stats['complete_rate']}%)</div>
- </div>
- <div class="stat-item small">
- <div class="stat-value">🟡 {stats['match_similar']}</div>
- <div class="stat-label">相似匹配 ({stats['similar_rate']}%)</div>
- </div>
- <div class="stat-item small">
- <div class="stat-value">🟠 {stats['match_weak']}</div>
- <div class="stat-label">弱相似</div>
- </div>
- <div class="stat-item small">
- <div class="stat-value">🔴 {stats['match_none']}</div>
- <div class="stat-label">无匹配</div>
- </div>
- </div>
- </div>
- </div>
- <!-- 过滤控制面板 -->
- <div class="filter-panel">
- <span class="filter-label">🔍 筛选显示:</span>
- <div class="filter-buttons">
- <button class="filter-btn active" onclick="filterNotes('all')">全部</button>
- <button class="filter-btn complete" onclick="filterNotes('complete')">🟢 完全匹配</button>
- <button class="filter-btn similar" onclick="filterNotes('similar')">🟡 相似匹配</button>
- <button class="filter-btn weak" onclick="filterNotes('weak')">🟠 弱相似</button>
- <button class="filter-btn none" onclick="filterNotes('none')">🔴 无匹配</button>
- <button class="filter-btn filtered" onclick="filterNotes('filtered')">⚫ 已过滤</button>
- </div>
- </div>
- <!-- 主容器 -->
- <div class="main-container">
- <!-- 左侧导航 -->
- <div class="left-sidebar" id="leftSidebar">
- <!-- 通过JavaScript动态生成 -->
- </div>
- <!-- 右侧结果区 -->
- <div class="right-content" id="rightContent">
- <!-- 通过JavaScript动态生成 -->
- </div>
- </div>
- <script>
- // 数据
- const data = {data_json};
- let currentFilter = 'all';
- // 创建评估映射(使用索引: "featureIdx-groupIdx-swIdx-noteIdx" -> evaluation)
- const noteEvaluations = {{}};
- data.forEach((feature, fIdx) => {{
- const groups = feature['组合评估结果_分组'] || [];
- groups.forEach((group, gIdx) => {{
- const searches = group['top10_searches'] || [];
- searches.forEach((search, sIdx) => {{
- const evaluation = search['evaluation_with_filter'];
- if (evaluation && evaluation.notes_evaluation) {{
- evaluation.notes_evaluation.forEach(noteEval => {{
- const key = `${{fIdx}}-${{gIdx}}-${{sIdx}}-${{noteEval.note_index}}`;
- noteEvaluations[key] = noteEval;
- }});
- }}
- }});
- }});
- }});
- // 获取评估类别
- function getEvalCategory(noteEval) {{
- if (!noteEval || noteEval['Query相关性'] !== '相关') {{
- return 'filtered';
- }}
- const score = noteEval['综合得分'];
- if (score >= 8) return 'complete';
- if (score >= 6) return 'similar';
- if (score >= 5) return 'weak';
- return 'none';
- }}
- // 渲染左侧导航
- function renderLeftSidebar() {{
- const sidebar = document.getElementById('leftSidebar');
- let html = '';
- data.forEach((feature, featureIdx) => {{
- const groups = feature['组合评估结果_分组'] || [];
- let totalSearches = 0;
- groups.forEach(group => {{
- totalSearches += (group['top10_searches'] || []).length;
- }});
- // 层级1: 原始特征
- html += `
- <div class="feature-group">
- <div class="feature-header" onclick="toggleFeature(${{featureIdx}})" id="feature-header-${{featureIdx}}">
- <div class="feature-title">${{feature['原始特征名称']}}</div>
- <div class="feature-meta">
- ${{feature['来源层级']}} · 权重: ${{feature['权重'].toFixed(2)}} · ${{totalSearches}}个搜索词
- </div>
- </div>
- <div class="search-words-list" id="search-words-${{featureIdx}}">
- `;
- // 层级2: Base word分组
- groups.forEach((group, groupIdx) => {{
- const baseWord = group['base_word'] || '';
- const baseSimilarity = group['base_word_similarity'] || 0;
- const searches = group['top10_searches'] || [];
- // 获取相关词汇
- const relatedWords = feature['高相似度候选_按base_word']?.[baseWord] || [];
- const relatedWordNames = relatedWords.map(w => w['人设特征名称']).slice(0, 10).join('、');
- html += `
- <div class="base-word-group">
- <div class="base-word-header" onclick="toggleBaseWord(${{featureIdx}}, ${{groupIdx}})"
- id="base-word-header-${{featureIdx}}-${{groupIdx}}">
- <div class="base-word-title">🎯 ${{baseWord}}</div>
- <div class="base-word-meta">相似度: ${{baseSimilarity.toFixed(2)}} · ${{searches.length}}个搜索词</div>
- </div>
- <div class="base-word-desc" id="base-word-desc-${{featureIdx}}-${{groupIdx}}">
- ${{relatedWordNames || '无相关词汇'}}
- </div>
- <div class="search-words-sublist" id="search-words-sublist-${{featureIdx}}-${{groupIdx}}">
- `;
- // 层级3: 搜索词列表
- searches.forEach((sw, swIdx) => {{
- const score = sw.score || 0;
- const scoreClass = score >= 0.9 ? 'score-high' : score >= 0.7 ? 'score-medium' : 'score-low';
- const blockId = `block-${{featureIdx}}-${{groupIdx}}-${{swIdx}}`;
- const sourceWord = sw.source_word || '';
- // 获取评估统计
- const evaluation = sw['evaluation_with_filter'];
- let evalBadges = '';
- if (evaluation) {{
- const stats = evaluation.statistics || {{}};
- const complete = stats['完全匹配(8-10)'] || 0;
- const similar = stats['相似匹配(6-7)'] || 0;
- const weak = stats['弱相似(5-6)'] || 0;
- const none = stats['无匹配(≤4)'] || 0;
- const filtered = evaluation.filtered_count || 0;
- if (complete > 0) evalBadges += `<span class="eval-badge eval-complete">🟢${{complete}}</span>`;
- if (similar > 0) evalBadges += `<span class="eval-badge eval-similar">🟡${{similar}}</span>`;
- if (weak > 0) evalBadges += `<span class="eval-badge eval-weak">🟠${{weak}}</span>`;
- if (none > 0) evalBadges += `<span class="eval-badge eval-none">🔴${{none}}</span>`;
- if (filtered > 0) evalBadges += `<span class="eval-badge eval-filtered">⚫${{filtered}}</span>`;
- }}
- html += `
- <div class="search-word-item" onclick="scrollToBlock('${{blockId}}')"
- id="sw-${{featureIdx}}-${{groupIdx}}-${{swIdx}}"
- data-block-id="${{blockId}}">
- <div class="search-word-text">
- 🔍 ${{sw.search_word}}
- <span class="search-word-score ${{scoreClass}}">${{score.toFixed(2)}}</span>
- </div>
- <div class="search-word-meta" style="font-size:11px;color:#9ca3af;margin-top:2px">
- 来源: ${{sourceWord}}
- </div>
- <div class="search-word-eval">${{evalBadges}}</div>
- </div>
- `;
- }});
- html += `
- </div>
- </div>
- `;
- }});
- html += `
- </div>
- </div>
- `;
- }});
- sidebar.innerHTML = html;
- }}
- // 渲染右侧结果区
- function renderRightContent() {{
- const content = document.getElementById('rightContent');
- let html = '';
- data.forEach((feature, featureIdx) => {{
- const groups = feature['组合评估结果_分组'] || [];
- groups.forEach((group, groupIdx) => {{
- const searches = group['top10_searches'] || [];
- searches.forEach((sw, swIdx) => {{
- const blockId = `block-${{featureIdx}}-${{groupIdx}}-${{swIdx}}`;
- const searchResult = sw.search_result || {{}};
- const notes = searchResult.data?.data || [];
- const videoCount = notes.filter(n => n.note_card?.type === 'video').length;
- const normalCount = notes.length - videoCount;
- // 获取评估统计
- const evaluation = sw['evaluation_with_filter'];
- let evalStats = '';
- if (evaluation) {{
- const stats = evaluation.statistics || {{}};
- const complete = stats['完全匹配(8-10)'] || 0;
- const similar = stats['相似匹配(6-7)'] || 0;
- const weak = stats['弱相似(5-6)'] || 0;
- const none = stats['无匹配(≤4)'] || 0;
- const filtered = evaluation.filtered_count || 0;
- if (complete > 0) evalStats += `<span class="stat-badge eval complete">🟢 完全:${{complete}}</span>`;
- if (similar > 0) evalStats += `<span class="stat-badge eval similar">🟡 相似:${{similar}}</span>`;
- if (weak > 0) evalStats += `<span class="stat-badge eval weak">🟠 弱:${{weak}}</span>`;
- if (none > 0) evalStats += `<span class="stat-badge eval none">🔴 无:${{none}}</span>`;
- if (filtered > 0) evalStats += `<span class="stat-badge eval filtered">⚫ 过滤:${{filtered}}</span>`;
- }}
- html += `
- <div class="result-block" id="${{blockId}}">
- <div class="result-header">
- <div class="result-title">${{sw.search_word}}</div>
- <div class="result-stats">
- <span class="stat-badge">📝 ${{notes.length}} 条帖子</span>
- <span class="stat-badge">🎬 ${{videoCount}} 视频</span>
- <span class="stat-badge">📷 ${{normalCount}} 图文</span>
- ${{evalStats}}
- </div>
- </div>
- <div class="notes-grid">
- ${{notes.map((note, noteIdx) => renderNoteCard(note, featureIdx, groupIdx, swIdx, noteIdx)).join('')}}
- </div>
- </div>
- `;
- }});
- }});
- }});
- content.innerHTML = html;
- }}
- // 渲染单个帖子卡片
- function renderNoteCard(note, featureIdx, groupIdx, swIdx, noteIdx) {{
- const card = note.note_card || {{}};
- const images = card.image_list || [];
- const title = card.display_title || '无标题';
- const noteType = card.type || 'normal';
- const noteId = note.id || '';
- const user = card.user || {{}};
- const userName = user.nick_name || '未知用户';
- const userAvatar = user.avatar || '';
- const carouselId = `carousel-${{featureIdx}}-${{groupIdx}}-${{swIdx}}-${{noteIdx}}`;
- // 获取评估结果(使用索引key)
- const evalKey = `${{featureIdx}}-${{groupIdx}}-${{swIdx}}-${{noteIdx}}`;
- const noteEval = noteEvaluations[evalKey];
- const evalCategory = getEvalCategory(noteEval);
- const evalClass = `eval-${{evalCategory}}`;
- let evalSection = '';
- if (noteEval) {{
- const score = noteEval['综合得分'];
- const scoreEmoji = score >= 8 ? '🟢' : score >= 6 ? '🟡' : score >= 5 ? '🟠' : '🔴';
- const scoreText = score >= 8 ? '完全匹配' : score >= 6 ? '相似匹配' : score >= 5 ? '弱相似' : '无匹配';
- const reasoning = noteEval['评分说明'] || '无';
- const matchingPoints = (noteEval['关键匹配点'] || []).join('、') || '无';
- evalSection = `
- <div class="note-eval">
- <div class="note-eval-header" onclick="event.stopPropagation(); toggleEvalDetails('${{carouselId}}')">
- <span class="note-eval-score">${{scoreEmoji}} ${{scoreText}} (${{score}}分)</span>
- <span class="note-eval-toggle" id="${{carouselId}}-toggle">▼ 详情</span>
- </div>
- <div class="note-eval-details" id="${{carouselId}}-details">
- <div class="eval-detail-label">评估理由:</div>
- <div class="eval-detail-text">${{reasoning}}</div>
- <div class="eval-detail-label">匹配要点:</div>
- <div class="eval-detail-text">${{matchingPoints}}</div>
- </div>
- </div>
- `;
- }} else if (evalCategory === 'filtered') {{
- evalSection = `
- <div class="note-eval">
- <div class="note-eval-score">⚫ 已过滤(与搜索无关)</div>
- </div>
- `;
- }}
- return `
- <div class="note-card ${{evalClass}}" data-eval-category="${{evalCategory}}" onclick="openNote('${{noteId}}')">
- <div class="image-carousel" id="${{carouselId}}">
- <div class="carousel-images">
- ${{images.map(img => `<img class="carousel-image" src="${{img}}" alt="帖子图片" loading="lazy">`).join('')}}
- </div>
- ${{images.length > 1 ? `
- <button class="carousel-btn prev" onclick="event.stopPropagation(); changeImage('${{carouselId}}', -1)">←</button>
- <button class="carousel-btn next" onclick="event.stopPropagation(); changeImage('${{carouselId}}', 1)">→</button>
- <div class="carousel-indicators">
- ${{images.map((_, i) => `<span class="dot ${{i === 0 ? 'active' : ''}}" onclick="event.stopPropagation(); goToImage('${{carouselId}}', ${{i}})"></span>`).join('')}}
- </div>
- <span class="image-counter">1/${{images.length}}</span>
- ` : ''}}
- </div>
- <div class="note-info">
- <div class="note-title">${{title}}</div>
- <div class="note-meta">
- <span class="note-type type-${{noteType}}">
- ${{noteType === 'video' ? '🎬 视频' : '📷 图文'}}
- </span>
- <div class="note-author">
- ${{userAvatar ? `<img class="author-avatar" src="${{userAvatar}}" alt="${{userName}}">` : ''}}
- <span>${{userName}}</span>
- </div>
- </div>
- </div>
- ${{evalSection}}
- </div>
- `;
- }}
- // 图片轮播逻辑
- const carouselStates = {{}};
- function changeImage(carouselId, direction) {{
- if (!carouselStates[carouselId]) {{
- carouselStates[carouselId] = {{ currentIndex: 0 }};
- }}
- const carousel = document.getElementById(carouselId);
- const imagesContainer = carousel.querySelector('.carousel-images');
- const images = carousel.querySelectorAll('.carousel-image');
- const dots = carousel.querySelectorAll('.dot');
- const counter = carousel.querySelector('.image-counter');
- let newIndex = carouselStates[carouselId].currentIndex + direction;
- if (newIndex < 0) newIndex = images.length - 1;
- if (newIndex >= images.length) newIndex = 0;
- carouselStates[carouselId].currentIndex = newIndex;
- imagesContainer.style.transform = `translateX(-${{newIndex * 100}}%)`;
- // 更新指示器
- dots.forEach((dot, i) => {{
- dot.classList.toggle('active', i === newIndex);
- }});
- // 更新计数器
- if (counter) {{
- counter.textContent = `${{newIndex + 1}}/${{images.length}}`;
- }}
- }}
- function goToImage(carouselId, index) {{
- if (!carouselStates[carouselId]) {{
- carouselStates[carouselId] = {{ currentIndex: 0 }};
- }}
- const carousel = document.getElementById(carouselId);
- const imagesContainer = carousel.querySelector('.carousel-images');
- const dots = carousel.querySelectorAll('.dot');
- const counter = carousel.querySelector('.image-counter');
- carouselStates[carouselId].currentIndex = index;
- imagesContainer.style.transform = `translateX(-${{index * 100}}%)`;
- // 更新指示器
- dots.forEach((dot, i) => {{
- dot.classList.toggle('active', i === index);
- }});
- // 更新计数器
- if (counter) {{
- counter.textContent = `${{index + 1}}/${{dots.length}}`;
- }}
- }}
- // 展开/折叠特征组
- function toggleFeature(featureIdx) {{
- const searchWordsList = document.getElementById(`search-words-${{featureIdx}}`);
- const featureHeader = document.getElementById(`feature-header-${{featureIdx}}`);
- searchWordsList.classList.toggle('expanded');
- featureHeader.classList.toggle('active');
- }}
- // 展开/折叠base word分组
- function toggleBaseWord(featureIdx, groupIdx) {{
- const baseWordHeader = document.getElementById(`base-word-header-${{featureIdx}}-${{groupIdx}}`);
- const baseWordDesc = document.getElementById(`base-word-desc-${{featureIdx}}-${{groupIdx}}`);
- const searchWordsSublist = document.getElementById(`search-words-sublist-${{featureIdx}}-${{groupIdx}}`);
- baseWordHeader.classList.toggle('active');
- baseWordDesc.classList.toggle('expanded');
- searchWordsSublist.classList.toggle('expanded');
- }}
- // 滚动到指定结果块
- function scrollToBlock(blockId) {{
- const block = document.getElementById(blockId);
- if (block) {{
- block.scrollIntoView({{ behavior: 'smooth', block: 'start' }});
- // 高亮对应的搜索词
- document.querySelectorAll('.search-word-item').forEach(item => {{
- item.classList.remove('active');
- }});
- document.querySelectorAll(`[data-block-id="${{blockId}}"]`).forEach(item => {{
- item.classList.add('active');
- }});
- }}
- }}
- // 切换评估详情
- function toggleEvalDetails(carouselId) {{
- const details = document.getElementById(`${{carouselId}}-details`);
- const toggle = document.getElementById(`${{carouselId}}-toggle`);
- if (details && toggle) {{
- details.classList.toggle('expanded');
- toggle.textContent = details.classList.contains('expanded') ? '▲ 收起' : '▼ 详情';
- }}
- }}
- // 过滤帖子
- function filterNotes(category) {{
- currentFilter = category;
- // 更新按钮状态
- document.querySelectorAll('.filter-btn').forEach(btn => {{
- btn.classList.remove('active');
- }});
- event.target.classList.add('active');
- // 过滤帖子卡片
- document.querySelectorAll('.note-card').forEach(card => {{
- const evalCategory = card.getAttribute('data-eval-category');
- if (category === 'all' || evalCategory === category) {{
- card.classList.remove('hidden');
- }} else {{
- card.classList.add('hidden');
- }}
- }});
- // 隐藏空的结果块
- document.querySelectorAll('.result-block').forEach(block => {{
- const visibleCards = block.querySelectorAll('.note-card:not(.hidden)');
- if (visibleCards.length === 0) {{
- block.classList.add('hidden');
- }} else {{
- block.classList.remove('hidden');
- }}
- }});
- }}
- // 打开小红书帖子
- function openNote(noteId) {{
- if (noteId) {{
- window.open(`https://www.xiaohongshu.com/explore/${{noteId}}`, '_blank');
- }}
- }}
- // 初始化
- document.addEventListener('DOMContentLoaded', () => {{
- renderLeftSidebar();
- renderRightContent();
- // 默认展开第一个特征组和第一个base_word
- if (data.length > 0) {{
- toggleFeature(0);
- // 展开第一个base_word分组
- const firstGroups = data[0]['组合评估结果_分组'];
- if (firstGroups && firstGroups.length > 0) {{
- toggleBaseWord(0, 0);
- }}
- }}
- }});
- </script>
- </body>
- </html>
- '''
- # 写入文件
- with open(output_path, 'w', encoding='utf-8') as f:
- f.write(html_content)
- def main():
- """主函数"""
- # 配置路径
- script_dir = os.path.dirname(os.path.abspath(__file__))
- json_path = os.path.join(script_dir, 'output_v2', 'stage6_with_evaluations.json')
- output_dir = os.path.join(script_dir, 'visualization')
- os.makedirs(output_dir, exist_ok=True)
- timestamp = datetime.now().strftime('%Y%m%d_%H%M%S')
- output_path = os.path.join(output_dir, f'stage6_interactive_{timestamp}.html')
- # 加载数据
- print(f"📖 加载数据: {json_path}")
- data = load_data(json_path)
- print(f"✓ 加载了 {len(data)} 个原始特征")
- # 计算统计
- print("📊 计算统计数据...")
- stats = calculate_statistics(data)
- print(f"✓ 统计完成:")
- print(f" - 原始特征: {stats['total_features']}")
- print(f" - 搜索词: {stats['total_search_words']}")
- print(f" - 帖子总数: {stats['total_notes']}")
- print(f" - 视频: {stats['video_count']} ({stats['video_percentage']}%)")
- print(f" - 图文: {stats['normal_count']} ({stats['normal_percentage']}%)")
- print(f"\n 评估结果:")
- print(f" - 已评估: {stats['total_evaluated']}")
- print(f" - 已过滤: {stats['total_filtered']} ({stats['filter_rate']}%)")
- print(f" - 完全匹配: {stats['match_complete']} ({stats['complete_rate']}%)")
- print(f" - 相似匹配: {stats['match_similar']} ({stats['similar_rate']}%)")
- print(f" - 弱相似: {stats['match_weak']}")
- print(f" - 无匹配: {stats['match_none']}")
- # 生成HTML
- print(f"\n🎨 生成可视化页面...")
- generate_html(data, stats, output_path)
- print(f"✓ 生成完成: {output_path}")
- # 打印访问提示
- print(f"\n🌐 在浏览器中打开查看:")
- print(f" file://{output_path}")
- return output_path
- if __name__ == '__main__':
- main()
|