# 读取 文件/视频分析报告.xlsx文件,逐行将第5列数据的JSON字符串读取出来,提取segments字段并处理 import pandas as pd import json import logging import re # Set up logging logging.basicConfig(level=logging.INFO) logger = logging.getLogger(__name__) def clean_json_string(json_str): """清理和格式化JSON字符串""" # 移除BOM和空白字符 json_str = json_str.strip().lstrip('\ufeff') # 处理Python风格的字符串(单引号转双引号) json_str = re.sub(r'(?