|
@@ -17,7 +17,7 @@ from gemini import GeminiProcessor
|
|
|
|
|
|
# Configure logging
|
|
|
logging.basicConfig(level=logging.INFO)
|
|
|
-logger = logging.getLogger(__name__)
|
|
|
+logger = logging.getLogger("CleanTools")
|
|
|
|
|
|
# Configuration constants
|
|
|
BATCH_SIZE = 5 # Batch size used when processing in chunks
|
|
@@ -238,7 +238,8 @@ def batch_call_llm_for_evaluation(contents: list, query_word: str) -> list:
|
|
|
# Process the returned results
|
|
|
evaluation_results = []
|
|
|
for i, result in enumerate(results):
|
|
|
- result = re.sub(r'^\s*```json|\s*```\s*$', '', result, flags=re.MULTILINE).strip()
|
|
|
+ # Only touch the content outside the braces; keep the JSON's internal formatting intact
|
|
|
+ result = re.sub(r'(^\s*```json)|(\s*```\s*$)', '', result, flags=re.MULTILINE).strip()
|
|
|
result = json.loads(result)
|
|
|
parsing_id = contents[i].id
|
|
|
parsing_data = contents[i].parsing_data
|