il y a 2 mois · 858ffecc37
--- a/post_evaluator_v4_langgraph.py
+++ b/post_evaluator_v4_langgraph.py
@@ -24,7 +24,8 @@ from PIL import Image
 
				 from langchain_google_genai import ChatGoogleGenerativeAI
			
 
				 from langchain_core.messages import HumanMessage, SystemMessage
			
 
				 from langgraph.graph import StateGraph, END
			
 
				-# import google.generativeai as genai  # 暂时禁用,版本冲突
			
 
				+# 视频上传相关
			
 
				+import mimetypes
			
 
				 
			
 
				 # ============================================================================
			
 
				 # 常量配置
			
@@ -42,6 +43,10 @@ MAX_RETRIES = 2
 
				 RETRY_WAIT_SECONDS = 3
			
 
				 FILE_PROCESS_TIMEOUT = 180
			
 
				 
			
 
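				+# Proxy configuration (used to reach the Google File API). NOTE(review): HTTPS_PROXY below uses an https:// scheme, i.e. TLS to the proxy itself; a local proxy on 127.0.0.1 usually expects http:// for both variables - confirm.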
			
 
				+HTTP_PROXY = "http://127.0.0.1:29758"
			
 
				+HTTPS_PROXY = "https://127.0.0.1:29758"
			
 
				+
			
 
				 # 缓存配置
			
 
				 ENABLE_CACHE = False
			
 
				 CACHE_DIR = ".evaluation_cache"
			
@@ -1178,11 +1183,16 @@ class GeminiClient:
 
				         if media_files:
			
 
				             print(f"      🔍 传递给Gemini: {len(media_files)}个媒体文件")
			
 
				             for i, media in enumerate(media_files[:3]):
			
 
				-                if isinstance(media, dict) and media.get("type") == "image_url":
			
 
				-                    data_url = media.get("image_url", {}).get("url", "")
			
 
				-                    print(f"         📸 图片[{i}]: Base64 data URL ({len(data_url)}字符)")
			
 
				+                if isinstance(media, dict):
			
 
				+                    if media.get("type") == "image_url":
			
 
				+                        data_url = media.get("image_url", {}).get("url", "")
			
 
				+                        print(f"         📸 图片[{i}]: Base64 data URL ({len(data_url)}字符)")
			
 
				+                    elif media.get("type") == "media":
			
 
				+                        file_uri = media.get("file_uri", "")
			
 
				+                        mime_type = media.get("mime_type", "")
			
 
				+                        print(f"         🎥 视频[{i}]: file_uri ({mime_type})")
			
 
				                 else:
			
 
				-                    print(f"         🎥 视频[{i}]: {type(media).__name__}")
			
 
				+                    print(f"         ⚠️  媒体[{i}]: 未知类型 {type(media).__name__}")
			
 
				         else:
			
 
				             print(f"      ⚠️  无媒体文件传递给Gemini（仅文本）")
			
 
				 
			
@@ -1236,18 +1246,19 @@ class GeminiClient:
 
				 # ============================================================================
			
 
				 
			
 
				 class VideoUploader:
			
 
				-    """视频上传处理器"""
			
 
				+    """视频上传处理器 - 使用 google.generativeai"""
			
 
				 
			
 
				     @staticmethod
			
 
				-    async def upload_video(video_url: str) -> tuple[Optional[Any], Optional[str], Optional[str]]:
			
 
				+    async def upload_video(video_url: str) -> tuple[Optional[Dict], Optional[str], Optional[str]]:
			
 
				         """
			
 
				-        上传视频到Gemini
			
 
				+        上传视频到Google服务器并获取file_uri
			
 
				 
			
 
				         Args:
			
 
				             video_url: 视频URL
			
 
				 
			
 
				         Returns:
			
 
				-            (video_file, video_uri, temp_path)
			
 
				+            (media_dict, file_uri, temp_path)
			
 
				+            media_dict格式: {"type": "media", "file_uri": ..., "mime_type": ...}
			
 
				         """
			
 
				         import requests
			
 
				 
			
@@ -1256,7 +1267,7 @@ class VideoUploader:
 
				         os.close(temp_fd)
			
 
				 
			
 
				         try:
			
 
				-            print(f"      📥 下载视频: {video_url[:60]}...")
			
 
				+            print(f"      📥 下载视频: {video_url[:100]}...")
			
 
				 
			
 
				             # 下载
			
 
				             loop = asyncio.get_event_loop()
			
@@ -1274,54 +1285,86 @@ class VideoUploader:
 
				             file_size_mb = os.path.getsize(temp_path) / (1024 * 1024)
			
 
				             print(f"      📦 视频下载完成,大小: {file_size_mb:.2f}MB")
			
 
				 
			
 
				-            # 上传到Gemini
			
 
				-            print(f"      ☁️  上传到Gemini...")
			
 
				-            # 暂时禁用视频上传功能(genai版本冲突)
			
 
				-            raise NotImplementedError("视频上传暂时禁用,等待修复版本冲突")
			
 
				-            # uploaded_file = await loop.run_in_executor(
			
 
				-            #     None,
			
 
				-            #     lambda: genai.upload_file(temp_path)
			
 
				-            # )
			
 
				+            # 上传到Google File API
			
 
				+            print(f"      ☁️  上传到Google File API...")
			
 
				+
			
 
				+            # 动态导入 google.generativeai（避免模块级别冲突）
			
 
				+            import google.generativeai as genai
			
 
				+
			
 
				+            # 配置代理环境变量（让底层 HTTP 库使用代理）
			
 
				+            # 设置大写和小写版本，确保 httplib2 能正确识别
			
 
				+            os.environ['HTTP_PROXY'] = HTTP_PROXY
			
 
				+            os.environ['HTTPS_PROXY'] = HTTPS_PROXY
			
 
				+            os.environ['http_proxy'] = HTTP_PROXY
			
 
				+            os.environ['https_proxy'] = HTTPS_PROXY
			
 
				+            print(f"      🔧 使用代理: {HTTPS_PROXY}")
			
 
				+
			
 
				+            # 配置 API key
			
 
				+            genai.configure(api_key=GEMINI_API_KEY)
			
 
				+
			
 
				+            # 上传文件
			
 
				+            uploaded_file = await loop.run_in_executor(
			
 
				+                None,
			
 
				+                lambda: genai.upload_file(temp_path)
			
 
				+            )
			
 
				+
			
 
				+            print(f"      📤 文件已上传: {uploaded_file.name}")
			
 
				 
			
 
				             # 等待处理
			
 
				-            processed_file = await VideoUploader._wait_for_processing(uploaded_file)
			
 
				+            processed_file = await VideoUploader._wait_for_processing(uploaded_file.name)
			
 
				             if not processed_file:
			
 
				                 return None, None, temp_path
			
 
				 
			
 
				             print(f"      ✅ 视频上传成功: {processed_file.uri}")
			
 
				-            return processed_file, processed_file.uri, temp_path
			
 
				+
			
 
				+            # 检测MIME类型
			
 
				+            mime_type = mimetypes.guess_type(temp_path)[0] or "video/mp4"
			
 
				+
			
 
				+            # 返回media字典格式
			
 
				+            media_dict = {
			
 
				+                "type": "media",
			
 
				+                "file_uri": processed_file.uri,
			
 
				+                "mime_type": mime_type
			
 
				+            }
			
 
				+
			
 
				+            return media_dict, processed_file.uri, temp_path
			
 
				 
			
 
				         except Exception as e:
			
 
				             print(f"      ❌ 视频上传失败: {str(e)[:100]}")
			
 
				             return None, None, temp_path
			
 
				 
			
 
				     @staticmethod
			
 
				-    async def _wait_for_processing(uploaded_file: Any) -> Optional[Any]:
			
 
				-        """等待Gemini处理视频文件"""
			
 
				+    async def _wait_for_processing(file_name: str) -> Optional[Any]:
			
 
				+        """Poll genai.get_file(file_name) until the file is ACTIVE; return it, or None on timeout or any non-PROCESSING state."""
			
 
				+        # Import google.generativeai lazily, inside the function, instead of at module level
			
 
				+        import google.generativeai as genai
			
 
				+
			
 
				         start_time = time.time()
			
 
				-        current_file = uploaded_file
			
 
				 
			
 
				         loop = asyncio.get_event_loop()
			
 
				 
			
 
				-        while current_file.state.name == "PROCESSING":
			
 
				+        while True:
			
 
				             elapsed = time.time() - start_time
			
 
				             if elapsed > FILE_PROCESS_TIMEOUT:
			
 
				-                print(f"      ❌ 视频处理超时: {current_file.name}")
			
 
				+                print(f"      ❌ 视频处理超时")
			
 
				                 return None
			
 
				 
			
 
				-            print(f"      ⏳ 等待Gemini处理视频...{elapsed:.0f}s")
			
 
				-            await asyncio.sleep(RETRY_WAIT_SECONDS)
			
 
				-
			
 
				+            # Fetch the file's current state; get_file is a blocking call, so it runs in the default executor
			
 
				             current_file = await loop.run_in_executor(
			
 
				                 None,
			
 
				-                lambda: genai.get_file(current_file.name)
			
 
				+                lambda: genai.get_file(name=file_name)
			
 
				             )
			
 
				 
			
 
				-        if current_file.state.name == "FAILED":
			
 
				-            print(f"      ❌ 视频处理失败: {current_file.state}")
			
 
				-            return None
			
 
				-
			
 
				-        return current_file
			
 
				+            # Dispatch on state: ACTIVE -> done; PROCESSING -> sleep and poll again; anything else -> failure
			
 
				+            if current_file.state.name == "ACTIVE":
			
 
				+                print(f"      ✅ 视频处理完成")
			
 
				+                return current_file
			
 
				+            elif current_file.state.name == "PROCESSING":
			
 
				+                print(f"      ⏳ 视频处理中... ({elapsed:.1f}s)")
			
 
				+                await asyncio.sleep(RETRY_WAIT_SECONDS)
			
 
				+            else:
			
 
				+                print(f"      ❌ 视频处理失败: {current_file.state.name}")
			
 
				+                return None
			
 
				 
			
 
				 
			
 
				 # ============================================================================
			
@@ -1438,8 +1481,10 @@ class PromptAdapter:
 
				             "body_text": post.body_text or "",
			
 
				         }
			
 
				 
			
 
				-        # 媒体描述
			
 
				-        if post.type == "video":
			
 
				+        # 媒体描述（检查是否真的有视频文件）
			
 
				+        # 如果video_file存在于kwargs中且为None，说明是降级策略
			
 
				+        has_video_file = kwargs.get("video_file") if "video_file" in kwargs else (post.type == "video")
			
 
				+        if post.type == "video" and has_video_file:
			
 
				             params["num_images"] = "1个视频"
			
 
				         else:
			
 
				             num_images = len(post.images) if post.images else 0
			
@@ -1999,16 +2044,20 @@ async def evaluate_post_v4(
 
				     }
			
 
				 
			
 
				     # 处理视频
			
 
				-    if post.type == "video" and post.images and len(post.images) > 0:
			
 
				-        video_url = post.images[0]  # 视频URL通常在images[0]
			
 
				-        video_file, video_uri, temp_path = await VideoUploader.upload_video(video_url)
			
 
				-        initial_state["video_file"] = video_file
			
 
				-        initial_state["video_uri"] = video_uri
			
 
				-        initial_state["temp_video_path"] = temp_path
			
 
				-
			
 
				-        if not video_file:
			
 
				-            print(f"      ❌ 视频上传失败,停止评估")
			
 
				-            return (None, None, None, None, None, None)
			
 
				+    if post.type == "video" and post.video:
			
 
				+        print(f"      📹 检测到视频帖子，准备上传视频...")
			
 
				+        media_dict, video_uri, temp_path = await VideoUploader.upload_video(post.video)
			
 
				+
			
 
				+        if media_dict:
			
 
				+            # 视频上传成功
			
 
				+            initial_state["video_file"] = media_dict  # 存储media字典
			
 
				+            initial_state["video_uri"] = video_uri
			
 
				+            initial_state["temp_video_path"] = temp_path
			
 
				+            print(f"      ✅ 视频已准备好用于评估")
			
 
				+        else:
			
 
				+            # 降级策略：使用封面图片
			
 
				+            print(f"      ⚠️  视频上传失败，降级使用封面图片+文本进行评估")
			
 
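				+            # Continue the evaluation with the cover image. NOTE(review): upload_video still returns temp_path on failure, but it is not stored in initial_state on this path - confirm the downloaded temp file gets cleaned up.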
			
 
				 
			
 
				     try:
			
 
				         # 创建并运行图