fix: 修复 VLM 解析

2025-12-06 08:39:58 +08:00
parent 5757999ae5
commit 767aad407a
1 changed files with 43 additions and 12 deletions
--- a/src/chat/emoji_system/emoji_manager.py
+++ b/src/chat/emoji_system/emoji_manager.py
@@ -4,6 +4,7 @@ import binascii
 import hashlib
 import io
 import json
 import json_repair
 import os
 import random
 import re
@@ -1023,6 +1024,15 @@ class EmojiManager:
    -   必须是表情包，非普通截图。
    -   图中文字不超过5个。
 请确保你的最终输出是严格的JSON对象，不要添加任何额外解释或文本。
 输出格式:
 ```json
 {{
  "detailed_description": "",
  "keywords": [],
  "refined_sentence": "",
  "is_compliant": true
 }}
 ```
 """
                image_data_for_vlm, image_format_for_vlm = image_base64, image_format
@@ -1042,16 +1052,14 @@ class EmojiManager:
                        if not vlm_response_str:
                            continue
-                        match = re.search(r"\{.*\}", vlm_response_str, re.DOTALL)
+                        vlm_response_json = self._parse_json_response(vlm_response_str)
-                        if match:
+                        description = vlm_response_json.get("detailed_description", "")
-                            vlm_response_json = json.loads(match.group(0))
+                        emotions = vlm_response_json.get("keywords", [])
-                            description = vlm_response_json.get("detailed_description", "")
+                        refined_description = vlm_response_json.get("refined_sentence", "")
-                            emotions = vlm_response_json.get("keywords", [])
+                        is_compliant = vlm_response_json.get("is_compliant", False)
-                            refined_description = vlm_response_json.get("refined_sentence", "")
+                        if description and emotions and refined_description:
-                            is_compliant = vlm_response_json.get("is_compliant", False)
+                            logger.info("[VLM分析] 成功解析VLM返回的JSON数据。")
-                            if description and emotions and refined_description:
+                            break
                                logger.info("[VLM分析] 成功解析VLM返回的JSON数据。")
                                break
                        logger.warning("[VLM分析] VLM返回的JSON数据不完整或格式错误，准备重试。")
                    except (json.JSONDecodeError, AttributeError) as e:
                        logger.error(f"VLM JSON解析失败 (第 {i+1}/3 次): {e}")
@@ -1196,6 +1204,29 @@ class EmojiManager:
                    logger.error(f"[错误] 删除异常处理文件时出错: {remove_error}")
            return False
    @classmethod
    def _parse_json_response(cls, response: str) -> dict[str, Any] | None:
        """解析 LLM 的 JSON 响应"""
        try:
            # 尝试提取 JSON 代码块
            json_match = re.search(r"```json\s*(.*?)\s*```", response, re.DOTALL)
            if json_match:
                json_str = json_match.group(1)
            else:
                # 尝试直接解析
                json_str = response.strip()
            # 移除可能的注释
            json_str = re.sub(r"//.*", "", json_str)
            json_str = re.sub(r"/\*.*?\*/", "", json_str, flags=re.DOTALL)
            data = json_repair.loads(json_str)
            return data
        except json.JSONDecodeError as e:
            logger.warning(f"JSON 解析失败: {e}, 响应: {response[:200]}")
            return None
 emoji_manager = None