feat: 超大型重构

2025-03-09 10:27:54 +08:00
parent 8754571afb
commit fe3684736a
11 changed files with 1209 additions and 566 deletions
--- a/src/plugins/chat/utils_image.py
+++ b/src/plugins/chat/utils_image.py
@@ -2,7 +2,11 @@ import base64
 import io
 import os
 import time
-import zlib  # 用于 CRC32
+import zlib
+import aiohttp
+import hashlib
+from typing import Optional, Tuple, Union
+from urllib.parse import urlparse

 from loguru import logger
 from nonebot import get_driver
@@ -10,213 +14,348 @@ from PIL import Image

 from ...common.database import Database
 from ..chat.config import global_config
-
+from ..models.utils_model import LLM_request
 driver = get_driver()
 config = driver.config

-
-
-def storage_compress_image(base64_data: str, max_size: int = 200) -> str:
-    """
-    压缩base64格式的图片到指定大小（单位：KB）并在数据库中记录图片信息
-    Args:
-        base64_data: base64编码的图片数据
-        max_size: 最大文件大小（KB）
-    Returns:
-        str: 压缩后的base64图片数据
-    """
-    try:
-        # 将base64转换为字节数据
-        image_data = base64.b64decode(base64_data)
-        
-        # 使用 CRC32 计算哈希值
-        hash_value = format(zlib.crc32(image_data) & 0xFFFFFFFF, 'x')
-        
-        # 确保图片目录存在
-        images_dir = "data/images"
-        os.makedirs(images_dir, exist_ok=True)
-        
-        # 连接数据库
-        db = Database(
-            host=config.mongodb_host,
-            port=int(config.mongodb_port),
-            db_name=config.database_name,
-            username=config.mongodb_username,
-            password=config.mongodb_password,
-            auth_source=config.mongodb_auth_source
-        )
-        
-        # 检查是否已存在相同哈希值的图片
-        collection = db.db['images']
-        existing_image = collection.find_one({'hash': hash_value})
-        
-        if existing_image:
-            print(f"\033[1;33m[提示]\033[0m 发现重复图片，使用已存在的文件: {existing_image['path']}")
-            return base64_data
-
-        # 将字节数据转换为图片对象
-        img = Image.open(io.BytesIO(image_data))
-        
-        # 如果是动图，直接返回原图
-        if getattr(img, 'is_animated', False):
-            return base64_data
-            
-        # 计算当前大小（KB）
-        current_size = len(image_data) / 1024
-        
-        # 如果已经小于目标大小，直接使用原图
-        if current_size <= max_size:
-            compressed_data = image_data
-        else:
-            # 压缩逻辑
-            # 先缩放到50%
-            new_width = int(img.width * 0.5)
-            new_height = int(img.height * 0.5)
-            img = img.resize((new_width, new_height), Image.Resampling.LANCZOS)
-            
-            # 如果缩放后的最大边长仍然大于400，继续缩放
-            max_dimension = 400
-            max_current = max(new_width, new_height)
-            if max_current > max_dimension:
-                ratio = max_dimension / max_current
-                new_width = int(new_width * ratio)
-                new_height = int(new_height * ratio)
-                img = img.resize((new_width, new_height), Image.Resampling.LANCZOS)
-            
-            # 转换为RGB模式（去除透明通道）
-            if img.mode in ('RGBA', 'P'):
-                img = img.convert('RGB')
-            
-            # 使用固定质量参数压缩
-            output = io.BytesIO()
-            img.save(output, format='JPEG', quality=85, optimize=True)
-            compressed_data = output.getvalue()
-        
-        # 生成文件名（使用时间戳和哈希值确保唯一性）
-        timestamp = int(time.time())
-        filename = f"{timestamp}_{hash_value}.jpg"
-        image_path = os.path.join(images_dir, filename)
-        
-        # 保存文件
-        with open(image_path, "wb") as f:
-            f.write(compressed_data)
-            
-        print(f"\033[1;32m[成功]\033[0m 保存图片到: {image_path}")
-        
-        try:
-            # 准备数据库记录
-            image_record = {
-                'filename': filename,
-                'path': image_path,
-                'size': len(compressed_data) / 1024,
-                'timestamp': timestamp,
-                'width': img.width,
-                'height': img.height,
-                'description': '',
-                'tags': [],
-                'type': 'image',
-                'hash': hash_value
-            }
-            
-            # 保存记录
-            collection.insert_one(image_record)
-            print("\033[1;32m[成功]\033[0m 保存图片记录到数据库")
-            
-        except Exception as db_error:
-            print(f"\033[1;31m[错误]\033[0m 数据库操作失败: {str(db_error)}")
-        
-        # 将压缩后的数据转换为base64
-        compressed_base64 = base64.b64encode(compressed_data).decode('utf-8')
-        return compressed_base64
-        
-    except Exception as e:
-        print(f"\033[1;31m[错误]\033[0m 压缩图片失败: {str(e)}")
-        import traceback
-        print(traceback.format_exc())
-        return base64_data
-
-def storage_emoji(image_data: bytes) -> bytes:
-    """
-    存储表情包到本地文件夹
-    Args:
-        image_data: 图片字节数据
-        group_id: 群组ID（仅用于日志）
-        user_id: 用户ID（仅用于日志）
-    Returns:
-        bytes: 原始图片数据
-    """
-    if not global_config.EMOJI_SAVE:
-        return image_data
-    try:
-        # 使用 CRC32 计算哈希值
-        hash_value = format(zlib.crc32(image_data) & 0xFFFFFFFF, 'x')
-        
-        # 确保表情包目录存在
-        emoji_dir = "data/emoji"
-        os.makedirs(emoji_dir, exist_ok=True)
-        
-        # 检查是否已存在相同哈希值的文件
-        for filename in os.listdir(emoji_dir):
-            if hash_value in filename:
-                # print(f"\033[1;33m[提示]\033[0m 发现重复表情包: {filename}")
-                return image_data
-        
-        # 生成文件名
-        timestamp = int(time.time())
-        filename = f"{timestamp}_{hash_value}.jpg"
-        emoji_path = os.path.join(emoji_dir, filename)
-        
-        # 直接保存原始文件
-        with open(emoji_path, "wb") as f:
-            f.write(image_data)
-            
-        print(f"\033[1;32m[成功]\033[0m 保存表情包到: {emoji_path}")
-        return image_data
-        
-    except Exception as e:
-        print(f"\033[1;31m[错误]\033[0m 保存表情包失败: {str(e)}")
-        return image_data 
+class ImageManager:
+    _instance = None
+    IMAGE_DIR = "data"  # 图像存储根目录
    
-
-def storage_image(image_data: bytes) -> bytes:
-    """
-    存储图片到本地文件夹
-    Args:
-        image_data: 图片字节数据
-        group_id: 群组ID（仅用于日志）
-        user_id: 用户ID（仅用于日志）
-    Returns:
-        bytes: 原始图片数据
-    """
-    try:
-        # 使用 CRC32 计算哈希值
-        hash_value = format(zlib.crc32(image_data) & 0xFFFFFFFF, 'x')
-        
-        # 确保表情包目录存在
-        image_dir = "data/image"
-        os.makedirs(image_dir, exist_ok=True)
-        
-        # 检查是否已存在相同哈希值的文件
-        for filename in os.listdir(image_dir):
-            if hash_value in filename:
-                # print(f"\033[1;33m[提示]\033[0m 发现重复表情包: {filename}")
-                return image_data
-        
-        # 生成文件名
-        timestamp = int(time.time())
-        filename = f"{timestamp}_{hash_value}.jpg"
-        image_path = os.path.join(image_dir, filename)
-        
-        # 直接保存原始文件
-        with open(image_path, "wb") as f:
-            f.write(image_data)
+    def __new__(cls):
+        if cls._instance is None:
+            cls._instance = super().__new__(cls)
+            cls._instance.db = None
+            cls._instance._initialized = False
+        return cls._instance
+    
+    def __init__(self):
+        if not self._initialized:
+            self.db = Database.get_instance()
+            self._ensure_image_collection()
+            self._ensure_description_collection()
+            self._ensure_image_dir()
+            self._initialized = True
+            self._llm = LLM_request(model=global_config.vlm, temperature=0.4, max_tokens=300)
            
-        print(f"\033[1;32m[成功]\033[0m 保存图片到: {image_path}")
-        return image_data
+    def _ensure_image_dir(self):
+        """确保图像存储目录存在"""
+        os.makedirs(self.IMAGE_DIR, exist_ok=True)
        
-    except Exception as e:
-        print(f"\033[1;31m[错误]\033[0m 保存图片失败: {str(e)}")
-        return image_data 
+    def _ensure_image_collection(self):
+        """确保images集合存在并创建索引"""
+        if 'images' not in self.db.db.list_collection_names():
+            self.db.db.create_collection('images')
+            # 创建索引
+            self.db.db.images.create_index([('hash', 1)], unique=True)
+            self.db.db.images.create_index([('url', 1)])
+            self.db.db.images.create_index([('path', 1)])
+
+    def _ensure_description_collection(self):
+        """确保image_descriptions集合存在并创建索引"""
+        if 'image_descriptions' not in self.db.db.list_collection_names():
+            self.db.db.create_collection('image_descriptions')
+            # 创建索引
+            self.db.db.image_descriptions.create_index([('hash', 1)], unique=True)
+            self.db.db.image_descriptions.create_index([('type', 1)])
+
+    async def _get_description_from_db(self, image_hash: str, description_type: str) -> Optional[str]:
+        """从数据库获取图片描述
+        
+        Args:
+            image_hash: 图片哈希值
+            description_type: 描述类型 ('emoji' 或 'image')
+            
+        Returns:
+            Optional[str]: 描述文本，如果不存在则返回None
+        """
+        result = await self.db.db.image_descriptions.find_one({
+            'hash': image_hash,
+            'type': description_type
+        })
+        return result['description'] if result else None
+
+    async def _save_description_to_db(self, image_hash: str, description: str, description_type: str) -> None:
+        """保存图片描述到数据库
+        
+        Args:
+            image_hash: 图片哈希值
+            description: 描述文本
+            description_type: 描述类型 ('emoji' 或 'image')
+        """
+        await self.db.db.image_descriptions.update_one(
+            {'hash': image_hash, 'type': description_type},
+            {
+                '$set': {
+                    'description': description,
+                    'timestamp': int(time.time())
+                }
+            },
+            upsert=True
+        )
+
+    async def save_image(self, 
+                        image_data: Union[str, bytes], 
+                        url: str = None, 
+                        description: str = None, 
+                        is_base64: bool = False) -> Optional[str]:
+        """保存图像
+        Args:
+            image_data: 图像数据(base64字符串或字节)
+            url: 图像URL
+            description: 图像描述
+            is_base64: image_data是否为base64格式
+        Returns:
+            str: 保存后的文件路径,失败返回None
+        """
+        try:
+            # 转换为字节格式
+            if is_base64:
+                if isinstance(image_data, str):
+                    image_bytes = base64.b64decode(image_data)
+                else:
+                    return None
+            else:
+                if isinstance(image_data, bytes):
+                    image_bytes = image_data
+                else:
+                    return None
+                    
+            # 计算哈希值
+            image_hash = hashlib.md5(image_bytes).hexdigest()
+            
+            # 查重
+            existing = self.db.db.images.find_one({'hash': image_hash})
+            if existing:
+                return existing['path']
+                
+            # 生成文件名和路径
+            timestamp = int(time.time())
+            filename = f"{timestamp}_{image_hash[:8]}.jpg"
+            file_path = os.path.join(self.IMAGE_DIR, filename)
+            
+            # 保存文件
+            with open(file_path, "wb") as f:
+                f.write(image_bytes)
+                
+            # 保存到数据库
+            image_doc = {
+                'hash': image_hash,
+                'path': file_path,
+                'url': url,
+                'description': description,
+                'timestamp': timestamp
+            }
+            self.db.db.images.insert_one(image_doc)
+            
+            return file_path
+            
+        except Exception as e:
+            logger.error(f"保存图像失败: {str(e)}")
+            return None
+            
+    async def get_image_by_url(self, url: str) -> Optional[str]:
+        """根据URL获取图像路径(带查重)
+        Args:
+            url: 图像URL
+        Returns:
+            str: 本地文件路径,不存在返回None
+        """
+        try:
+            # 先查找是否已存在
+            existing = self.db.db.images.find_one({'url': url})
+            if existing:
+                return existing['path']
+                
+            # 下载图像
+            async with aiohttp.ClientSession() as session:
+                async with session.get(url) as resp:
+                    if resp.status == 200:
+                        image_bytes = await resp.read()
+                        return await self.save_image(image_bytes, url=url)
+            return None
+            
+        except Exception as e:
+            logger.error(f"获取图像失败: {str(e)}")
+            return None
+            
+    async def get_base64_by_url(self, url: str) -> Optional[str]:
+        """根据URL获取base64(带查重)
+        Args:
+            url: 图像URL
+        Returns:
+            str: base64字符串,失败返回None
+        """
+        try:
+            image_path = await self.get_image_by_url(url)
+            if not image_path:
+                return None
+                
+            with open(image_path, 'rb') as f:
+                image_bytes = f.read()
+                return base64.b64encode(image_bytes).decode('utf-8')
+                
+        except Exception as e:
+            logger.error(f"获取base64失败: {str(e)}")
+            return None
+            
+    async def save_base64_image(self, base64_str: str, description: str = None) -> Optional[str]:
+        """保存base64图像(带查重)
+        Args:
+            base64_str: base64字符串
+            description: 图像描述
+        Returns:
+            str: 保存路径,失败返回None
+        """
+        return await self.save_image(base64_str, description=description, is_base64=True)
+        
+    def check_url_exists(self, url: str) -> bool:
+        """检查URL是否已存在
+        Args:
+            url: 图像URL
+        Returns:
+            bool: 是否存在
+        """
+        return self.db.db.images.find_one({'url': url}) is not None
+        
+    def check_hash_exists(self, image_data: Union[str, bytes], is_base64: bool = False) -> bool:
+        """检查图像是否已存在
+        Args:
+            image_data: 图像数据(base64或字节)
+            is_base64: 是否为base64格式
+        Returns:
+            bool: 是否存在
+        """
+        try:
+            if is_base64:
+                if isinstance(image_data, str):
+                    image_bytes = base64.b64decode(image_data)
+                else:
+                    return False
+            else:
+                if isinstance(image_data, bytes):
+                    image_bytes = image_data
+                else:
+                    return False
+                    
+            image_hash = hashlib.md5(image_bytes).hexdigest()
+            return self.db.db.images.find_one({'hash': image_hash}) is not None
+            
+        except Exception as e:
+            logger.error(f"检查哈希失败: {str(e)}")
+            return False
+        
+    async def get_emoji_description(self, image_base64: str) -> str:
+        """获取表情包描述，带查重和保存功能"""
+        try:
+            # 计算图片哈希
+            image_bytes = base64.b64decode(image_base64)
+            image_hash = hashlib.md5(image_bytes).hexdigest()
+            
+            # 查询缓存的描述
+            cached_description = await self._get_description_from_db(image_hash, 'emoji')
+            if cached_description:
+                return f"[表情包：{cached_description}]"
+
+            # 调用AI获取描述
+            prompt = "这是一个表情包，使用中文简洁的描述一下表情包的内容和表情包所表达的情感"
+            description, _ = await self._llm.generate_response_for_image(prompt, image_base64)
+            
+            # 根据配置决定是否保存图片
+            if global_config.EMOJI_SAVE:
+                # 生成文件名和路径
+                timestamp = int(time.time())
+                filename = f"emoji_{timestamp}_{image_hash[:8]}.jpg"
+                file_path = os.path.join(self.IMAGE_DIR, filename)
+                
+                try:
+                    # 保存文件
+                    with open(file_path, "wb") as f:
+                        f.write(image_bytes)
+                    
+                    # 保存到数据库
+                    image_doc = {
+                        'hash': image_hash,
+                        'path': file_path,
+                        'type': 'emoji',
+                        'description': description,
+                        'timestamp': timestamp
+                    }
+                    await self.db.db.images.update_one(
+                        {'hash': image_hash},
+                        {'$set': image_doc},
+                        upsert=True
+                    )
+                    logger.success(f"保存表情包: {file_path}")
+                except Exception as e:
+                    logger.error(f"保存表情包文件失败: {str(e)}")
+            
+            # 保存描述到数据库
+            await self._save_description_to_db(image_hash, description, 'emoji')
+            
+            return f"[表情包：{description}]"
+        except Exception as e:
+            logger.error(f"获取表情包描述失败: {str(e)}")
+            return "[表情包]"
+
+    async def get_image_description(self, image_base64: str) -> str:
+        """获取普通图片描述，带查重和保存功能"""
+        try:
+            # 计算图片哈希
+            image_bytes = base64.b64decode(image_base64)
+            image_hash = hashlib.md5(image_bytes).hexdigest()
+            
+            # 查询缓存的描述
+            cached_description = await self._get_description_from_db(image_hash, 'image')
+            if cached_description:
+                return f"[图片：{cached_description}]"
+
+            # 调用AI获取描述
+            prompt = "请用中文描述这张图片的内容。如果有文字，请把文字都描述出来。并尝试猜测这个图片的含义。最多200个字。"
+            description, _ = await self._llm.generate_response_for_image(prompt, image_base64)
+            
+            # 根据配置决定是否保存图片
+            if global_config.EMOJI_SAVE:
+                # 生成文件名和路径
+                timestamp = int(time.time())
+                filename = f"image_{timestamp}_{image_hash[:8]}.jpg"
+                file_path = os.path.join(self.IMAGE_DIR, filename)
+                
+                try:
+                    # 保存文件
+                    with open(file_path, "wb") as f:
+                        f.write(image_bytes)
+                    
+                    # 保存到数据库
+                    image_doc = {
+                        'hash': image_hash,
+                        'path': file_path,
+                        'type': 'image',
+                        'description': description,
+                        'timestamp': timestamp
+                    }
+                    await self.db.db.images.update_one(
+                        {'hash': image_hash},
+                        {'$set': image_doc},
+                        upsert=True
+                    )
+                    logger.success(f"保存图片: {file_path}")
+                except Exception as e:
+                    logger.error(f"保存图片文件失败: {str(e)}")
+            
+            # 保存描述到数据库
+            await self._save_description_to_db(image_hash, description, 'image')
+            
+            return f"[图片：{description}]"
+        except Exception as e:
+            logger.error(f"获取图片描述失败: {str(e)}")
+            return "[图片]"
+
+
+
+# 创建全局单例
+image_manager = ImageManager()
+

 def compress_base64_image_by_scale(base64_data: str, target_size: int = 0.8 * 1024 * 1024) -> str:
    """压缩base64格式的图片到指定大小