from src.common.logger import get_logger from src.common.database.database import db from src.common.database.database_model import PersonInfo # 新增导入 import copy import hashlib from typing import Any, Callable, Dict import datetime import asyncio from src.llm_models.utils_model import LLMRequest from src.config.config import global_config import json # 新增导入 from json_repair import repair_json """ PersonInfoManager 类方法功能摘要: 1. get_person_id - 根据平台和用户ID生成MD5哈希的唯一person_id 2. create_person_info - 创建新个人信息文档(自动合并默认值) 3. update_one_field - 更新单个字段值(若文档不存在则创建) 4. del_one_document - 删除指定person_id的文档 5. get_value - 获取单个字段值(返回实际值或默认值) 6. get_values - 批量获取字段值(任一字段无效则返回空字典) 7. del_all_undefined_field - 清理全集合中未定义的字段 8. get_specific_value_list - 根据指定条件,返回person_id,value字典 """ logger = get_logger("person_info") JSON_SERIALIZED_FIELDS = ["points", "forgotten_points", "info_list"] person_info_default = { "person_id": None, "person_name": None, "name_reason": None, # Corrected from person_name_reason to match common usage if intended "platform": "unknown", "user_id": "unknown", "nickname": "Unknown", "know_times": 0, "know_since": None, "last_know": None, # "user_cardname": None, # This field is not in Peewee model PersonInfo # "user_avatar": None, # This field is not in Peewee model PersonInfo "impression": None, # Corrected from persion_impression "short_impression": None, "info_list": None, "points": None, "forgotten_points": None, } class PersonInfoManager: def __init__(self): self.person_name_list = {} # TODO: API-Adapter修改标记 self.qv_name_llm = LLMRequest( model=global_config.model.utils, request_type="relation.qv_name", ) try: db.connect(reuse_if_open=True) db.create_tables([PersonInfo], safe=True) except Exception as e: logger.error(f"数据库连接或 PersonInfo 表创建失败: {e}") # 初始化时读取所有person_name try: for record in PersonInfo.select(PersonInfo.person_id, PersonInfo.person_name).where( PersonInfo.person_name.is_null(False) ): if record.person_name: self.person_name_list[record.person_id] = record.person_name logger.debug(f"已加载 {len(self.person_name_list)} 个用户名称 (Peewee)") except Exception as e: logger.error(f"从 Peewee 加载 person_name_list 失败: {e}") @staticmethod def get_person_id(platform: str, user_id: int): """获取唯一id""" if "-" in platform: platform = platform.split("-")[1] components = [platform, str(user_id)] key = "_".join(components) return hashlib.md5(key.encode()).hexdigest() async def is_person_known(self, platform: str, user_id: int): """判断是否认识某人""" person_id = self.get_person_id(platform, user_id) def _db_check_known_sync(p_id: str): return PersonInfo.get_or_none(PersonInfo.person_id == p_id) is not None try: return await asyncio.to_thread(_db_check_known_sync, person_id) except Exception as e: logger.error(f"检查用户 {person_id} 是否已知时出错 (Peewee): {e}") return False def get_person_id_by_person_name(self, person_name: str): """根据用户名获取用户ID""" try: record = PersonInfo.get_or_none(PersonInfo.person_name == person_name) if record: return record.person_id else: return "" except Exception as e: logger.error(f"根据用户名 {person_name} 获取用户ID时出错 (Peewee): {e}") return "" @staticmethod async def create_person_info(person_id: str, data: dict = None): """创建一个项""" if not person_id: logger.debug("创建失败,personid不存在") return _person_info_default = copy.deepcopy(person_info_default) model_fields = PersonInfo._meta.fields.keys() final_data = {"person_id": person_id} # Start with defaults for all model fields for key, default_value in _person_info_default.items(): if key in model_fields: final_data[key] = default_value # Override with provided data if data: for key, value in data.items(): if key in model_fields: final_data[key] = value # Ensure person_id is correctly set from the argument final_data["person_id"] = person_id # Serialize JSON fields for key in JSON_SERIALIZED_FIELDS: if key in final_data: if isinstance(final_data[key], (list, dict)): final_data[key] = json.dumps(final_data[key], ensure_ascii=False) elif final_data[key] is None: # Default for lists is [], store as "[]" final_data[key] = json.dumps([], ensure_ascii=False) # If it's already a string, assume it's valid JSON or a non-JSON string field def _db_create_sync(p_data: dict): try: PersonInfo.create(**p_data) return True except Exception as e: logger.error(f"创建 PersonInfo 记录 {p_data.get('person_id')} 失败 (Peewee): {e}") return False await asyncio.to_thread(_db_create_sync, final_data) async def update_one_field(self, person_id: str, field_name: str, value, data: dict = None): """更新某一个字段,会补全""" if field_name not in PersonInfo._meta.fields: # if field_name in person_info_default: # Keep this check if some defaults are not DB fields # logger.debug(f"更新'{field_name}'跳过,字段存在于默认配置但不在 PersonInfo Peewee 模型中。") # return logger.debug(f"更新'{field_name}'失败,未在 PersonInfo Peewee 模型中定义的字段。") return # print(f"更新字段: {field_name},值: {value}") processed_value = value if field_name in JSON_SERIALIZED_FIELDS: if isinstance(value, (list, dict)): processed_value = json.dumps(value, ensure_ascii=False, indent=None) elif value is None: # Store None as "[]" for JSON list fields processed_value = json.dumps([], ensure_ascii=False, indent=None) # If value is already a string, assume it's pre-serialized or a non-JSON string. def _db_update_sync(p_id: str, f_name: str, val_to_set): record = PersonInfo.get_or_none(PersonInfo.person_id == p_id) if record: setattr(record, f_name, val_to_set) record.save() return True, False # Found and updated, no creation needed return False, True # Not found, needs creation found, needs_creation = await asyncio.to_thread(_db_update_sync, person_id, field_name, processed_value) if needs_creation: logger.debug(f"更新时 {person_id} 不存在,将新建。") creation_data = data if data is not None else {} # Ensure platform and user_id are present for context if available from 'data' # but primarily, set the field that triggered the update. # The create_person_info will handle defaults and serialization. creation_data[field_name] = value # Pass original value to create_person_info # Ensure platform and user_id are in creation_data if available, # otherwise create_person_info will use defaults. if data and "platform" in data: creation_data["platform"] = data["platform"] if data and "user_id" in data: creation_data["user_id"] = data["user_id"] await self.create_person_info(person_id, creation_data) @staticmethod async def has_one_field(person_id: str, field_name: str): """判断是否存在某一个字段""" if field_name not in PersonInfo._meta.fields: logger.debug(f"检查字段'{field_name}'失败,未在 PersonInfo Peewee 模型中定义。") return False def _db_has_field_sync(p_id: str, f_name: str): record = PersonInfo.get_or_none(PersonInfo.person_id == p_id) if record: return True return False try: return await asyncio.to_thread(_db_has_field_sync, person_id, field_name) except Exception as e: logger.error(f"检查字段 {field_name} for {person_id} 时出错 (Peewee): {e}") return False @staticmethod def _extract_json_from_text(text: str) -> dict: """从文本中提取JSON数据的高容错方法""" try: fixed_json = repair_json(text) if isinstance(fixed_json, str): parsed_json = json.loads(fixed_json) else: parsed_json = fixed_json if isinstance(parsed_json, list) and parsed_json: parsed_json = parsed_json[0] if isinstance(parsed_json, dict): return parsed_json except Exception as e: logger.warning(f"JSON提取失败: {e}") logger.warning(f"无法从文本中提取有效的JSON字典: {text}") logger.info(f"文本: {text}") return {"nickname": "", "reason": ""} async def _generate_unique_person_name(self, base_name: str) -> str: """生成唯一的 person_name,如果存在重复则添加数字后缀""" # 处理空昵称的情况 if not base_name or base_name.isspace(): base_name = "空格" # 检查基础名称是否已存在 if base_name not in self.person_name_list.values(): return base_name # 如果存在,添加数字后缀 counter = 1 while True: new_name = f"{base_name}[{counter}]" if new_name not in self.person_name_list.values(): return new_name counter += 1 async def qv_person_name( self, person_id: str, user_nickname: str, user_cardname: str, user_avatar: str, request: str = "" ): """给某个用户取名""" if not person_id: logger.debug("取名失败:person_id不能为空") return None old_name = await self.get_value(person_id, "person_name") old_reason = await self.get_value(person_id, "name_reason") max_retries = 8 current_try = 0 existing_names_str = "" current_name_set = set(self.person_name_list.values()) while current_try < max_retries: # prompt_personality =get_individuality().get_prompt(x_person=2, level=1) bot_name = global_config.bot.nickname qv_name_prompt = f"你是{bot_name},一个伪装成人类的AI,你不能让别人发现这一点," qv_name_prompt += f"现在你想给一个用户取一个昵称,用户的qq昵称是{user_nickname}," qv_name_prompt += f"用户的qq群昵称名是{user_cardname}," if user_avatar: qv_name_prompt += f"用户的qq头像是{user_avatar}," if old_name: qv_name_prompt += f"你之前叫他{old_name},是因为{old_reason}," qv_name_prompt += f"\n其他取名的要求是:{request},不要太浮夸,简短," qv_name_prompt += "\n请根据以上用户信息,想想你叫他什么比较好,不要太浮夸,请最好使用用户的qq昵称或群昵称原文,可以稍作修改,优先使用原文。优先使用用户的qq昵称或者群昵称原文。" if existing_names_str: qv_name_prompt += f"\n请注意,以下名称已被你尝试过或已知存在,请避免:{existing_names_str}。\n" if len(current_name_set) < 50 and current_name_set: qv_name_prompt += f"已知的其他昵称有: {', '.join(list(current_name_set)[:10])}等。\n" qv_name_prompt += "请用json给出你的想法,并给出理由,示例如下:" qv_name_prompt += """{ "nickname": "昵称", "reason": "理由" }""" response, (reasoning_content, model_name) = await self.qv_name_llm.generate_response_async(qv_name_prompt) # logger.info(f"取名提示词:{qv_name_prompt}\n取名回复:{response}") result = self._extract_json_from_text(response) if not result or not result.get("nickname"): logger.error("生成的昵称为空或结果格式不正确,重试中...") current_try += 1 continue generated_nickname = result["nickname"] is_duplicate = False if generated_nickname in current_name_set: is_duplicate = True logger.info(f"尝试给用户{user_nickname} {person_id} 取名,但是 {generated_nickname} 已存在,重试中...") else: def _db_check_name_exists_sync(name_to_check): return PersonInfo.select().where(PersonInfo.person_name == name_to_check).exists() if await asyncio.to_thread(_db_check_name_exists_sync, generated_nickname): is_duplicate = True current_name_set.add(generated_nickname) if not is_duplicate: await self.update_one_field(person_id, "person_name", generated_nickname) await self.update_one_field(person_id, "name_reason", result.get("reason", "未提供理由")) logger.info( f"成功给用户{user_nickname} {person_id} 取名 {generated_nickname},理由:{result.get('reason', '未提供理由')}" ) self.person_name_list[person_id] = generated_nickname return result else: if existing_names_str: existing_names_str += "、" existing_names_str += generated_nickname logger.debug(f"生成的昵称 {generated_nickname} 已存在,重试中...") current_try += 1 # 如果多次尝试后仍未成功,使用唯一的 user_nickname 作为默认值 unique_nickname = await self._generate_unique_person_name(user_nickname) logger.warning(f"在{max_retries}次尝试后未能生成唯一昵称,使用默认昵称 {unique_nickname}") await self.update_one_field(person_id, "person_name", unique_nickname) await self.update_one_field(person_id, "name_reason", "使用用户原始昵称作为默认值") self.person_name_list[person_id] = unique_nickname return {"nickname": unique_nickname, "reason": "使用用户原始昵称作为默认值"} @staticmethod async def del_one_document(person_id: str): """删除指定 person_id 的文档""" if not person_id: logger.debug("删除失败:person_id 不能为空") return def _db_delete_sync(p_id: str): try: query = PersonInfo.delete().where(PersonInfo.person_id == p_id) deleted_count = query.execute() return deleted_count except Exception as e: logger.error(f"删除 PersonInfo {p_id} 失败 (Peewee): {e}") return 0 deleted_count = await asyncio.to_thread(_db_delete_sync, person_id) if deleted_count > 0: logger.debug(f"删除成功:person_id={person_id} (Peewee)") else: logger.debug(f"删除失败:未找到 person_id={person_id} 或删除未影响行 (Peewee)") @staticmethod async def get_value(person_id: str, field_name: str): """获取指定用户指定字段的值""" default_value_for_field = person_info_default.get(field_name) if field_name in JSON_SERIALIZED_FIELDS and default_value_for_field is None: default_value_for_field = [] # Ensure JSON fields default to [] if not in DB def _db_get_value_sync(p_id: str, f_name: str): record = PersonInfo.get_or_none(PersonInfo.person_id == p_id) if record: val = getattr(record, f_name, None) if f_name in JSON_SERIALIZED_FIELDS: if isinstance(val, str): try: return json.loads(val) except json.JSONDecodeError: logger.warning(f"字段 {f_name} for {p_id} 包含无效JSON: {val}. 返回默认值.") return [] # Default for JSON fields on error elif val is None: # Field exists in DB but is None return [] # Default for JSON fields # If val is already a list/dict (e.g. if somehow set without serialization) return val # Should ideally not happen if update_one_field is always used return val return None # Record not found try: value_from_db = await asyncio.to_thread(_db_get_value_sync, person_id, field_name) if value_from_db is not None: return value_from_db if field_name in person_info_default: return default_value_for_field logger.warning(f"字段 {field_name} 在 person_info_default 中未定义,且在数据库中未找到。") return None # Ultimate fallback except Exception as e: logger.error(f"获取字段 {field_name} for {person_id} 时出错 (Peewee): {e}") # Fallback to default in case of any error during DB access if field_name in person_info_default: return default_value_for_field return None @staticmethod def get_value_sync(person_id: str, field_name: str): """同步获取指定用户指定字段的值""" default_value_for_field = person_info_default.get(field_name) if field_name in JSON_SERIALIZED_FIELDS and default_value_for_field is None: default_value_for_field = [] record = PersonInfo.get_or_none(PersonInfo.person_id == person_id) if record: val = getattr(record, field_name, None) if field_name in JSON_SERIALIZED_FIELDS: if isinstance(val, str): try: return json.loads(val) except json.JSONDecodeError: logger.warning(f"字段 {field_name} for {person_id} 包含无效JSON: {val}. 返回默认值.") return [] elif val is None: return [] return val return val if field_name in person_info_default: return default_value_for_field logger.warning(f"字段 {field_name} 在 person_info_default 中未定义,且在数据库中未找到。") return None @staticmethod async def get_values(person_id: str, field_names: list) -> dict: """获取指定person_id文档的多个字段值,若不存在该字段,则返回该字段的全局默认值""" if not person_id: logger.debug("get_values获取失败:person_id不能为空") return {} result = {} def _db_get_record_sync(p_id: str): return PersonInfo.get_or_none(PersonInfo.person_id == p_id) record = await asyncio.to_thread(_db_get_record_sync, person_id) for field_name in field_names: if field_name not in PersonInfo._meta.fields: if field_name in person_info_default: result[field_name] = copy.deepcopy(person_info_default[field_name]) logger.debug(f"字段'{field_name}'不在Peewee模型中,使用默认配置值。") else: logger.debug(f"get_values查询失败:字段'{field_name}'未在Peewee模型和默认配置中定义。") result[field_name] = None continue if record: value = getattr(record, field_name) if value is not None: result[field_name] = value else: result[field_name] = copy.deepcopy(person_info_default.get(field_name)) else: result[field_name] = copy.deepcopy(person_info_default.get(field_name)) return result @staticmethod async def get_specific_value_list( field_name: str, way: Callable[[Any], bool], ) -> Dict[str, Any]: """ 获取满足条件的字段值字典 """ if field_name not in PersonInfo._meta.fields: logger.error(f"字段检查失败:'{field_name}'未在 PersonInfo Peewee 模型中定义") return {} def _db_get_specific_sync(f_name: str): found_results = {} try: for record in PersonInfo.select(PersonInfo.person_id, getattr(PersonInfo, f_name)): value = getattr(record, f_name) if way(value): found_results[record.person_id] = value except Exception as e_query: logger.error(f"数据库查询失败 (Peewee specific_value_list for {f_name}): {str(e_query)}", exc_info=True) return found_results try: return await asyncio.to_thread(_db_get_specific_sync, field_name) except Exception as e: logger.error(f"执行 get_specific_value_list 线程时出错: {str(e)}", exc_info=True) return {} async def get_or_create_person( self, platform: str, user_id: int, nickname: str = None, user_cardname: str = None, user_avatar: str = None ) -> str: """ 根据 platform 和 user_id 获取 person_id。 如果对应的用户不存在,则使用提供的可选信息创建新用户。 """ person_id = self.get_person_id(platform, user_id) def _db_check_exists_sync(p_id: str): return PersonInfo.get_or_none(PersonInfo.person_id == p_id) record = await asyncio.to_thread(_db_check_exists_sync, person_id) if record is None: logger.info(f"用户 {platform}:{user_id} (person_id: {person_id}) 不存在,将创建新记录 (Peewee)。") unique_nickname = await self._generate_unique_person_name(nickname) initial_data = { "person_id": person_id, "platform": platform, "user_id": str(user_id), "nickname": nickname, "person_name": unique_nickname, # 使用群昵称作为person_name "name_reason": "从群昵称获取", "know_times": 0, "know_since": int(datetime.datetime.now().timestamp()), "last_know": int(datetime.datetime.now().timestamp()), "impression": None, "points": [], "forgotten_points": [], } model_fields = PersonInfo._meta.fields.keys() filtered_initial_data = {k: v for k, v in initial_data.items() if v is not None and k in model_fields} await self.create_person_info(person_id, data=filtered_initial_data) logger.info(f"已为 {person_id} 创建新记录,初始数据 (filtered for model): {filtered_initial_data}") return person_id async def get_person_info_by_name(self, person_name: str) -> dict | None: """根据 person_name 查找用户并返回基本信息 (如果找到)""" if not person_name: logger.debug("get_person_info_by_name 获取失败:person_name 不能为空") return None found_person_id = None for pid, name_in_cache in self.person_name_list.items(): if name_in_cache == person_name: found_person_id = pid break if not found_person_id: def _db_find_by_name_sync(p_name_to_find: str): return PersonInfo.get_or_none(PersonInfo.person_name == p_name_to_find) record = await asyncio.to_thread(_db_find_by_name_sync, person_name) if record: found_person_id = record.person_id if ( found_person_id not in self.person_name_list or self.person_name_list[found_person_id] != person_name ): self.person_name_list[found_person_id] = person_name else: logger.debug(f"数据库中也未找到名为 '{person_name}' 的用户 (Peewee)") return None if found_person_id: required_fields = [ "person_id", "platform", "user_id", "nickname", "user_cardname", "user_avatar", "person_name", "name_reason", ] valid_fields_to_get = [ f for f in required_fields if f in PersonInfo._meta.fields or f in person_info_default ] person_data = await self.get_values(found_person_id, valid_fields_to_get) if person_data: final_result = {key: person_data.get(key) for key in required_fields} return final_result else: logger.warning(f"找到了 person_id '{found_person_id}' 但 get_values 返回空 (Peewee)") return None logger.error(f"逻辑错误:未能为 '{person_name}' 确定 person_id (Peewee)") return None person_info_manager = None def get_person_info_manager(): global person_info_manager if person_info_manager is None: person_info_manager = PersonInfoManager() return person_info_manager