修复私聊PFC

2025-04-23 23:48:42 +08:00
parent 7281c13a12
commit 2732f40714
13 changed files with 681 additions and 282 deletions
--- a/src/plugins/PFC/action_planner.py
+++ b/src/plugins/PFC/action_planner.py
@@ -1,4 +1,5 @@
-from typing import Tuple
+import time
+from typing import Tuple, List, Dict, Any, Optional # 确保导入了必要的类型
 from src.common.logger import get_module_logger
 from ..models.utils_model import LLMRequest
 from ...config.config import global_config
@@ -10,7 +11,8 @@ from .conversation_info import ConversationInfo

 logger = get_module_logger("action_planner")

-
+# 注意：这个 ActionPlannerInfo 类似乎没有在 ActionPlanner 中使用，
+# 如果确实没用，可以考虑移除，但暂时保留以防万一。
 class ActionPlannerInfo:
    def __init__(self):
        self.done_action = []
@@ -18,18 +20,18 @@ class ActionPlannerInfo:
        self.knowledge_list = []
        self.memory_list = []

-
+# ActionPlanner 类定义，顶格
 class ActionPlanner:
    """行动规划器"""
-
    def __init__(self, stream_id: str):
        self.llm = LLMRequest(
-            model=global_config.llm_normal,
-            temperature=global_config.llm_normal["temp"],
-            max_tokens=1000,
+            model=global_config.llm_PFC_action_planner,
+            temperature=global_config.llm_PFC_action_planner["temp"],
+            max_tokens=1500,
            request_type="action_planning",
        )
-        self.personality_info = Individuality.get_instance().get_prompt(type="personality", x_person=2, level=2)
+        self.personality_info = Individuality.get_instance().get_prompt(type="personality", x_person=2, level=3)
+        self.identity_detail_info = Individuality.get_instance().get_prompt(type="identity", x_person=2, level=2)
        self.name = global_config.BOT_NICKNAME
        self.chat_observer = ChatObserver.get_instance(stream_id)

@@ -43,140 +45,250 @@ class ActionPlanner:
        Returns:
            Tuple[str, str]: (行动类型, 行动原因)
        """
+        # --- 获取 Bot 上次发言时间信息 ---
+        time_since_last_bot_message_info = ""
+        try:
+            bot_id = str(global_config.BOT_QQ)
+            if hasattr(observation_info, 'chat_history') and observation_info.chat_history:
+                for i in range(len(observation_info.chat_history) - 1, -1, -1):
+                    msg = observation_info.chat_history[i]
+                    if not isinstance(msg, dict):
+                        continue
+                    sender_info = msg.get('user_info', {})
+                    sender_id = str(sender_info.get('user_id')) if isinstance(sender_info, dict) else None
+                    msg_time = msg.get('time')
+                    if sender_id == bot_id and msg_time:
+                        time_diff = time.time() - msg_time
+                        if time_diff < 60.0:
+                            time_since_last_bot_message_info = f"提示：你上一条成功发送的消息是在 {time_diff:.1f} 秒前。\n"
+                        break
+            else:
+                logger.debug("Observation info chat history is empty or not available for bot time check.")
+        except AttributeError:
+            logger.warning("ObservationInfo object might not have chat_history attribute yet for bot time check.")
+        except Exception as e:
+            logger.warning(f"获取 Bot 上次发言时间时出错: {e}")
+        # --- 获取 Bot 上次发言时间信息结束 ---
+
+        timeout_context = ""
+        try: # 添加 try-except 以增加健壮性
+            if hasattr(conversation_info, 'goal_list') and conversation_info.goal_list:
+                last_goal_tuple = conversation_info.goal_list[-1]
+                if isinstance(last_goal_tuple, tuple) and len(last_goal_tuple) > 0:
+                    last_goal_text = last_goal_tuple[0]
+                    if isinstance(last_goal_text, str) and "分钟，思考接下来要做什么" in last_goal_text:
+                        try:
+                            timeout_minutes_text = last_goal_text.split('，')[0].replace('你等待了','')
+                            timeout_context = f"重要提示：你刚刚因为对方长时间（{timeout_minutes_text}）没有回复而结束了等待，这可能代表在对方看来本次聊天已结束，请基于此情况规划下一步，不要重复等待前的发言。\n"
+                        except Exception:
+                            timeout_context = f"重要提示：你刚刚因为对方长时间没有回复而结束了等待，这可能代表在对方看来本次聊天已结束，请基于此情况规划下一步，不要重复等待前的发言。\n"
+            else:
+                logger.debug("Conversation info goal_list is empty or not available for timeout check.")
+        except AttributeError:
+             logger.warning("ConversationInfo object might not have goal_list attribute yet for timeout check.")
+        except Exception as e:
+             logger.warning(f"检查超时目标时出错: {e}")
+
        # 构建提示词
-        logger.debug(f"开始规划行动：当前目标: {conversation_info.goal_list}")
+        logger.debug(f"开始规划行动：当前目标: {getattr(conversation_info, 'goal_list', '不可用')}") # 使用 getattr

-        # 构建对话目标
+        # 构建对话目标 (goals_str)
        goals_str = ""
-        if conversation_info.goal_list:
-            for goal_reason in conversation_info.goal_list:
-                # 处理字典或元组格式
-                if isinstance(goal_reason, tuple):
-                    # 假设元组的第一个元素是目标，第二个元素是原因
-                    goal = goal_reason[0]
-                    reasoning = goal_reason[1] if len(goal_reason) > 1 else "没有明确原因"
-                elif isinstance(goal_reason, dict):
-                    goal = goal_reason.get("goal")
-                    reasoning = goal_reason.get("reasoning", "没有明确原因")
-                else:
-                    # 如果是其他类型，尝试转为字符串
-                    goal = str(goal_reason)
-                    reasoning = "没有明确原因"
+        try: # 添加 try-except
+            if hasattr(conversation_info, 'goal_list') and conversation_info.goal_list:
+                for goal_reason in conversation_info.goal_list:
+                    if isinstance(goal_reason, tuple) and len(goal_reason) > 0:
+                        goal = goal_reason[0]
+                        reasoning = goal_reason[1] if len(goal_reason) > 1 else "没有明确原因"
+                    elif isinstance(goal_reason, dict):
+                        goal = goal_reason.get("goal", "目标内容缺失")
+                        reasoning = goal_reason.get("reasoning", "没有明确原因")
+                    else:
+                        goal = str(goal_reason)
+                        reasoning = "没有明确原因"
+                    goal = str(goal) if goal is not None else "目标内容缺失"
+                    reasoning = str(reasoning) if reasoning is not None else "没有明确原因"
+                    goal_str += f"- 目标：{goal}\n  原因：{reasoning}\n"
+            if not goals_str: # 如果循环后 goals_str 仍为空
+                goals_str = "- 目前没有明确对话目标，请考虑设定一个。\n"
+        except AttributeError:
+             logger.warning("ConversationInfo object might not have goal_list attribute yet.")
+             goals_str = "- 获取对话目标时出错。\n"
+        except Exception as e:
+             logger.error(f"构建对话目标字符串时出错: {e}")
+             goals_str = "- 构建对话目标时出错。\n"

-                goal_str = f"目标：{goal}，产生该对话目标的原因：{reasoning}\n"
-                goals_str += goal_str
-        else:
-            goal = "目前没有明确对话目标"
-            reasoning = "目前没有明确对话目标，最好思考一个对话目标"
-            goals_str = f"目标：{goal}，产生该对话目标的原因：{reasoning}\n"
-
-        # 获取聊天历史记录
-        chat_history_list = (
-            observation_info.chat_history[-20:]
-            if len(observation_info.chat_history) >= 20
-            else observation_info.chat_history
-        )
+        # 获取聊天历史记录 (chat_history_text)
        chat_history_text = ""
-        for msg in chat_history_list:
-            chat_history_text += f"{msg.get('detailed_plain_text', '')}\n"
+        try:
+            if hasattr(observation_info, 'chat_history') and observation_info.chat_history:
+                chat_history_list = observation_info.chat_history[-20:]
+                for msg in chat_history_list:
+                    if isinstance(msg, dict) and 'detailed_plain_text' in msg:
+                        chat_history_text += f"{msg.get('detailed_plain_text', '')}\n"
+                    elif isinstance(msg, str):
+                        chat_history_text += f"{msg}\n"
+                if not chat_history_text: # 如果历史记录是空列表
+                     chat_history_text = "还没有聊天记录。\n"
+            else:
+                chat_history_text = "还没有聊天记录。\n"

-        if observation_info.new_messages_count > 0:
-            new_messages_list = observation_info.unprocessed_messages
+            if hasattr(observation_info, 'new_messages_count') and observation_info.new_messages_count > 0:
+                if hasattr(observation_info, 'unprocessed_messages') and observation_info.unprocessed_messages:
+                    new_messages_list = observation_info.unprocessed_messages
+                    chat_history_text += f"--- 以下是 {observation_info.new_messages_count} 条新消息 ---\n"
+                    for msg in new_messages_list:
+                        if isinstance(msg, dict) and 'detailed_plain_text' in msg:
+                            chat_history_text += f"{msg.get('detailed_plain_text', '')}\n"
+                        elif isinstance(msg, str):
+                            chat_history_text += f"{msg}\n"
+                    # 清理消息应该由调用者或 observation_info 内部逻辑处理，这里不再调用 clear
+                    # if hasattr(observation_info, 'clear_unprocessed_messages'):
+                    #    observation_info.clear_unprocessed_messages()
+                else:
+                    logger.warning("ObservationInfo has new_messages_count > 0 but unprocessed_messages is empty or missing.")
+        except AttributeError:
+            logger.warning("ObservationInfo object might be missing expected attributes for chat history.")
+            chat_history_text = "获取聊天记录时出错。\n"
+        except Exception as e:
+            logger.error(f"处理聊天记录时发生未知错误: {e}")
+            chat_history_text = "处理聊天记录时出错。\n"

-            chat_history_text += f"有{observation_info.new_messages_count}条新消息：\n"
-            for msg in new_messages_list:
-                chat_history_text += f"{msg.get('detailed_plain_text', '')}\n"

-            observation_info.clear_unprocessed_messages()
+        # 构建 Persona 文本 (persona_text)
+        identity_details_only = self.identity_detail_info
+        identity_addon = ""
+        if isinstance(identity_details_only, str):
+            pronouns = ["你", "我", "他"]
+            original_details = identity_details_only
+            for p in pronouns:
+                if identity_details_only.startswith(p):
+                    identity_details_only = identity_details_only[len(p):]
+                    break
+            if identity_details_only.endswith("。"):
+                 identity_details_only = identity_details_only[:-1]
+            cleaned_details = identity_details_only.strip(',， ')
+            if cleaned_details:
+                identity_addon = f"并且{cleaned_details}"
+        persona_text = f"你的名字是{self.name}，{self.personality_info}{identity_addon}。"

-        personality_text = f"你的名字是{self.name}，{self.personality_info}"
+        # --- 构建更清晰的行动历史和上一次行动结果 ---
+        action_history_summary = "你最近执行的行动历史：\n"
+        last_action_context = "关于你【上一次尝试】的行动：\n"

-        # 构建action历史文本
-        action_history_list = (
-            conversation_info.done_action[-10:]
-            if len(conversation_info.done_action) >= 10
-            else conversation_info.done_action
-        )
-        action_history_text = "你之前做的事情是："
-        for action in action_history_list:
-            if isinstance(action, dict):
-                action_type = action.get("action")
-                action_reason = action.get("reason")
-                action_status = action.get("status")
-                if action_status == "recall":
-                    action_history_text += (
-                        f"原本打算：{action_type}，但是因为有新消息，你发现这个行动不合适，所以你没做\n"
-                    )
-                elif action_status == "done":
-                    action_history_text += f"你之前做了：{action_type}，原因：{action_reason}\n"
-            elif isinstance(action, tuple):
-                # 假设元组的格式是(action_type, action_reason, action_status)
-                action_type = action[0] if len(action) > 0 else "未知行动"
-                action_reason = action[1] if len(action) > 1 else "未知原因"
-                action_status = action[2] if len(action) > 2 else "done"
-                if action_status == "recall":
-                    action_history_text += (
-                        f"原本打算：{action_type}，但是因为有新消息，你发现这个行动不合适，所以你没做\n"
-                    )
-                elif action_status == "done":
-                    action_history_text += f"你之前做了：{action_type}，原因：{action_reason}\n"
+        action_history_list = []
+        try: # 添加 try-except
+            if hasattr(conversation_info, 'done_action') and conversation_info.done_action:
+                action_history_list = conversation_info.done_action[-5:]
+            else:
+                logger.debug("Conversation info done_action is empty or not available.")
+        except AttributeError:
+             logger.warning("ConversationInfo object might not have done_action attribute yet.")
+        except Exception as e:
+             logger.error(f"访问行动历史时出错: {e}")

-        prompt = f"""{personality_text}。现在你在参与一场QQ聊天，请分析以下内容，根据信息决定下一步行动：
+        if not action_history_list:
+            action_history_summary += "- 还没有执行过行动。\n"
+            last_action_context += "- 这是你规划的第一个行动。\n"
+        else:
+            for i, action_data in enumerate(action_history_list):
+                action_type = "未知"
+                plan_reason = "未知"
+                status = "未知"
+                final_reason = ""
+                action_time = ""

-当前对话目标：{goals_str}
+                if isinstance(action_data, dict):
+                    action_type = action_data.get("action", "未知")
+                    plan_reason = action_data.get("plan_reason", "未知规划原因")
+                    status = action_data.get("status", "未知")
+                    final_reason = action_data.get("final_reason", "")
+                    action_time = action_data.get("time", "")
+                elif isinstance(action_data, tuple):
+                    if len(action_data) > 0: action_type = action_data[0]
+                    if len(action_data) > 1: plan_reason = action_data[1]
+                    if len(action_data) > 2: status = action_data[2]
+                    if status == "recall" and len(action_data) > 3: final_reason = action_data[3]

-{action_history_text}
+                reason_text = f", 失败/取消原因: {final_reason}" if final_reason else ""
+                summary_line = f"- 时间:{action_time}, 尝试行动:'{action_type}', 状态:{status}{reason_text}"
+                action_history_summary += summary_line + "\n"

-最近的对话记录：
-{chat_history_text}
+                if i == len(action_history_list) - 1:
+                    last_action_context += f"- 上次【规划】的行动是: '{action_type}'\n"
+                    last_action_context += f"- 当时规划的【原因】是: {plan_reason}\n"
+                    if status == "done":
+                        last_action_context += f"- 该行动已【成功执行】。\n"
+                    elif status == "recall":
+                        last_action_context += f"- 但该行动最终【未能执行/被取消】。\n"
+                        if final_reason:
+                             last_action_context += f"- 【重要】失败/取消的具体原因是: “{final_reason}”\n"
+                        else:
+                             last_action_context += f"- 【重要】失败/取消原因未明确记录。\n"
+                    else:
+                        last_action_context += f"- 该行动当前状态: {status}\n"

-请你接下去想想要你要做什么，可以发言，可以等待，可以倾听，可以调取知识。注意不同行动类型的要求，不要重复发言：
-行动类型：
+        # --- 构建最终的 Prompt ---
+        prompt = f"""{persona_text}。现在你在参与一场QQ聊天，请根据以下【所有信息】审慎决策下一步行动，可以发言，可以等待，可以倾听，可以调取知识：
+
+【当前对话目标】
+{goals_str if goals_str.strip() else "- 目前没有明确对话目标，请考虑设定一个。\n"}
+
+【最近行动历史概要】
+{action_history_summary}
+【上一次行动的详细情况和结果】
+{last_action_context}
+【时间和超时提示】
+{time_since_last_bot_message_info}{timeout_context}
+【最近的对话记录】(包括你已成功发送的消息 和 新收到的消息)
+{chat_history_text if chat_history_text.strip() else "还没有聊天记录。\n"}
+--- 行动决策指南 ---
+1.  **仔细分析【上一次行动的详细情况和结果】**。如果上次行动是 direct_reply 且因“内容与你上一条发言完全相同”或“高度相似”而被取消(status: recall)，那么【绝对不要】立即再次规划 direct_reply。在这种特定情况下，你应该优先考虑 wait (等待用户的新回应) 或 rethink_goal (如果对话似乎因此卡住了)。
+2.  结合【当前对话目标】和【最近的对话记录】来判断是否需要回应、回应什么。如果【最近的对话记录】中有新的用户消息，通常需要 direct_reply。如果上次行动成功，或者上次失败的原因不是重复，可以根据对话内容考虑 direct_reply。
+3.  注意【时间和超时提示】，如果对方长时间未回复（例如在 timeout_context 中提示），end_conversation 可能更合适。
+4.  只有在你确信需要发言（比如回应新消息、追问、深入话题），并且上一次行动没有因重复被拒时，才应优先选择 direct_reply。
+
+--- 可选行动类型 ---
 fetch_knowledge: 需要调取知识，当需要专业知识或特定信息时选择
-wait: 当你做出了发言,对方尚未回复时暂时等待对方的回复
+wait: 等待对方回复（尤其是在你刚发言后、或上次发言因重复被拒时、或不确定做什么时，这是较安全的选择）
 listening: 倾听对方发言，当你认为对方发言尚未结束时采用
-direct_reply: 不符合上述情况，回复对方，注意不要过多或者重复发言
-rethink_goal: 重新思考对话目标，当发现对话目标不合适时选择，会重新思考对话目标
-end_conversation: 结束对话，长时间没回复或者当你觉得谈话暂时结束时选择，停止该场对话
+direct_reply: 直接回复或发送新消息，允许适当的追问和深入话题，**但是请务必遵守上面的决策指南，避免在因重复被拒后立即使用，也不要在对方没有回复的情况下过多的“消息轰炸”或重复发言**
+rethink_goal: 重新思考对话目标，当发现对话目标不再适用或对话卡住时选择，注意私聊的环境是灵活的，有可能需要经常选择
+end_conversation: 决定结束对话，对方长时间没回复或者当你觉得谈话暂时结束时可以选择

-请以JSON格式输出，包含以下字段：
-1. action: 行动类型，注意你之前的行为
-2. reason: 选择该行动的原因，注意你之前的行为（简要解释）
+请以JSON格式输出你的决策：
+{{
+    "action": "选择的行动类型 (必须是上面列表中的一个)",
+    "reason": "选择该行动的详细原因 (必须解释你是如何根据“上一次行动结果”、“对话记录”和“决策指南”做出判断的)"
+}}

 注意：请严格按照JSON格式输出，不要包含任何其他内容。"""

-        logger.debug(f"发送到LLM的提示词: {prompt}")
+        logger.debug(f"发送到LLM的提示词 (已更新): {prompt}")
        try:
            content, _ = await self.llm.generate_response_async(prompt)
            logger.debug(f"LLM原始返回内容: {content}")

-            # 使用简化函数提取JSON内容
            success, result = get_items_from_json(
-                content, "action", "reason", default_values={"action": "direct_reply", "reason": "没有明确原因"}
+                content, "action", "reason",
+                default_values={"action": "wait", "reason": "LLM返回格式错误或未提供原因，默认等待"}
            )

-            if not success:
-                return "direct_reply", "JSON解析失败，选择直接回复"
+            action = result.get("action", "wait")
+            reason = result.get("reason", "LLM未提供原因，默认等待")

-            action = result["action"]
-            reason = result["reason"]

            # 验证action类型
-            if action not in [
-                "direct_reply",
-                "fetch_knowledge",
-                "wait",
-                "listening",
-                "rethink_goal",
-                "end_conversation",
-            ]:
-                logger.warning(f"未知的行动类型: {action}，默认使用listening")
-                action = "listening"
+            valid_actions = ["direct_reply", "fetch_knowledge", "wait", "listening", "rethink_goal", "end_conversation"]
+            if action not in valid_actions:
+                logger.warning(f"LLM返回了未知的行动类型: '{action}'，强制改为 wait")
+                reason = f"(原始行动'{action}'无效，已强制改为wait) {reason}"
+                action = "wait"

            logger.info(f"规划的行动: {action}")
            logger.info(f"行动原因: {reason}")
            return action, reason

        except Exception as e:
-            logger.error(f"规划行动时出错: {str(e)}")
-            return "direct_reply", "发生错误，选择直接回复"
+            logger.error(f"规划行动时调用 LLM 或处理结果出错: {str(e)}")
+            return "wait", f"行动规划处理中发生错误，暂时等待: {str(e)}"