feat：统一normal和focus的动作调整,emoji统一可选随机激活或llm激活

2025-07-06 18:36:14 +08:00
parent 6c117742a9
commit 498d72384f
20 changed files with 217 additions and 748 deletions
--- a/src/chat/planner_actions/action_modifier.py
+++ b/src/chat/planner_actions/action_modifier.py
@@ -0,0 +1,548 @@
+from typing import List, Optional, Any, Dict
+from src.chat.heart_flow.observation.observation import Observation
+from src.common.logger import get_logger
+from src.chat.heart_flow.observation.hfcloop_observation import HFCloopObservation
+from src.chat.heart_flow.observation.chatting_observation import ChattingObservation
+from src.chat.message_receive.chat_stream import get_chat_manager
+from src.config.config import global_config
+from src.llm_models.utils_model import LLMRequest
+import random
+import asyncio
+import hashlib
+import time
+from src.chat.planner_actions.action_manager import ActionManager
+from src.chat.utils.chat_message_builder import get_raw_msg_before_timestamp_with_chat, build_readable_messages
+
+logger = get_logger("action_manager")
+
+
+class ActionModifier:
+    """动作处理器
+
+    用于处理Observation对象和根据激活类型处理actions。
+    集成了原有的modify_actions功能和新的激活类型处理功能。
+    支持并行判定和智能缓存优化。
+    """
+
+    def __init__(self, action_manager: ActionManager, chat_id: str):
+        """初始化动作处理器"""
+        self.chat_id = chat_id
+        self.chat_stream = get_chat_manager().get_stream(self.chat_id)
+        self.log_prefix = f"[{get_chat_manager().get_stream_name(self.chat_id) or self.chat_id}]"
+
+        self.action_manager = action_manager
+
+        # 用于LLM判定的小模型
+        self.llm_judge = LLMRequest(
+            model=global_config.model.utils_small,
+            request_type="action.judge",
+        )
+
+        # 缓存相关属性
+        self._llm_judge_cache = {}  # 缓存LLM判定结果
+        self._cache_expiry_time = 30  # 缓存过期时间（秒）
+        self._last_context_hash = None  # 上次上下文的哈希值
+
+    async def modify_actions(
+        self,
+        mode: str = "focus",
+        observations: Optional[List[Observation]] = None,
+        message_content: str = "",
+    ):
+        """
+        动作修改流程，整合传统观察处理和新的激活类型判定
+
+        这个方法处理完整的动作管理流程：
+        1. 基于观察的传统动作修改（循环历史分析、类型匹配等）
+        2. 基于激活类型的智能动作判定，最终确定可用动作集
+
+        处理后，ActionManager 将包含最终的可用动作集，供规划器直接使用
+        """
+        logger.debug(f"{self.log_prefix}开始完整动作修改流程")
+
+        removals_s1 = []
+        removals_s2 = []
+        
+        self.action_manager.restore_actions()
+        all_actions = self.action_manager.get_using_actions_for_mode(mode)
+        
+        message_list_before_now_half = get_raw_msg_before_timestamp_with_chat(
+            chat_id=self.chat_stream.stream_id,
+            timestamp=time.time(),
+            limit=int(global_config.chat.max_context_size * 0.5),
+        )
+        chat_content = build_readable_messages(
+            message_list_before_now_half,
+            replace_bot_name=True,
+            merge_messages=False,
+            timestamp_mode="relative",
+            read_mark=0.0,
+            show_actions=True,
+        )
+        
+        if message_content:
+            chat_content = chat_content + "\n" + f"现在，最新的消息是：{message_content}"
+
+        # === 第一阶段：传统观察处理 ===
+        if observations:
+            for obs in observations:
+                if isinstance(obs, HFCloopObservation):
+                    # 获取适用于FOCUS模式的动作
+                    removals_from_loop = await self.analyze_loop_actions(obs)
+                    if removals_from_loop:
+                        removals_s1.extend(removals_from_loop)
+
+        # 检查动作的关联类型
+        chat_context = self.chat_stream.context
+        type_mismatched_actions = self._check_action_associated_types(all_actions, chat_context)
+
+        if type_mismatched_actions:
+            removals_s1.extend(type_mismatched_actions)
+
+        # 应用第一阶段的移除
+        for action_name, reason in removals_s1:
+            self.action_manager.remove_action_from_using(action_name)
+            logger.debug(f"{self.log_prefix}阶段一移除动作: {action_name}，原因: {reason}")
+
+
+        # === 第二阶段：激活类型判定 ===
+        if chat_content is not None:
+            logger.debug(f"{self.log_prefix}开始激活类型判定阶段")
+
+            # 获取当前使用的动作集（经过第一阶段处理）
+            current_using_actions = self.action_manager.get_using_actions_for_mode(mode)
+            
+            # 获取因激活类型判定而需要移除的动作
+            removals_s2 = await self._get_deactivated_actions_by_type(
+                current_using_actions,
+                mode,
+                chat_content,
+            )
+
+            # 应用第二阶段的移除
+            for action_name, reason in removals_s2:
+                self.action_manager.remove_action_from_using(action_name)
+                logger.debug(f"{self.log_prefix}阶段二移除动作: {action_name}，原因: {reason}")
+        
+        # === 统一日志记录 ===
+        all_removals = removals_s1 + removals_s2
+        if all_removals:
+            removals_summary = " | ".join([f"{name}({reason})" for name, reason in all_removals])
+
+        logger.info(
+            f"{self.log_prefix}{mode}模式动作修改流程结束，最终可用动作: {list(self.action_manager.get_using_actions_for_mode(mode).keys())}||移除记录: {removals_summary}"
+        )
+
+    def _check_action_associated_types(self, all_actions, chat_context):
+        type_mismatched_actions = []
+        for action_name, data in all_actions.items():
+            if data.get("associated_types"):
+                if not chat_context.check_types(data["associated_types"]):
+                    associated_types_str = ", ".join(data["associated_types"])
+                    reason = f"适配器不支持（需要: {associated_types_str}）"
+                    type_mismatched_actions.append((action_name, reason))
+                    logger.debug(
+                        f"{self.log_prefix}决定移除动作: {action_name}，原因: {reason}"
+                    )
+        return type_mismatched_actions
+    
+    async def _get_deactivated_actions_by_type(
+        self,
+        actions_with_info: Dict[str, Any],
+        mode: str = "focus",
+        chat_content: str = "",
+    ) -> List[tuple[str, str]]:
+        """
+        根据激活类型过滤，返回需要停用的动作列表及原因
+
+        Args:
+            actions_with_info: 带完整信息的动作字典
+            chat_content: 聊天内容
+
+        Returns:
+            List[Tuple[str, str]]: 需要停用的 (action_name, reason) 元组列表
+        """
+        deactivated_actions = []
+
+        # 分类处理不同激活类型的actions
+        llm_judge_actions = {}
+        
+        actions_to_check = list(actions_with_info.items())
+        random.shuffle(actions_to_check)
+
+        for action_name, action_info in actions_to_check:
+            activation_type = f"{mode}_activation_type"
+            activation_type = action_info.get(activation_type, "always")
+
+            if activation_type == "always":
+                continue  # 总是激活，无需处理
+
+            elif activation_type == "random":
+                probability = action_info.get("random_activation_probability", ActionManager.DEFAULT_RANDOM_PROBABILITY)
+                if not (random.random() < probability):
+                    reason = f"RANDOM类型未触发（概率{probability}）"
+                    deactivated_actions.append((action_name, reason))
+                    logger.debug(f"{self.log_prefix}未激活动作: {action_name}，原因: {reason}")
+
+            elif activation_type == "keyword":
+                if not self._check_keyword_activation(action_name, action_info, chat_content):
+                    keywords = action_info.get("activation_keywords", [])
+                    reason = f"关键词未匹配（关键词: {keywords}）"
+                    deactivated_actions.append((action_name, reason))
+                    logger.debug(f"{self.log_prefix}未激活动作: {action_name}，原因: {reason}")
+
+            elif activation_type == "llm_judge":
+                llm_judge_actions[action_name] = action_info
+            
+            else:
+                logger.warning(f"{self.log_prefix}未知的激活类型: {activation_type}，跳过处理")
+
+        # 并行处理LLM_JUDGE类型
+        if llm_judge_actions:
+            llm_results = await self._process_llm_judge_actions_parallel(
+                llm_judge_actions,
+                chat_content,
+            )
+            for action_name, should_activate in llm_results.items():
+                if not should_activate:
+                    reason = "LLM判定未激活"
+                    deactivated_actions.append((action_name, reason))
+                    logger.debug(f"{self.log_prefix}未激活动作: {action_name}，原因: {reason}")
+
+        return deactivated_actions
+
+    async def process_actions_for_planner(
+        self, observed_messages_str: str = "", chat_context: Optional[str] = None, extra_context: Optional[str] = None
+    ) -> Dict[str, Any]:
+        """
+        [已废弃] 此方法现在已被整合到 modify_actions() 中
+
+        为了保持向后兼容性而保留，但建议直接使用 ActionManager.get_using_actions()
+        规划器应该直接从 ActionManager 获取最终的可用动作集，而不是调用此方法
+
+        新的架构：
+        1. 主循环调用 modify_actions() 处理完整的动作管理流程
+        2. 规划器直接使用 ActionManager.get_using_actions() 获取最终动作集
+        """
+        logger.warning(
+            f"{self.log_prefix}process_actions_for_planner() 已废弃，建议规划器直接使用 ActionManager.get_using_actions()"
+        )
+
+        # 为了向后兼容，仍然返回当前使用的动作集
+        current_using_actions = self.action_manager.get_using_actions()
+        all_registered_actions = self.action_manager.get_registered_actions()
+
+        # 构建完整的动作信息
+        result = {}
+        for action_name in current_using_actions.keys():
+            if action_name in all_registered_actions:
+                result[action_name] = all_registered_actions[action_name]
+
+        return result
+
+    def _generate_context_hash(self, chat_content: str) -> str:
+        """生成上下文的哈希值用于缓存"""
+        context_content = f"{chat_content}"
+        return hashlib.md5(context_content.encode("utf-8")).hexdigest()
+
+    async def _process_llm_judge_actions_parallel(
+        self,
+        llm_judge_actions: Dict[str, Any],
+        chat_content: str = "",
+    ) -> Dict[str, bool]:
+        """
+        并行处理LLM判定actions，支持智能缓存
+
+        Args:
+            llm_judge_actions: 需要LLM判定的actions
+            chat_content: 聊天内容
+
+        Returns:
+            Dict[str, bool]: action名称到激活结果的映射
+        """
+
+        # 生成当前上下文的哈希值
+        current_context_hash = self._generate_context_hash(chat_content)
+        current_time = time.time()
+
+        results = {}
+        tasks_to_run = {}
+
+        # 检查缓存
+        for action_name, action_info in llm_judge_actions.items():
+            cache_key = f"{action_name}_{current_context_hash}"
+
+            # 检查是否有有效的缓存
+            if (
+                cache_key in self._llm_judge_cache
+                and current_time - self._llm_judge_cache[cache_key]["timestamp"] < self._cache_expiry_time
+            ):
+                results[action_name] = self._llm_judge_cache[cache_key]["result"]
+                logger.debug(
+                    f"{self.log_prefix}使用缓存结果 {action_name}: {'激活' if results[action_name] else '未激活'}"
+                )
+            else:
+                # 需要进行LLM判定
+                tasks_to_run[action_name] = action_info
+
+        # 如果有需要运行的任务，并行执行
+        if tasks_to_run:
+            logger.debug(f"{self.log_prefix}并行执行LLM判定，任务数: {len(tasks_to_run)}")
+
+            # 创建并行任务
+            tasks = []
+            task_names = []
+
+            for action_name, action_info in tasks_to_run.items():
+                task = self._llm_judge_action(
+                    action_name,
+                    action_info,
+                    chat_content,
+                )
+                tasks.append(task)
+                task_names.append(action_name)
+
+            # 并行执行所有任务
+            try:
+                task_results = await asyncio.gather(*tasks, return_exceptions=True)
+
+                # 处理结果并更新缓存
+                for _, (action_name, result) in enumerate(zip(task_names, task_results)):
+                    if isinstance(result, Exception):
+                        logger.error(f"{self.log_prefix}LLM判定action {action_name} 时出错: {result}")
+                        results[action_name] = False
+                    else:
+                        results[action_name] = result
+
+                        # 更新缓存
+                        cache_key = f"{action_name}_{current_context_hash}"
+                        self._llm_judge_cache[cache_key] = {"result": result, "timestamp": current_time}
+
+                logger.debug(f"{self.log_prefix}并行LLM判定完成，耗时: {time.time() - current_time:.2f}s")
+
+            except Exception as e:
+                logger.error(f"{self.log_prefix}并行LLM判定失败: {e}")
+                # 如果并行执行失败，为所有任务返回False
+                for action_name in tasks_to_run.keys():
+                    results[action_name] = False
+
+        # 清理过期缓存
+        self._cleanup_expired_cache(current_time)
+
+        return results
+
+    def _cleanup_expired_cache(self, current_time: float):
+        """清理过期的缓存条目"""
+        expired_keys = []
+        for cache_key, cache_data in self._llm_judge_cache.items():
+            if current_time - cache_data["timestamp"] > self._cache_expiry_time:
+                expired_keys.append(cache_key)
+
+        for key in expired_keys:
+            del self._llm_judge_cache[key]
+
+        if expired_keys:
+            logger.debug(f"{self.log_prefix}清理了 {len(expired_keys)} 个过期缓存条目")
+
+    async def _llm_judge_action(
+        self,
+        action_name: str,
+        action_info: Dict[str, Any],
+        chat_content: str = "",
+    ) -> bool:
+        """
+        使用LLM判定是否应该激活某个action
+
+        Args:
+            action_name: 动作名称
+            action_info: 动作信息
+            observed_messages_str: 观察到的聊天消息
+            chat_context: 聊天上下文
+            extra_context: 额外上下文
+
+        Returns:
+            bool: 是否应该激活此action
+        """
+
+        try:
+            # 构建判定提示词
+            action_description = action_info.get("description", "")
+            action_require = action_info.get("require", [])
+            custom_prompt = action_info.get("llm_judge_prompt", "")
+
+            # 构建基础判定提示词
+            base_prompt = f"""
+你需要判断在当前聊天情况下，是否应该激活名为"{action_name}"的动作。
+
+动作描述：{action_description}
+
+动作使用场景：
+"""
+            for req in action_require:
+                base_prompt += f"- {req}\n"
+
+            if custom_prompt:
+                base_prompt += f"\n额外判定条件：\n{custom_prompt}\n"
+
+            if chat_content:
+                base_prompt += f"\n当前聊天记录：\n{chat_content}\n"
+
+            base_prompt += """
+请根据以上信息判断是否应该激活这个动作。
+只需要回答"是"或"否"，不要有其他内容。
+"""
+
+            # 调用LLM进行判定
+            response, _ = await self.llm_judge.generate_response_async(prompt=base_prompt)
+
+            # 解析响应
+            response = response.strip().lower()
+
+            # print(base_prompt)
+            # print(f"LLM判定动作 {action_name}：响应='{response}'")
+
+            should_activate = "是" in response or "yes" in response or "true" in response
+
+            logger.debug(
+                f"{self.log_prefix}LLM判定动作 {action_name}：响应='{response}'，结果={'激活' if should_activate else '不激活'}"
+            )
+            return should_activate
+
+        except Exception as e:
+            logger.error(f"{self.log_prefix}LLM判定动作 {action_name} 时出错: {e}")
+            # 出错时默认不激活
+            return False
+
+    def _check_keyword_activation(
+        self,
+        action_name: str,
+        action_info: Dict[str, Any],
+        chat_content: str = "",
+    ) -> bool:
+        """
+        检查是否匹配关键词触发条件
+
+        Args:
+            action_name: 动作名称
+            action_info: 动作信息
+            observed_messages_str: 观察到的聊天消息
+            chat_context: 聊天上下文
+            extra_context: 额外上下文
+
+        Returns:
+            bool: 是否应该激活此action
+        """
+
+        activation_keywords = action_info.get("activation_keywords", [])
+        case_sensitive = action_info.get("keyword_case_sensitive", False)
+
+        if not activation_keywords:
+            logger.warning(f"{self.log_prefix}动作 {action_name} 设置为关键词触发但未配置关键词")
+            return False
+
+        # 构建检索文本
+        search_text = ""
+        if chat_content:
+            search_text += chat_content
+        # if chat_context:
+        # search_text += f" {chat_context}"
+        # if extra_context:
+        # search_text += f" {extra_context}"
+
+        # 如果不区分大小写，转换为小写
+        if not case_sensitive:
+            search_text = search_text.lower()
+
+        # 检查每个关键词
+        matched_keywords = []
+        for keyword in activation_keywords:
+            check_keyword = keyword if case_sensitive else keyword.lower()
+            if check_keyword in search_text:
+                matched_keywords.append(keyword)
+
+        if matched_keywords:
+            logger.debug(f"{self.log_prefix}动作 {action_name} 匹配到关键词: {matched_keywords}")
+            return True
+        else:
+            logger.debug(f"{self.log_prefix}动作 {action_name} 未匹配到任何关键词: {activation_keywords}")
+            return False
+
+    async def analyze_loop_actions(self, obs: HFCloopObservation) -> List[tuple[str, str]]:
+        """分析最近的循环内容并决定动作的移除
+
+        Returns:
+            List[Tuple[str, str]]: 包含要删除的动作及原因的元组列表
+                [("action3", "some reason")]
+        """
+        removals = []
+
+        # 获取最近10次循环
+        recent_cycles = obs.history_loop[-10:] if len(obs.history_loop) > 10 else obs.history_loop
+        if not recent_cycles:
+            return removals
+
+        reply_sequence = []  # 记录最近的动作序列
+
+        for cycle in recent_cycles:
+            action_result = cycle.loop_plan_info.get("action_result", {})
+            action_type = action_result.get("action_type", "unknown")
+            reply_sequence.append(action_type == "reply")
+
+        # 计算连续回复的相关阈值
+
+        max_reply_num = int(global_config.focus_chat.consecutive_replies * 3.2)
+        sec_thres_reply_num = int(global_config.focus_chat.consecutive_replies * 2)
+        one_thres_reply_num = int(global_config.focus_chat.consecutive_replies * 1.5)
+
+        # 获取最近max_reply_num次的reply状态
+        if len(reply_sequence) >= max_reply_num:
+            last_max_reply_num = reply_sequence[-max_reply_num:]
+        else:
+            last_max_reply_num = reply_sequence[:]
+
+        # 详细打印阈值和序列信息，便于调试
+        logger.info(
+            f"连续回复阈值: max={max_reply_num}, sec={sec_thres_reply_num}, one={one_thres_reply_num}，"
+            f"最近reply序列: {last_max_reply_num}"
+        )
+        # print(f"consecutive_replies: {consecutive_replies}")
+
+        # 根据最近的reply情况决定是否移除reply动作
+        if len(last_max_reply_num) >= max_reply_num and all(last_max_reply_num):
+            # 如果最近max_reply_num次都是reply，直接移除
+            reason = f"连续回复过多（最近{len(last_max_reply_num)}次全是reply，超过阈值{max_reply_num}）"
+            removals.append(("reply", reason))
+            # reply_count = len(last_max_reply_num) - no_reply_count
+        elif len(last_max_reply_num) >= sec_thres_reply_num and all(last_max_reply_num[-sec_thres_reply_num:]):
+            # 如果最近sec_thres_reply_num次都是reply，40%概率移除
+            removal_probability = 0.4 / global_config.focus_chat.consecutive_replies
+            if random.random() < removal_probability:
+                reason = f"连续回复较多（最近{sec_thres_reply_num}次全是reply，{removal_probability:.2f}概率移除，触发移除）"
+                removals.append(("reply", reason))
+        elif len(last_max_reply_num) >= one_thres_reply_num and all(last_max_reply_num[-one_thres_reply_num:]):
+            # 如果最近one_thres_reply_num次都是reply，20%概率移除
+            removal_probability = 0.2 / global_config.focus_chat.consecutive_replies
+            if random.random() < removal_probability:
+                reason = f"连续回复检测（最近{one_thres_reply_num}次全是reply，{removal_probability:.2f}概率移除，触发移除）"
+                removals.append(("reply", reason))
+        else:
+            logger.debug(f"{self.log_prefix}连续回复检测：无需移除reply动作，最近回复模式正常")
+
+        return removals
+
+
+
+    def get_available_actions_count(self) -> int:
+        """获取当前可用动作数量（排除默认的no_action）"""
+        current_actions = self.action_manager.get_using_actions_for_mode("normal")
+        # 排除no_action（如果存在）
+        filtered_actions = {k: v for k, v in current_actions.items() if k != "no_action"}
+        return len(filtered_actions)
+
+    def should_skip_planning(self) -> bool:
+        """判断是否应该跳过规划过程"""
+        available_count = self.get_available_actions_count()
+        if available_count == 0:
+            logger.debug(f"{self.log_prefix} 没有可用动作，跳过规划")
+            return True
+        return False