mirror of https://github.com/Mai-with-u/MaiBot.git
更智能的checker,拦截伪复读
parent
ad438c9461
commit
cb06662eb4
|
|
@ -2,6 +2,7 @@ from typing import Tuple, List, Dict, Any
|
|||
from src.common.logger import get_module_logger
|
||||
from src.config.config import global_config # 为了获取 BOT_QQ
|
||||
from .chat_observer import ChatObserver
|
||||
import re
|
||||
|
||||
logger = get_module_logger("reply_checker")
|
||||
|
||||
|
|
@ -10,32 +11,39 @@ class ReplyChecker:
|
|||
"""回复检查器 - 新版:仅检查机器人自身发言的精确重复"""
|
||||
|
||||
def __init__(self, stream_id: str, private_name: str):
    """Set up the checker for one private-chat stream.

    Args:
        stream_id: Identifier of the chat stream; forwarded to
            ``ChatObserver.get_instance``.
        private_name: Name of the private-chat peer; forwarded to
            ``ChatObserver.get_instance`` and used as a prefix in log lines.
    """
    # No LLM client is created here: the checker only compares text.
    # Retry limits are not tracked here either; per the original note they
    # are controlled by conversation.py.
    self.name = global_config.BOT_NICKNAME
    self.private_name = private_name
    self.chat_observer = ChatObserver.get_instance(stream_id, private_name)
    # The bot's own QQ id as a string, compared against each history entry's
    # sender id to recognise the bot's own messages.
    self.bot_qq_str = str(global_config.BOT_QQ)
|
||||
|
||||
def _normalize_text(self, text: str) -> str:
    """Normalize a message so that near-identical replies compare equal.

    Leading and trailing whitespace is removed, then any run of trailing
    punctuation/whitespace is dropped. Both the ASCII marks ``~ , . ! ? ;``
    and their full-width counterparts (``\uff5e \uff0c \u3002 \uff01 \uff1f
    \uff1b``) are treated as trailing punctuation, so a reply that differs
    from an earlier one only by its final punctuation normalizes to the
    same string. Punctuation inside the text is left untouched and case is
    preserved.

    Args:
        text: Raw message text; ``None`` or an empty string is accepted.

    Returns:
        The normalized text, or ``""`` when ``text`` is falsy.
    """
    if not text:
        return ""
    stripped = text.strip()
    # Full-width marks are written as \u escapes so the pattern survives
    # tools that fold full-width characters into their ASCII look-alikes:
    #   \uff5e = fullwidth tilde, \uff0c = fullwidth comma,
    #   \uff01 = fullwidth '!',   \uff1f = fullwidth '?',
    #   \uff1b = fullwidth ';',   \u3002 = ideographic full stop.
    trailing_punctuation = r"[~\s,.!?;\uff5e\uff0c\uff01\uff1f\uff1b\u3002]+$"
    return re.sub(trailing_punctuation, "", stripped)
|
||||
|
||||
async def check(
|
||||
self,
|
||||
reply: str,
|
||||
goal: str,
|
||||
goal: str, # 当前逻辑未使用
|
||||
chat_history: List[Dict[str, Any]],
|
||||
chat_history_text: str,
|
||||
current_time_str: str,
|
||||
retry_count: int = 0,
|
||||
chat_history_text: str, # 当前逻辑未使用
|
||||
current_time_str: str, # 当前逻辑未使用
|
||||
retry_count: int = 0, # 当前逻辑未使用
|
||||
) -> Tuple[bool, str, bool]:
|
||||
"""检查生成的回复是否与机器人之前的发言完全一致(长度大于4)
|
||||
|
||||
Args:
|
||||
reply: 待检查的机器人回复内容
|
||||
goal: 当前对话目标 (新逻辑中未使用)
|
||||
chat_history: 对话历史记录 (包含用户和机器人的消息字典列表)
|
||||
chat_history_text: 对话历史记录的文本格式 (新逻辑中未使用)
|
||||
current_time_str: 当前时间的字符串格式 (新逻辑中未使用)
|
||||
retry_count: 当前重试次数 (新逻辑中未使用)
|
||||
|
||||
Returns:
|
||||
Tuple[bool, str, bool]: (是否合适, 原因, 是否需要重新规划)
|
||||
对于重复消息: (False, "机器人尝试发送重复消息", False)
|
||||
|
|
@ -46,13 +54,16 @@ class ReplyChecker:
|
|||
f"[私聊][{self.private_name}] ReplyChecker: BOT_QQ 未配置,无法检查{global_config.BOT_NICKNAME}自身消息。"
|
||||
)
|
||||
return True, "BOT_QQ未配置,跳过重复检查。", False # 无法检查则默认通过
|
||||
|
||||
# 对当前待发送的回复进行规范化
|
||||
normalized_reply = self._normalize_text(reply)
|
||||
|
||||
if len(reply) <= 4:
|
||||
if len(normalized_reply) <= 4:
|
||||
return True, "消息长度小于等于4字符,跳过重复检查。", False
|
||||
|
||||
try:
|
||||
match_found = False # <--- 用于调试
|
||||
for i, msg_dict in enumerate(chat_history): # <--- 添加索引用于日志
|
||||
for i, msg_dict in enumerate(reversed(chat_history)):
|
||||
if not isinstance(msg_dict, dict):
|
||||
continue
|
||||
|
||||
|
|
@ -64,26 +75,31 @@ class ReplyChecker:
|
|||
|
||||
if sender_id == self.bot_qq_str:
|
||||
historical_message_text = msg_dict.get("processed_plain_text", "")
|
||||
# 日志
|
||||
logger.debug(
|
||||
f"[私聊][{self.private_name}] ReplyChecker: 历史记录 #{i} ({global_config.BOT_NICKNAME}): '{historical_message_text}' (长度 {len(historical_message_text)})"
|
||||
)
|
||||
if reply == historical_message_text:
|
||||
logger.warning(f"[私聊][{self.private_name}] ReplyChecker: !!! 精确匹配成功 !!!")
|
||||
logger.warning(
|
||||
f"[私聊][{self.private_name}] ReplyChecker 检测到{global_config.BOT_NICKNAME}自身重复消息: '{reply}'"
|
||||
)
|
||||
match_found = True # <--- 标记找到
|
||||
return (False, "机器人尝试发送重复消息", False)
|
||||
# 对历史消息也进行同样的规范化处理
|
||||
normalized_historical_text = self._normalize_text(historical_message_text)
|
||||
|
||||
if not match_found: # <--- 根据标记判断
|
||||
logger.debug(f"[私聊][{self.private_name}] ReplyChecker: 未找到重复。") # <--- 新增日志
|
||||
return (True, "消息内容未与机器人历史发言重复。", False)
|
||||
logger.debug(
|
||||
f"[私聊][{self.private_name}] ReplyChecker: 历史记录 (反向索引 {i}) ({global_config.BOT_NICKNAME}): "
|
||||
f"原始='{historical_message_text[:50]}...', 规范化后='{normalized_historical_text[:50]}...'"
|
||||
)
|
||||
if normalized_reply == normalized_historical_text and len(normalized_reply) > 0: # 确保规范化后不为空串才比较
|
||||
logger.warning(
|
||||
f"[私聊][{self.private_name}] ReplyChecker: !!! 成功拦截一次复读 !!!"
|
||||
)
|
||||
logger.warning(
|
||||
f"[私聊][{self.private_name}] ReplyChecker 检测到{global_config.BOT_NICKNAME}自身重复消息 (规范化后内容相同): '{normalized_reply[:50]}...'"
|
||||
)
|
||||
match_found = True
|
||||
# 返回: 不合适, 原因, 不需要重规划 (让上层逻辑决定是否重试生成)
|
||||
return (False, "机器人尝试发送与历史发言相似的消息 (内容规范化后相同)", False)
|
||||
|
||||
if not match_found:
|
||||
logger.debug(f"[私聊][{self.private_name}] ReplyChecker: 未找到重复内容 (规范化后比较)。")
|
||||
return (True, "消息内容未与机器人历史发言重复 (规范化后比较)。", False)
|
||||
|
||||
except Exception as e:
|
||||
import traceback
|
||||
|
||||
logger.error(f"[私聊][{self.private_name}] ReplyChecker 检查重复时出错: 类型={type(e)}, 值={e}")
|
||||
logger.error(f"[私聊][{self.private_name}]{traceback.format_exc()}")
|
||||
# 发生未知错误时,为安全起见,默认通过,并记录原因
|
||||
return (True, f"检查重复时发生内部错误: {str(e)}", False)
|
||||
return (True, f"检查重复时发生内部错误 (规范化检查): {str(e)}", False)
|
||||
Loading…
Reference in New Issue