Ruff fix

2025-11-13 13:24:55 +08:00
parent e78a070fbd
commit 7839acd25d
52 changed files with 1322 additions and 1408 deletions
--- a/src/express/express_utils.py
+++ b/src/express/express_utils.py
@@ -3,31 +3,30 @@ import difflib
 import random
 from datetime import datetime
 from typing import Optional, List, Dict
-from collections import defaultdict


 def filter_message_content(content: Optional[str]) -> str:
    """
    过滤消息内容，移除回复、@、图片等格式
-    
+
    Args:
        content: 原始消息内容
-        
+
    Returns:
        str: 过滤后的内容
    """
    if not content:
        return ""
-        
+
    # 移除以[回复开头、]结尾的部分，包括后面的"，说："部分
-    content = re.sub(r'\[回复.*?\]，说：\s*', '', content)
+    content = re.sub(r"\[回复.*?\]，说：\s*", "", content)
    # 移除@<...>格式的内容
-    content = re.sub(r'@<[^>]*>', '', content)
+    content = re.sub(r"@<[^>]*>", "", content)
    # 移除[picid:...]格式的图片ID
-    content = re.sub(r'\[picid:[^\]]*\]', '', content)
+    content = re.sub(r"\[picid:[^\]]*\]", "", content)
    # 移除[表情包：...]格式的内容
-    content = re.sub(r'\[表情包：[^\]]*\]', '', content)
-    
+    content = re.sub(r"\[表情包：[^\]]*\]", "", content)
+
    return content.strip()


@@ -35,11 +34,11 @@ def calculate_similarity(text1: str, text2: str) -> float:
    """
    计算两个文本的相似度，返回0-1之间的值
    使用SequenceMatcher计算相似度
-    
+
    Args:
        text1: 第一个文本
        text2: 第二个文本
-        
+
    Returns:
        float: 相似度值，范围0-1
    """
@@ -49,10 +48,10 @@ def calculate_similarity(text1: str, text2: str) -> float:
 def format_create_date(timestamp: float) -> str:
    """
    将时间戳格式化为可读的日期字符串
-    
+
    Args:
        timestamp: 时间戳
-        
+
    Returns:
        str: 格式化后的日期字符串
    """
@@ -65,11 +64,11 @@ def format_create_date(timestamp: float) -> str:
 def weighted_sample(population: List[Dict], k: int) -> List[Dict]:
    """
    随机抽样函数
-    
+
    Args:
        population: 总体数据列表
        k: 需要抽取的数量
-        
+
    Returns:
        List[Dict]: 抽取的数据列表
    """
--- a/src/express/expression_learner.py
+++ b/src/express/expression_learner.py
@@ -1,7 +1,6 @@
 import time
 import json
 import os
-from datetime import datetime
 from typing import List, Optional, Tuple
 import traceback
 from src.common.logger import get_logger
@@ -158,8 +157,6 @@ class ExpressionLearner:
            traceback.print_exc()
            return

-
-
    async def learn_and_store(self, num: int = 10) -> List[Tuple[str, str, str]]:
        """
        学习并存储表达方式
@@ -169,7 +166,7 @@ class ExpressionLearner:
        if learnt_expressions is None:
            logger.info("没有学习到表达风格")
            return []
-        
+
        # 展示学到的表达方式
        learnt_expressions_str = ""
        for (
@@ -186,7 +183,7 @@ class ExpressionLearner:
        # 存储到数据库 Expression 表并训练 style_learner
        has_new_expressions = False  # 记录是否有新的表达方式
        learner = style_learner_manager.get_learner(self.chat_id)  # 获取 learner 实例
-        
+
        for (
            situation,
            style,
@@ -195,9 +192,7 @@ class ExpressionLearner:
        ) in learnt_expressions:
            # 查找是否已存在相似表达方式
            query = Expression.select().where(
-                (Expression.chat_id == self.chat_id)
-                & (Expression.situation == situation)
-                & (Expression.style == style)
+                (Expression.chat_id == self.chat_id) & (Expression.situation == situation) & (Expression.style == style)
            )
            if query.exists():
                # 表达方式完全相同，只更新时间戳
@@ -216,39 +211,37 @@ class ExpressionLearner:
                    up_content=up_content,
                )
                has_new_expressions = True
-            
+
            # 训练 style_learner（up_content 和 style 必定存在）
            try:
                learner.add_style(style, situation)
-                
+
                # 学习映射关系
-                success = style_learner_manager.learn_mapping(
-                    self.chat_id, 
-                    up_content, 
-                    style
-                )
+                success = style_learner_manager.learn_mapping(self.chat_id, up_content, style)
                if success:
-                    logger.debug(f"StyleLearner学习成功: {self.chat_id} - {up_content} -> {style}" + (f" (situation: {situation})" if situation else ""))
+                    logger.debug(
+                        f"StyleLearner学习成功: {self.chat_id} - {up_content} -> {style}"
+                        + (f" (situation: {situation})" if situation else "")
+                    )
                else:
                    logger.warning(f"StyleLearner学习失败: {self.chat_id} - {up_content} -> {style}")
            except Exception as e:
                logger.error(f"StyleLearner学习异常: {self.chat_id} - {e}")
-            
-        
+
        # 保存当前聊天室的 style_learner 模型
        if has_new_expressions:
            try:
                logger.info(f"开始保存聊天室 {self.chat_id} 的 StyleLearner 模型...")
                save_success = learner.save(style_learner_manager.model_save_path)
-                
+
                if save_success:
                    logger.info(f"StyleLearner 模型保存成功，聊天室: {self.chat_id}")
                else:
                    logger.warning(f"StyleLearner 模型保存失败，聊天室: {self.chat_id}")
-                    
+
            except Exception as e:
                logger.error(f"StyleLearner 模型保存异常: {e}")
-        
+
        return learnt_expressions

    async def match_expression_context(
@@ -334,7 +327,7 @@ class ExpressionLearner:

        matched_expressions = []
        used_pair_indices = set()  # 用于跟踪已经使用的expression_pair索引
-        
+
        logger.debug(f"match_responses 类型: {type(match_responses)}, 长度: {len(match_responses)}")
        logger.debug(f"match_responses 内容: {match_responses}")

@@ -344,12 +337,12 @@ class ExpressionLearner:
                if not isinstance(match_response, dict):
                    logger.error(f"match_response 不是字典类型: {type(match_response)}, 内容: {match_response}")
                    continue
-                
+
                # 获取表达方式序号
                if "expression_pair" not in match_response:
                    logger.error(f"match_response 缺少 'expression_pair' 字段: {match_response}")
                    continue
-                    
+
                pair_index = int(match_response["expression_pair"]) - 1  # 转换为0-based索引

                # 检查索引是否有效且未被使用过
@@ -367,9 +360,7 @@ class ExpressionLearner:

        return matched_expressions

-    async def learn_expression(
-        self, num: int = 10
-    ) -> Optional[List[Tuple[str, str, str, str]]]:
+    async def learn_expression(self, num: int = 10) -> Optional[List[Tuple[str, str, str, str]]]:
        """从指定聊天流学习表达方式

        Args:
@@ -409,7 +400,6 @@ class ExpressionLearner:
        expressions: List[Tuple[str, str]] = self.parse_expression_response(response)
        # logger.debug(f"学习{type_str}的response: {response}")

-        
        # 对表达方式溯源
        matched_expressions: List[Tuple[str, str, str]] = await self.match_expression_context(
            expressions, random_msg_match_str
@@ -426,17 +416,17 @@ class ExpressionLearner:
                if similarity >= 0.85:  # 85%相似度阈值
                    pos = i
                    break
-            
+
            if pos is None or pos == 0:
                # 没有匹配到目标句或没有上一句，跳过该表达
                continue
-            
+
            # 检查目标句是否为空
            target_content = bare_lines[pos][1]
            if not target_content:
                # 目标句为空，跳过该表达
                continue
-            
+
            prev_original_idx = bare_lines[pos - 1][0]
            up_content = filter_message_content(random_msg[prev_original_idx].processed_plain_text or "")
            if not up_content:
@@ -449,7 +439,6 @@ class ExpressionLearner:

        return filtered_with_up

-
    def parse_expression_response(self, response: str) -> List[Tuple[str, str, str]]:
        """
        解析LLM返回的表达风格总结，每一行提取"当"和"使用"之间的内容，存储为(situation, style)元组
@@ -483,21 +472,21 @@ class ExpressionLearner:
    def _build_bare_lines(self, messages: List) -> List[Tuple[int, str]]:
        """
        为每条消息构建精简文本列表，保留到原消息索引的映射
-        
+
        Args:
            messages: 消息列表
-            
+
        Returns:
            List[Tuple[int, str]]: (original_index, bare_content) 元组列表
        """
        bare_lines: List[Tuple[int, str]] = []
-        
+
        for idx, msg in enumerate(messages):
            content = msg.processed_plain_text or ""
            content = filter_message_content(content)
            # 即使content为空也要记录，防止错位
            bare_lines.append((idx, content))
-                
+
        return bare_lines


--- a/src/express/expression_selector.py
+++ b/src/express/expression_selector.py
@@ -1,8 +1,6 @@
 import json
 import time
-import random
 import hashlib
-import re

 from typing import List, Dict, Optional, Any, Tuple
 from json_repair import repair_json
@@ -115,30 +113,31 @@ class ExpressionSelector:
                return group_chat_ids
        return [chat_id]

-    def get_model_predicted_expressions(self, chat_id: str, target_message: str, total_num: int = 10) -> List[Dict[str, Any]]:
+    def get_model_predicted_expressions(
+        self, chat_id: str, target_message: str, total_num: int = 10
+    ) -> List[Dict[str, Any]]:
        """
        使用 style_learner 模型预测最合适的表达方式
-        
+
        Args:
            chat_id: 聊天室ID
            target_message: 目标消息内容
            total_num: 需要预测的数量
-            
+
        Returns:
            List[Dict[str, Any]]: 预测的表达方式列表
        """
        try:
            # 过滤目标消息内容，移除回复、表情包等特殊格式
            filtered_target_message = filter_message_content(target_message)
-            
+
            logger.info(f"为{chat_id} 预测表达方式，过滤后的目标消息内容: {filtered_target_message}")
-            
+
            # 支持多chat_id合并预测
            related_chat_ids = self.get_related_chat_ids(chat_id)
-            

            predicted_expressions = []
-            
+
            # 为每个相关的chat_id进行预测
            for related_chat_id in related_chat_ids:
                try:
@@ -146,59 +145,65 @@ class ExpressionSelector:
                    best_style, scores = style_learner_manager.predict_style(
                        related_chat_id, filtered_target_message, top_k=total_num
                    )
-                    
+
                    if best_style and scores:
                        # 获取预测风格的完整信息
                        learner = style_learner_manager.get_learner(related_chat_id)
                        style_id, situation = learner.get_style_info(best_style)
-                        
+
                        if style_id and situation:
                            # 从数据库查找对应的表达记录
                            expr_query = Expression.select().where(
-                                (Expression.chat_id == related_chat_id) &
-                                (Expression.situation == situation) &
-                                (Expression.style == best_style)
+                                (Expression.chat_id == related_chat_id)
+                                & (Expression.situation == situation)
+                                & (Expression.style == best_style)
                            )
-                            
+
                            if expr_query.exists():
                                expr = expr_query.get()
-                                predicted_expressions.append({
-                                    "id": expr.id,
-                                    "situation": expr.situation,
-                                    "style": expr.style,
-                                    "last_active_time": expr.last_active_time,
-                                    "source_id": expr.chat_id,
-                                    "create_date": expr.create_date if expr.create_date is not None else expr.last_active_time,
-                                    "prediction_score": scores.get(best_style, 0.0),
-                                    "prediction_input": filtered_target_message
-                                })
+                                predicted_expressions.append(
+                                    {
+                                        "id": expr.id,
+                                        "situation": expr.situation,
+                                        "style": expr.style,
+                                        "last_active_time": expr.last_active_time,
+                                        "source_id": expr.chat_id,
+                                        "create_date": expr.create_date
+                                        if expr.create_date is not None
+                                        else expr.last_active_time,
+                                        "prediction_score": scores.get(best_style, 0.0),
+                                        "prediction_input": filtered_target_message,
+                                    }
+                                )
                            else:
-                                logger.warning(f"为聊天室 {related_chat_id} 预测表达方式失败: {best_style} 没有找到对应的表达方式")
-                                
+                                logger.warning(
+                                    f"为聊天室 {related_chat_id} 预测表达方式失败: {best_style} 没有找到对应的表达方式"
+                                )
+
                except Exception as e:
                    logger.warning(f"为聊天室 {related_chat_id} 预测表达方式失败: {e}")
                    continue
-            
+
            # 按预测分数排序，取前 total_num 个
            predicted_expressions.sort(key=lambda x: x.get("prediction_score", 0.0), reverse=True)
            selected_expressions = predicted_expressions[:total_num]
-            
+
            logger.info(f"为{chat_id} 预测到 {len(selected_expressions)} 个表达方式")
            return selected_expressions
-            
+
        except Exception as e:
            logger.error(f"模型预测表达方式失败: {e}")
            # 如果预测失败，回退到随机选择
            return self._random_expressions(chat_id, total_num)
-    
+
    def _random_expressions(self, chat_id: str, total_num: int) -> List[Dict[str, Any]]:
        """
        随机选择表达方式
-        
+
        Args:
            chat_id: 聊天室ID
            total_num: 需要选择的数量
-            
+
        Returns:
            List[Dict[str, Any]]: 随机选择的表达方式列表
        """
@@ -207,9 +212,7 @@ class ExpressionSelector:
            related_chat_ids = self.get_related_chat_ids(chat_id)

            # 优化：一次性查询所有相关chat_id的表达方式
-            style_query = Expression.select().where(
-                (Expression.chat_id.in_(related_chat_ids))
-            )
+            style_query = Expression.select().where((Expression.chat_id.in_(related_chat_ids)))

            style_exprs = [
                {
@@ -228,15 +231,14 @@ class ExpressionSelector:
                selected_style = weighted_sample(style_exprs, total_num)
            else:
                selected_style = []
-            
+
            logger.info(f"随机选择，为聊天室 {chat_id} 选择了 {len(selected_style)} 个表达方式")
            return selected_style
-            
+
        except Exception as e:
            logger.error(f"随机选择表达方式失败: {e}")
            return []

-
    async def select_suitable_expressions(
        self,
        chat_id: str,
@@ -246,13 +248,13 @@ class ExpressionSelector:
    ) -> Tuple[List[Dict[str, Any]], List[int]]:
        """
        根据配置模式选择适合的表达方式
-        
+
        Args:
            chat_id: 聊天流ID
            chat_info: 聊天内容信息
            max_num: 最大选择数量
            target_message: 目标消息内容
-            
+
        Returns:
            Tuple[List[Dict[str, Any]], List[int]]: 选中的表达方式列表和ID列表
        """
@@ -263,7 +265,7 @@ class ExpressionSelector:

        # 获取配置模式
        expression_mode = global_config.expression.mode
-        
+
        if expression_mode == "exp_model":
            # exp_model模式：直接使用模型预测，不经过LLM
            logger.debug(f"使用exp_model模式为聊天流 {chat_id} 选择表达方式")
@@ -284,12 +286,12 @@ class ExpressionSelector:
    ) -> Tuple[List[Dict[str, Any]], List[int]]:
        """
        exp_model模式：直接使用模型预测，不经过LLM
-        
+
        Args:
            chat_id: 聊天流ID
            target_message: 目标消息内容
            max_num: 最大选择数量
-            
+
        Returns:
            Tuple[List[Dict[str, Any]], List[int]]: 选中的表达方式列表和ID列表
        """
@@ -297,14 +299,14 @@ class ExpressionSelector:
            # 使用模型预测最合适的表达方式
            selected_expressions = self.get_model_predicted_expressions(chat_id, target_message, max_num)
            selected_ids = [expr["id"] for expr in selected_expressions]
-            
+
            # 更新last_active_time
            if selected_expressions:
                self.update_expressions_last_active_time(selected_expressions)
-            
+
            logger.info(f"exp_model模式为聊天流 {chat_id} 选择了 {len(selected_expressions)} 个表达方式")
            return selected_expressions, selected_ids
-            
+
        except Exception as e:
            logger.error(f"exp_model模式选择表达方式失败: {e}")
            return [], []
@@ -318,13 +320,13 @@ class ExpressionSelector:
    ) -> Tuple[List[Dict[str, Any]], List[int]]:
        """
        classic模式：随机选择+LLM选择
-        
+
        Args:
            chat_id: 聊天流ID
            chat_info: 聊天内容信息
            max_num: 最大选择数量
            target_message: 目标消息内容
-            
+
        Returns:
            Tuple[List[Dict[str, Any]], List[int]]: 选中的表达方式列表和ID列表
        """
@@ -425,17 +427,13 @@ class ExpressionSelector:
                updates_by_key[key] = expr
        for chat_id, situation, style in updates_by_key:
            query = Expression.select().where(
-                (Expression.chat_id == chat_id)
-                & (Expression.situation == situation)
-                & (Expression.style == style)
+                (Expression.chat_id == chat_id) & (Expression.situation == situation) & (Expression.style == style)
            )
            if query.exists():
                expr_obj = query.get()
                expr_obj.last_active_time = time.time()
                expr_obj.save()
-                logger.debug(
-                    "表达方式激活: 更新last_active_time in db"
-                )
+                logger.debug("表达方式激活: 更新last_active_time in db")


 init_prompt()
--- a/src/express/expressor_model/model.py
+++ b/src/express/expressor_model/model.py
@@ -6,18 +6,21 @@ import os
 from .tokenizer import Tokenizer
 from .online_nb import OnlineNaiveBayes

+
 class ExpressorModel:
    """
    直接使用朴素贝叶斯精排（可在线学习）
    支持存储situation字段，不参与计算，仅与style对应
    """

-    def __init__(self,
-                 alpha: float = 0.5,
-                 beta: float = 0.5,
-                 gamma: float = 1.0,
-                 vocab_size: int = 200000,
-                 use_jieba: bool = True):
+    def __init__(
+        self,
+        alpha: float = 0.5,
+        beta: float = 0.5,
+        gamma: float = 1.0,
+        vocab_size: int = 200000,
+        use_jieba: bool = True,
+    ):
        self.tokenizer = Tokenizer(stopwords=set(), use_jieba=use_jieba)
        self.nb = OnlineNaiveBayes(alpha=alpha, beta=beta, gamma=gamma, vocab_size=vocab_size)
        self._candidates: Dict[str, str] = {}  # cid -> text (style)
@@ -28,7 +31,7 @@ class ExpressorModel:
        self._candidates[cid] = text
        if situation is not None:
            self._situations[cid] = situation
-        
+
        # 确保在nb模型中初始化该候选的计数
        if cid not in self.nb.cls_counts:
            self.nb.cls_counts[cid] = 0.0
@@ -46,7 +49,7 @@ class ExpressorModel:
        toks = self.tokenizer.tokenize(text)
        if not toks:
            return None, {}
-        
+
        if not self._candidates:
            return None, {}

@@ -58,7 +61,7 @@ class ExpressorModel:
        # 取最高分
        if not scores:
            return None, {}
-        
+
        # 根据k参数限制返回的候选数量
        if k is not None and k > 0:
            # 按分数降序排序，取前k个
@@ -81,40 +84,42 @@ class ExpressorModel:

    def decay(self, factor: float):
        self.nb.decay(factor=factor)
-    
+
    def get_situation(self, cid: str) -> Optional[str]:
        """获取候选对应的situation"""
        return self._situations.get(cid)
-    
+
    def get_style(self, cid: str) -> Optional[str]:
        """获取候选对应的style"""
        return self._candidates.get(cid)
-    
+
    def get_candidate_info(self, cid: str) -> Tuple[Optional[str], Optional[str]]:
        """获取候选的style和situation信息"""
        return self._candidates.get(cid), self._situations.get(cid)
-    
+
    def get_all_candidates(self) -> Dict[str, Tuple[str, Optional[str]]]:
        """获取所有候选的style和situation信息"""
-        return {cid: (style, self._situations.get(cid)) 
-                for cid, style in self._candidates.items()}
+        return {cid: (style, self._situations.get(cid)) for cid, style in self._candidates.items()}

    def save(self, path: str):
        """保存模型"""
        os.makedirs(os.path.dirname(path), exist_ok=True)
        with open(path, "wb") as f:
-            pickle.dump({
-                "candidates": self._candidates,
-                "situations": self._situations,
-                "nb": {
-                    "cls_counts": dict(self.nb.cls_counts),
-                    "token_counts": {cid: dict(tc) for cid, tc in self.nb.token_counts.items()},
-                    "alpha": self.nb.alpha,
-                    "beta": self.nb.beta,
-                    "gamma": self.nb.gamma,
-                    "V": self.nb.V,
-                }
-            }, f)
+            pickle.dump(
+                {
+                    "candidates": self._candidates,
+                    "situations": self._situations,
+                    "nb": {
+                        "cls_counts": dict(self.nb.cls_counts),
+                        "token_counts": {cid: dict(tc) for cid, tc in self.nb.token_counts.items()},
+                        "alpha": self.nb.alpha,
+                        "beta": self.nb.beta,
+                        "gamma": self.nb.gamma,
+                        "V": self.nb.V,
+                    },
+                },
+                f,
+            )

    def load(self, path: str):
        """加载模型"""
@@ -133,9 +138,11 @@ class ExpressorModel:
        self.nb.V = obj["nb"]["V"]
        self.nb._logZ.clear()

+
 def defaultdict_dict(d: Dict[str, Dict[str, float]]):
    from collections import defaultdict
+
    outer = defaultdict(lambda: defaultdict(float))
    for k, inner in d.items():
        outer[k].update(inner)
-    return outer
+    return outer
--- a/src/express/expressor_model/online_nb.py
+++ b/src/express/expressor_model/online_nb.py
@@ -2,6 +2,7 @@ import math
 from typing import Dict, List
 from collections import defaultdict, Counter

+
 class OnlineNaiveBayes:
    def __init__(self, alpha: float = 0.5, beta: float = 0.5, gamma: float = 1.0, vocab_size: int = 200000):
        self.alpha = alpha
@@ -9,9 +10,9 @@ class OnlineNaiveBayes:
        self.gamma = gamma
        self.V = vocab_size

-        self.cls_counts: Dict[str, float] = defaultdict(float)                 # cid -> total token count
+        self.cls_counts: Dict[str, float] = defaultdict(float)  # cid -> total token count
        self.token_counts: Dict[str, Dict[str, float]] = defaultdict(lambda: defaultdict(float))  # cid -> term -> count
-        self._logZ: Dict[str, float] = {}                                      # cache log(∑counts + Vα)
+        self._logZ: Dict[str, float] = {}  # cache log(∑counts + Vα)

    def _invalidate(self, cid: str):
        if cid in self._logZ:
@@ -57,4 +58,4 @@ class OnlineNaiveBayes:
            self.cls_counts[cid] *= g
            for term in list(self.token_counts[cid].keys()):
                self.token_counts[cid][term] *= g
-            self._invalidate(cid)
+            self._invalidate(cid)
--- a/src/express/expressor_model/tokenizer.py
+++ b/src/express/expressor_model/tokenizer.py
@@ -3,17 +3,20 @@ from typing import List, Optional, Set

 try:
    import jieba
+
    _HAS_JIEBA = True
 except Exception:
    _HAS_JIEBA = False

 _WORD_RE = re.compile(r"[A-Za-z0-9_]+")
 # 匹配纯符号的正则表达式
-_SYMBOL_RE = re.compile(r'^[^\w\u4e00-\u9fff]+$')
+_SYMBOL_RE = re.compile(r"^[^\w\u4e00-\u9fff]+$")
+

 def simple_en_tokenize(text: str) -> List[str]:
    return _WORD_RE.findall(text.lower())

+
 class Tokenizer:
    def __init__(self, stopwords: Optional[Set[str]] = None, use_jieba: bool = True):
        self.stopwords = stopwords or set()
@@ -28,4 +31,4 @@ class Tokenizer:
        else:
            toks = simple_en_tokenize(text)
        # 过滤掉纯符号和停用词
-        return [t for t in toks if t not in self.stopwords and not _SYMBOL_RE.match(t)]
+        return [t for t in toks if t not in self.stopwords and not _SYMBOL_RE.match(t)]
--- a/src/express/style_learner.py
+++ b/src/express/style_learner.py
@@ -22,42 +22,42 @@ class StyleLearner:
    学习从up_content到style的映射关系
    支持动态管理风格集合（无数量上限）
    """
-    
+
    def __init__(self, chat_id: str, model_config: Optional[Dict] = None):
        self.chat_id = chat_id
        self.model_config = model_config or {
            "alpha": 0.5,
-            "beta": 0.5, 
+            "beta": 0.5,
            "gamma": 0.99,  # 衰减因子，支持遗忘
            "vocab_size": 200000,
-            "use_jieba": True
+            "use_jieba": True,
        }
-        
+
        # 初始化表达模型
        self.expressor = ExpressorModel(**self.model_config)
-        
+
        # 动态风格管理
        self.style_to_id: Dict[str, str] = {}  # style文本 -> style_id
        self.id_to_style: Dict[str, str] = {}  # style_id -> style文本
        self.id_to_situation: Dict[str, str] = {}  # style_id -> situation文本
        self.next_style_id = 0  # 下一个可用的style_id
-        
+
        # 学习统计
        self.learning_stats = {
            "total_samples": 0,
            "style_counts": defaultdict(int),
            "last_update": None,
-            "style_usage_frequency": defaultdict(int)  # 风格使用频率
+            "style_usage_frequency": defaultdict(int),  # 风格使用频率
        }
-    
+
    def add_style(self, style: str, situation: str = None) -> bool:
        """
        动态添加一个新的风格
-        
+
        Args:
            style: 风格文本
            situation: 对应的situation文本（可选）
-            
+
        Returns:
            bool: 添加是否成功
        """
@@ -66,35 +66,37 @@ class StyleLearner:
            if style in self.style_to_id:
                logger.debug(f"[{self.chat_id}] 风格 '{style}' 已存在")
                return True
-            
+
            # 生成新的style_id
            style_id = f"style_{self.next_style_id}"
            self.next_style_id += 1
-            
+
            # 添加到映射
            self.style_to_id[style] = style_id
            self.id_to_style[style_id] = style
            if situation:
                self.id_to_situation[style_id] = situation
-            
+
            # 添加到expressor模型
            self.expressor.add_candidate(style_id, style, situation)
-            
-            logger.info(f"[{self.chat_id}] 已添加风格: '{style}' (ID: {style_id})" + 
-                       (f", situation: '{situation}'" if situation else ""))
+
+            logger.info(
+                f"[{self.chat_id}] 已添加风格: '{style}' (ID: {style_id})"
+                + (f", situation: '{situation}'" if situation else "")
+            )
            return True
-            
+
        except Exception as e:
            logger.error(f"[{self.chat_id}] 添加风格失败: {e}")
            return False
-    
+
    def remove_style(self, style: str) -> bool:
        """
        删除一个风格
-        
+
        Args:
            style: 要删除的风格文本
-            
+
        Returns:
            bool: 删除是否成功
        """
@@ -102,33 +104,33 @@ class StyleLearner:
            if style not in self.style_to_id:
                logger.warning(f"[{self.chat_id}] 风格 '{style}' 不存在")
                return False
-            
+
            style_id = self.style_to_id[style]
-            
+
            # 从映射中删除
            del self.style_to_id[style]
            del self.id_to_style[style_id]
            if style_id in self.id_to_situation:
                del self.id_to_situation[style_id]
-            
+
            # 从expressor模型中删除（通过重新构建）
            self._rebuild_expressor()
-            
+
            logger.info(f"[{self.chat_id}] 已删除风格: '{style}' (ID: {style_id})")
            return True
-            
+
        except Exception as e:
            logger.error(f"[{self.chat_id}] 删除风格失败: {e}")
            return False
-    
+
    def update_style(self, old_style: str, new_style: str) -> bool:
        """
        更新一个风格
-        
+
        Args:
            old_style: 原风格文本
            new_style: 新风格文本
-            
+
        Returns:
            bool: 更新是否成功
        """
@@ -136,37 +138,37 @@ class StyleLearner:
            if old_style not in self.style_to_id:
                logger.warning(f"[{self.chat_id}] 原风格 '{old_style}' 不存在")
                return False
-            
+
            if new_style in self.style_to_id and new_style != old_style:
                logger.warning(f"[{self.chat_id}] 新风格 '{new_style}' 已存在")
                return False
-            
+
            style_id = self.style_to_id[old_style]
-            
+
            # 更新映射
            del self.style_to_id[old_style]
            self.style_to_id[new_style] = style_id
            self.id_to_style[style_id] = new_style
-            
+
            # 更新expressor模型（保留原有的situation）
            situation = self.id_to_situation.get(style_id)
            self.expressor.add_candidate(style_id, new_style, situation)
-            
+
            logger.info(f"[{self.chat_id}] 已更新风格: '{old_style}' -> '{new_style}'")
            return True
-            
+
        except Exception as e:
            logger.error(f"[{self.chat_id}] 更新风格失败: {e}")
            return False
-    
+
    def add_styles_batch(self, styles: List[str], situations: List[str] = None) -> int:
        """
        批量添加风格
-        
+
        Args:
            styles: 风格文本列表
            situations: 对应的situation文本列表（可选）
-            
+
        Returns:
            int: 成功添加的数量
        """
@@ -175,55 +177,55 @@ class StyleLearner:
            situation = situations[i] if situations and i < len(situations) else None
            if self.add_style(style, situation):
                success_count += 1
-        
+
        logger.info(f"[{self.chat_id}] 批量添加风格: {success_count}/{len(styles)} 成功")
        return success_count
-    
+
    def get_all_styles(self) -> List[str]:
        """获取所有已注册的风格"""
        return list(self.style_to_id.keys())
-    
+
    def get_style_count(self) -> int:
        """获取当前风格数量"""
        return len(self.style_to_id)
-    
+
    def get_situation(self, style: str) -> Optional[str]:
        """
        获取风格对应的situation
-        
+
        Args:
            style: 风格文本
-            
+
        Returns:
            Optional[str]: 对应的situation，如果不存在则返回None
        """
        if style not in self.style_to_id:
            return None
-        
+
        style_id = self.style_to_id[style]
        return self.id_to_situation.get(style_id)
-    
+
    def get_style_info(self, style: str) -> Tuple[Optional[str], Optional[str]]:
        """
        获取风格的完整信息
-        
+
        Args:
            style: 风格文本
-            
+
        Returns:
            Tuple[Optional[str], Optional[str]]: (style_id, situation)
        """
        if style not in self.style_to_id:
            return None, None
-        
+
        style_id = self.style_to_id[style]
        situation = self.id_to_situation.get(style_id)
        return style_id, situation
-    
+
    def get_all_style_info(self) -> Dict[str, Tuple[str, Optional[str]]]:
        """
        获取所有风格的完整信息
-        
+
        Returns:
            Dict[str, Tuple[str, Optional[str]]]: {style: (style_id, situation)}
        """
@@ -232,32 +234,32 @@ class StyleLearner:
            situation = self.id_to_situation.get(style_id)
            result[style] = (style_id, situation)
        return result
-    
+
    def _rebuild_expressor(self):
        """重新构建expressor模型（删除风格后使用）"""
        try:
            # 重新创建expressor
            self.expressor = ExpressorModel(**self.model_config)
-            
+
            # 重新添加所有风格和situation
            for style_id, style_text in self.id_to_style.items():
                situation = self.id_to_situation.get(style_id)
                self.expressor.add_candidate(style_id, style_text, situation)
-            
+
            logger.debug(f"[{self.chat_id}] 已重新构建expressor模型")
-            
+
        except Exception as e:
            logger.error(f"[{self.chat_id}] 重新构建expressor失败: {e}")
-    
+
    def learn_mapping(self, up_content: str, style: str) -> bool:
        """
        学习一个up_content到style的映射
        如果style不存在，会自动添加
-        
+
        Args:
            up_content: 输入内容
            style: 对应的style文本
-            
+
        Returns:
            bool: 学习是否成功
        """
@@ -267,71 +269,71 @@ class StyleLearner:
                if not self.add_style(style):
                    logger.warning(f"[{self.chat_id}] 无法添加风格 '{style}'，学习失败")
                    return False
-            
+
            # 获取style_id
            style_id = self.style_to_id[style]
-            
+
            # 使用正反馈学习
            self.expressor.update_positive(up_content, style_id)
-            
+
            # 更新统计
            self.learning_stats["total_samples"] += 1
            self.learning_stats["style_counts"][style_id] += 1
            self.learning_stats["style_usage_frequency"][style] += 1
            self.learning_stats["last_update"] = asyncio.get_event_loop().time()
-            
+
            logger.debug(f"[{self.chat_id}] 学习映射: '{up_content}' -> '{style}'")
            return True
-            
+
        except Exception as e:
            logger.error(f"[{self.chat_id}] 学习映射失败: {e}")
            traceback.print_exc()
            return False
-    
+
    def predict_style(self, up_content: str, top_k: int = 5) -> Tuple[Optional[str], Dict[str, float]]:
        """
        根据up_content预测最合适的style
-        
+
        Args:
            up_content: 输入内容
            top_k: 返回前k个候选
-            
+
        Returns:
            Tuple[最佳style文本, 所有候选的分数]
        """
        try:
            best_style_id, scores = self.expressor.predict(up_content, k=top_k)
-            
+
            if best_style_id is None:
                return None, {}
-            
+
            # 将style_id转换为style文本
            best_style = self.id_to_style.get(best_style_id)
-            
+
            # 转换所有分数
            style_scores = {}
            for sid, score in scores.items():
                style_text = self.id_to_style.get(sid)
                if style_text:
                    style_scores[style_text] = score
-            
+
            return best_style, style_scores
-            
+
        except Exception as e:
            logger.error(f"[{self.chat_id}] 预测style失败: {e}")
            traceback.print_exc()
            return None, {}
-    
+
    def decay_learning(self, factor: Optional[float] = None) -> None:
        """
        对学习到的知识进行衰减（遗忘）
-        
+
        Args:
            factor: 衰减因子，None则使用配置中的gamma
        """
        self.expressor.decay(factor)
        logger.debug(f"[{self.chat_id}] 执行知识衰减")
-    
+
    def get_stats(self) -> Dict:
        """获取学习统计信息"""
        return {
@@ -341,20 +343,20 @@ class StyleLearner:
            "style_counts": dict(self.learning_stats["style_counts"]),
            "style_usage_frequency": dict(self.learning_stats["style_usage_frequency"]),
            "last_update": self.learning_stats["last_update"],
-            "all_styles": list(self.style_to_id.keys())
+            "all_styles": list(self.style_to_id.keys()),
        }
-    
+
    def save(self, base_path: str) -> bool:
        """
        保存模型到文件
-        
+
        Args:
            base_path: 基础路径，实际文件为 {base_path}/{chat_id}_style_model.pkl
        """
        try:
            os.makedirs(base_path, exist_ok=True)
            file_path = os.path.join(base_path, f"{self.chat_id}_style_model.pkl")
-            
+
            # 保存模型和统计信息
            save_data = {
                "model_config": self.model_config,
@@ -362,43 +364,43 @@ class StyleLearner:
                "id_to_style": self.id_to_style,
                "id_to_situation": self.id_to_situation,
                "next_style_id": self.next_style_id,
-                "learning_stats": self.learning_stats
+                "learning_stats": self.learning_stats,
            }
-            
+
            # 先保存expressor模型
            expressor_path = os.path.join(base_path, f"{self.chat_id}_expressor.pkl")
            self.expressor.save(expressor_path)
-            
+
            # 保存其他数据
            with open(file_path, "wb") as f:
                pickle.dump(save_data, f)
-            
+
            logger.info(f"[{self.chat_id}] 模型已保存到 {file_path}")
            return True
-            
+
        except Exception as e:
            logger.error(f"[{self.chat_id}] 保存模型失败: {e}")
            return False
-    
+
    def load(self, base_path: str) -> bool:
        """
        从文件加载模型
-        
+
        Args:
            base_path: 基础路径
        """
        try:
            file_path = os.path.join(base_path, f"{self.chat_id}_style_model.pkl")
            expressor_path = os.path.join(base_path, f"{self.chat_id}_expressor.pkl")
-            
+
            if not os.path.exists(file_path) or not os.path.exists(expressor_path):
                logger.warning(f"[{self.chat_id}] 模型文件不存在，将使用默认配置")
                return False
-            
+
            # 加载其他数据
            with open(file_path, "rb") as f:
                save_data = pickle.load(f)
-            
+
            # 恢复配置和状态
            self.model_config = save_data["model_config"]
            self.style_to_id = save_data["style_to_id"]
@@ -406,14 +408,14 @@ class StyleLearner:
            self.id_to_situation = save_data.get("id_to_situation", {})  # 兼容旧版本
            self.next_style_id = save_data["next_style_id"]
            self.learning_stats = save_data["learning_stats"]
-            
+
            # 重新创建expressor并加载
            self.expressor = ExpressorModel(**self.model_config)
            self.expressor.load(expressor_path)
-            
+
            logger.info(f"[{self.chat_id}] 模型已从 {file_path} 加载")
            return True
-            
+
        except Exception as e:
            logger.error(f"[{self.chat_id}] 加载模型失败: {e}")
            return False
@@ -425,156 +427,156 @@ class StyleLearnerManager:
    为每个chat_id维护独立的StyleLearner实例
    每个chat_id可以动态管理自己的风格集合（无数量上限）
    """
-    
+
    def __init__(self, model_save_path: str = "data/style_models"):
        self.model_save_path = model_save_path
        self.learners: Dict[str, StyleLearner] = {}
-        
+
        # 自动保存配置
        self.auto_save_interval = 300  # 5分钟
        self._auto_save_task: Optional[asyncio.Task] = None
-        
+
        logger.info("StyleLearnerManager 已初始化")
-    
+
    def get_learner(self, chat_id: str, model_config: Optional[Dict] = None) -> StyleLearner:
        """
        获取或创建指定chat_id的学习器
-        
+
        Args:
            chat_id: 聊天室ID
            model_config: 模型配置，None则使用默认配置
-            
+
        Returns:
            StyleLearner实例
        """
        if chat_id not in self.learners:
            # 创建新的学习器
            learner = StyleLearner(chat_id, model_config)
-            
+
            # 尝试加载已保存的模型
            learner.load(self.model_save_path)
-            
+
            self.learners[chat_id] = learner
            logger.info(f"为 chat_id={chat_id} 创建新的StyleLearner")
-        
+
        return self.learners[chat_id]
-    
+
    def add_style(self, chat_id: str, style: str) -> bool:
        """
        为指定chat_id添加风格
-        
+
        Args:
            chat_id: 聊天室ID
            style: 风格文本
-            
+
        Returns:
            bool: 添加是否成功
        """
        learner = self.get_learner(chat_id)
        return learner.add_style(style)
-    
+
    def remove_style(self, chat_id: str, style: str) -> bool:
        """
        为指定chat_id删除风格
-        
+
        Args:
            chat_id: 聊天室ID
            style: 风格文本
-            
+
        Returns:
            bool: 删除是否成功
        """
        learner = self.get_learner(chat_id)
        return learner.remove_style(style)
-    
+
    def update_style(self, chat_id: str, old_style: str, new_style: str) -> bool:
        """
        为指定chat_id更新风格
-        
+
        Args:
            chat_id: 聊天室ID
            old_style: 原风格文本
            new_style: 新风格文本
-            
+
        Returns:
            bool: 更新是否成功
        """
        learner = self.get_learner(chat_id)
        return learner.update_style(old_style, new_style)
-    
+
    def get_chat_styles(self, chat_id: str) -> List[str]:
        """
        获取指定chat_id的所有风格
-        
+
        Args:
            chat_id: 聊天室ID
-            
+
        Returns:
            List[str]: 风格列表
        """
        learner = self.get_learner(chat_id)
        return learner.get_all_styles()
-    
+
    def learn_mapping(self, chat_id: str, up_content: str, style: str) -> bool:
        """
        学习一个映射关系
-        
+
        Args:
            chat_id: 聊天室ID
            up_content: 输入内容
            style: 对应的style
-            
+
        Returns:
            bool: 学习是否成功
        """
        learner = self.get_learner(chat_id)
        return learner.learn_mapping(up_content, style)
-    
+
    def predict_style(self, chat_id: str, up_content: str, top_k: int = 5) -> Tuple[Optional[str], Dict[str, float]]:
        """
        预测最合适的style
-        
+
        Args:
            chat_id: 聊天室ID
            up_content: 输入内容
            top_k: 返回前k个候选
-            
+
        Returns:
            Tuple[最佳style, 所有候选分数]
        """
        learner = self.get_learner(chat_id)
        return learner.predict_style(up_content, top_k)
-    
+
    def decay_all_learners(self, factor: Optional[float] = None) -> None:
        """
        对所有学习器执行衰减
-        
+
        Args:
            factor: 衰减因子
        """
        for learner in self.learners.values():
            learner.decay_learning(factor)
        logger.info("已对所有学习器执行衰减")
-    
+
    def get_all_stats(self) -> Dict[str, Dict]:
        """获取所有学习器的统计信息"""
        return {chat_id: learner.get_stats() for chat_id, learner in self.learners.items()}
-    
+
    def save_all_models(self) -> bool:
        """保存所有模型"""
        success_count = 0
        for learner in self.learners.values():
            if learner.save(self.model_save_path):
                success_count += 1
-        
+
        logger.info(f"已保存 {success_count}/{len(self.learners)} 个模型")
        return success_count == len(self.learners)
-    
+
    def load_all_models(self) -> int:
        """加载所有已保存的模型"""
        if not os.path.exists(self.model_save_path):
            return 0
-        
+
        loaded_count = 0
        for filename in os.listdir(self.model_save_path):
            if filename.endswith("_style_model.pkl"):
@@ -583,16 +585,16 @@ class StyleLearnerManager:
                if learner.load(self.model_save_path):
                    self.learners[chat_id] = learner
                    loaded_count += 1
-        
+
        logger.info(f"已加载 {loaded_count} 个模型")
        return loaded_count
-    
+
    async def start_auto_save(self) -> None:
        """启动自动保存任务"""
        if self._auto_save_task is None or self._auto_save_task.done():
            self._auto_save_task = asyncio.create_task(self._auto_save_loop())
            logger.info("已启动自动保存任务")
-    
+
    async def stop_auto_save(self) -> None:
        """停止自动保存任务"""
        if self._auto_save_task and not self._auto_save_task.done():
@@ -602,7 +604,7 @@ class StyleLearnerManager:
            except asyncio.CancelledError:
                pass
            logger.info("已停止自动保存任务")
-    
+
    async def _auto_save_loop(self) -> None:
        """自动保存循环"""
        while True: