remove：移除无用代码

2025-09-29 21:24:23 +08:00
parent a3390f6cba
commit d519406e4a
5 changed files with 40 additions and 771 deletions
--- a/src/migrate_helper/migrate.py
+++ b/src/migrate_helper/migrate.py
@@ -6,211 +6,6 @@ from src.common.logger import get_logger

 logger = get_logger("migrate")

-
-async def migrate_memory_items_to_string():
-    """
-    将数据库中记忆节点的memory_items从list格式迁移到string格式
-    并根据原始list的项目数量设置weight值
-    """
-    logger.info("开始迁移记忆节点格式...")
-
-    migration_stats = {
-        "total_nodes": 0,
-        "converted_nodes": 0,
-        "already_string_nodes": 0,
-        "empty_nodes": 0,
-        "error_nodes": 0,
-        "weight_updated_nodes": 0,
-        "truncated_nodes": 0,
-    }
-
-    try:
-        # 获取所有图节点
-        all_nodes = GraphNodes.select()
-        migration_stats["total_nodes"] = all_nodes.count()
-
-        logger.info(f"找到 {migration_stats['total_nodes']} 个记忆节点")
-
-        for node in all_nodes:
-            try:
-                concept = node.concept
-                memory_items_raw = node.memory_items.strip() if node.memory_items else ""
-                original_weight = node.weight if hasattr(node, "weight") and node.weight is not None else 1.0
-
-                # 如果为空，跳过
-                if not memory_items_raw:
-                    migration_stats["empty_nodes"] += 1
-                    logger.debug(f"跳过空节点: {concept}")
-                    continue
-
-                try:
-                    # 尝试解析JSON
-                    parsed_data = json.loads(memory_items_raw)
-
-                    if isinstance(parsed_data, list):
-                        # 如果是list格式，需要转换
-                        if parsed_data:
-                            # 转换为字符串格式
-                            new_memory_items = " | ".join(str(item) for item in parsed_data)
-                            original_length = len(new_memory_items)
-
-                            # 检查长度并截断
-                            if len(new_memory_items) > 100:
-                                new_memory_items = new_memory_items[:100]
-                                migration_stats["truncated_nodes"] += 1
-                                logger.debug(f"节点 '{concept}' 内容过长，从 {original_length} 字符截断到 100 字符")
-
-                            new_weight = float(len(parsed_data))  # weight = list项目数量
-
-                            # 更新数据库
-                            node.memory_items = new_memory_items
-                            node.weight = new_weight
-                            node.save()
-
-                            migration_stats["converted_nodes"] += 1
-                            migration_stats["weight_updated_nodes"] += 1
-
-                            length_info = f" (截断: {original_length}→100)" if original_length > 100 else ""
-                            logger.info(
-                                f"转换节点 '{concept}': {len(parsed_data)} 项 -> 字符串{length_info}, weight: {original_weight} -> {new_weight}"
-                            )
-                        else:
-                            # 空list，设置为空字符串
-                            node.memory_items = ""
-                            node.weight = 1.0
-                            node.save()
-
-                            migration_stats["converted_nodes"] += 1
-                            logger.debug(f"转换空list节点: {concept}")
-
-                    elif isinstance(parsed_data, str):
-                        # 已经是字符串格式，检查长度和weight
-                        current_content = parsed_data
-                        original_length = len(current_content)
-                        content_truncated = False
-
-                        # 检查长度并截断
-                        if len(current_content) > 100:
-                            current_content = current_content[:100]
-                            content_truncated = True
-                            migration_stats["truncated_nodes"] += 1
-                            node.memory_items = current_content
-                            logger.debug(f"节点 '{concept}' 字符串内容过长，从 {original_length} 字符截断到 100 字符")
-
-                        # 检查weight是否需要更新
-                        update_needed = False
-                        if original_weight == 1.0:
-                            # 如果weight还是默认值，可以根据内容复杂度估算
-                            content_parts = (
-                                current_content.split(" | ") if " | " in current_content else [current_content]
-                            )
-                            estimated_weight = max(1.0, float(len(content_parts)))
-
-                            if estimated_weight != original_weight:
-                                node.weight = estimated_weight
-                                update_needed = True
-                                logger.debug(f"更新字符串节点权重 '{concept}': {original_weight} -> {estimated_weight}")
-
-                        # 如果内容被截断或权重需要更新，保存到数据库
-                        if content_truncated or update_needed:
-                            node.save()
-                            if update_needed:
-                                migration_stats["weight_updated_nodes"] += 1
-                            if content_truncated:
-                                migration_stats["converted_nodes"] += 1  # 算作转换节点
-                            else:
-                                migration_stats["already_string_nodes"] += 1
-                        else:
-                            migration_stats["already_string_nodes"] += 1
-
-                    else:
-                        # 其他JSON类型，转换为字符串
-                        new_memory_items = str(parsed_data) if parsed_data else ""
-                        original_length = len(new_memory_items)
-
-                        # 检查长度并截断
-                        if len(new_memory_items) > 100:
-                            new_memory_items = new_memory_items[:100]
-                            migration_stats["truncated_nodes"] += 1
-                            logger.debug(f"节点 '{concept}' 其他类型内容过长，从 {original_length} 字符截断到 100 字符")
-
-                        node.memory_items = new_memory_items
-                        node.weight = 1.0
-                        node.save()
-
-                        migration_stats["converted_nodes"] += 1
-                        length_info = f" (截断: {original_length}→100)" if original_length > 100 else ""
-                        logger.debug(f"转换其他类型节点: {concept}{length_info}")
-
-                except json.JSONDecodeError:
-                    # 不是JSON格式，假设已经是纯字符串
-                    # 检查是否是带引号的字符串
-                    if memory_items_raw.startswith('"') and memory_items_raw.endswith('"'):
-                        # 去掉引号
-                        clean_content = memory_items_raw[1:-1]
-                        original_length = len(clean_content)
-
-                        # 检查长度并截断
-                        if len(clean_content) > 100:
-                            clean_content = clean_content[:100]
-                            migration_stats["truncated_nodes"] += 1
-                            logger.debug(f"节点 '{concept}' 去引号内容过长，从 {original_length} 字符截断到 100 字符")
-
-                        node.memory_items = clean_content
-                        node.save()
-
-                        migration_stats["converted_nodes"] += 1
-                        length_info = f" (截断: {original_length}→100)" if original_length > 100 else ""
-                        logger.debug(f"去除引号节点: {concept}{length_info}")
-                    else:
-                        # 已经是纯字符串格式，检查长度
-                        current_content = memory_items_raw
-                        original_length = len(current_content)
-
-                        # 检查长度并截断
-                        if len(current_content) > 100:
-                            current_content = current_content[:100]
-                            node.memory_items = current_content
-                            node.save()
-
-                            migration_stats["converted_nodes"] += 1  # 算作转换节点
-                            migration_stats["truncated_nodes"] += 1
-                            logger.debug(f"节点 '{concept}' 纯字符串内容过长，从 {original_length} 字符截断到 100 字符")
-                        else:
-                            migration_stats["already_string_nodes"] += 1
-                            logger.debug(f"已是字符串格式节点: {concept}")
-
-            except Exception as e:
-                migration_stats["error_nodes"] += 1
-                logger.error(f"处理节点 {concept} 时发生错误: {e}")
-                continue
-
-    except Exception as e:
-        logger.error(f"迁移过程中发生严重错误: {e}")
-        raise
-
-    # 输出迁移统计
-    logger.info("=== 记忆节点迁移完成 ===")
-    logger.info(f"总节点数: {migration_stats['total_nodes']}")
-    logger.info(f"已转换节点: {migration_stats['converted_nodes']}")
-    logger.info(f"已是字符串格式: {migration_stats['already_string_nodes']}")
-    logger.info(f"空节点: {migration_stats['empty_nodes']}")
-    logger.info(f"错误节点: {migration_stats['error_nodes']}")
-    logger.info(f"权重更新节点: {migration_stats['weight_updated_nodes']}")
-    logger.info(f"内容截断节点: {migration_stats['truncated_nodes']}")
-
-    success_rate = (
-        (migration_stats["converted_nodes"] + migration_stats["already_string_nodes"])
-        / migration_stats["total_nodes"]
-        * 100
-        if migration_stats["total_nodes"] > 0
-        else 0
-    )
-    logger.info(f"迁移成功率: {success_rate:.1f}%")
-
-    return migration_stats
-
-
 async def set_all_person_known():
    """
    将person_info库中所有记录的is_known字段设置为True
@@ -312,7 +107,6 @@ async def check_and_run_migrations():
        # 执行迁移函数
        # 依次执行两个异步函数
        await asyncio.sleep(3)
-        await migrate_memory_items_to_string()
        await set_all_person_known()
        # 创建done.mem文件
        with open(done_file, "w", encoding="utf-8") as f: