memoryos-0.2.1-py3-none-any.whl → memoryos-0.2.2-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {memoryos-0.2.1.dist-info → memoryos-0.2.2.dist-info}/METADATA +2 -1
- {memoryos-0.2.1.dist-info → memoryos-0.2.2.dist-info}/RECORD +72 -55
- memos/__init__.py +1 -1
- memos/api/config.py +156 -65
- memos/api/context/context.py +147 -0
- memos/api/context/dependencies.py +90 -0
- memos/api/product_models.py +5 -1
- memos/api/routers/product_router.py +54 -26
- memos/configs/graph_db.py +49 -1
- memos/configs/internet_retriever.py +6 -0
- memos/configs/mem_os.py +5 -0
- memos/configs/mem_reader.py +9 -0
- memos/configs/mem_scheduler.py +18 -4
- memos/configs/mem_user.py +58 -0
- memos/graph_dbs/base.py +9 -1
- memos/graph_dbs/factory.py +2 -0
- memos/graph_dbs/nebular.py +1364 -0
- memos/graph_dbs/neo4j.py +4 -4
- memos/log.py +1 -1
- memos/mem_cube/utils.py +13 -6
- memos/mem_os/core.py +140 -30
- memos/mem_os/main.py +1 -1
- memos/mem_os/product.py +266 -152
- memos/mem_os/utils/format_utils.py +314 -67
- memos/mem_reader/simple_struct.py +13 -5
- memos/mem_scheduler/base_scheduler.py +220 -250
- memos/mem_scheduler/general_scheduler.py +193 -73
- memos/mem_scheduler/modules/base.py +5 -5
- memos/mem_scheduler/modules/dispatcher.py +6 -9
- memos/mem_scheduler/modules/misc.py +81 -16
- memos/mem_scheduler/modules/monitor.py +52 -41
- memos/mem_scheduler/modules/rabbitmq_service.py +9 -7
- memos/mem_scheduler/modules/retriever.py +108 -191
- memos/mem_scheduler/modules/scheduler_logger.py +255 -0
- memos/mem_scheduler/mos_for_test_scheduler.py +16 -19
- memos/mem_scheduler/schemas/__init__.py +0 -0
- memos/mem_scheduler/schemas/general_schemas.py +43 -0
- memos/mem_scheduler/schemas/message_schemas.py +148 -0
- memos/mem_scheduler/schemas/monitor_schemas.py +329 -0
- memos/mem_scheduler/utils/__init__.py +0 -0
- memos/mem_scheduler/utils/filter_utils.py +176 -0
- memos/mem_scheduler/utils/misc_utils.py +61 -0
- memos/mem_user/factory.py +94 -0
- memos/mem_user/mysql_persistent_user_manager.py +271 -0
- memos/mem_user/mysql_user_manager.py +500 -0
- memos/mem_user/persistent_factory.py +96 -0
- memos/mem_user/user_manager.py +4 -4
- memos/memories/activation/item.py +4 -0
- memos/memories/textual/base.py +1 -1
- memos/memories/textual/general.py +35 -91
- memos/memories/textual/item.py +5 -33
- memos/memories/textual/tree.py +13 -7
- memos/memories/textual/tree_text_memory/organize/conflict.py +4 -2
- memos/memories/textual/tree_text_memory/organize/relation_reason_detector.py +47 -43
- memos/memories/textual/tree_text_memory/organize/reorganizer.py +8 -5
- memos/memories/textual/tree_text_memory/retrieve/internet_retriever.py +6 -3
- memos/memories/textual/tree_text_memory/retrieve/internet_retriever_factory.py +2 -0
- memos/memories/textual/tree_text_memory/retrieve/retrieval_mid_structs.py +2 -0
- memos/memories/textual/tree_text_memory/retrieve/searcher.py +46 -23
- memos/memories/textual/tree_text_memory/retrieve/task_goal_parser.py +42 -15
- memos/memories/textual/tree_text_memory/retrieve/utils.py +11 -7
- memos/memories/textual/tree_text_memory/retrieve/xinyusearch.py +62 -58
- memos/memos_tools/dinding_report_bot.py +422 -0
- memos/memos_tools/notification_service.py +44 -0
- memos/memos_tools/notification_utils.py +96 -0
- memos/settings.py +3 -1
- memos/templates/mem_reader_prompts.py +2 -1
- memos/templates/mem_scheduler_prompts.py +41 -7
- memos/templates/mos_prompts.py +87 -0
- memos/mem_scheduler/modules/schemas.py +0 -328
- memos/mem_scheduler/utils.py +0 -75
- {memoryos-0.2.1.dist-info → memoryos-0.2.2.dist-info}/LICENSE +0 -0
- {memoryos-0.2.1.dist-info → memoryos-0.2.2.dist-info}/WHEEL +0 -0
- {memoryos-0.2.1.dist-info → memoryos-0.2.2.dist-info}/entry_points.txt +0 -0
memos/mem_os/utils/format_utils.py
@@ -239,10 +239,10 @@ def sample_nodes_with_type_balance(
         "MetaMemory": 0.05,  # 5%
     }
 
-
+    logger.info(
         f"Starting type-balanced sampling, original nodes: {len(nodes)}, target nodes: {target_count}"
     )
-
+    logger.info(f"Target type ratios: {type_ratios}")
 
     # Analyze current node type distribution
     current_type_counts = {}
@@ -255,7 +255,7 @@ def sample_nodes_with_type_balance(
             nodes_by_type[memory_type] = []
         nodes_by_type[memory_type].append(node)
 
-
+    logger.info(f"Current type distribution: {current_type_counts}")
 
     # Calculate target node count for each type
     type_targets = {}
@@ -290,7 +290,7 @@ def sample_nodes_with_type_balance(
             )
             type_targets[memory_type] = type_targets.get(memory_type, 0) + additional
 
-
+    logger.info(f"Target node count for each type: {type_targets}")
 
     # Perform subtree quality sampling for each type
    selected_nodes = []
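The hunks above instrument `sample_nodes_with_type_balance`, which budgets the target node count across memory types from `type_ratios` and then distributes any leftover slots as `additional`. For orientation, a minimal sketch of that allocation pattern — the helper name, rounding, and remainder handling here are our assumptions for illustration, not the package's exact code:

def allocate_type_targets(
    counts: dict[str, int], ratios: dict[str, float], target_count: int
) -> dict[str, int]:
    # Floor each type's share of the budget, capped by what is available.
    targets = {t: min(counts[t], int(target_count * ratios.get(t, 0))) for t in counts}
    # Hand leftover slots to the types with the most unselected nodes.
    remaining = target_count - sum(targets.values())
    for t in sorted(counts, key=lambda t: counts[t] - targets[t], reverse=True):
        if remaining <= 0:
            break
        additional = min(remaining, counts[t] - targets[t])
        targets[t] += additional
        remaining -= additional
    return targets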
@@ -300,16 +300,18 @@ def sample_nodes_with_type_balance(
             continue
 
         type_nodes = nodes_by_type[memory_type]
-
+        logger.info(
+            f"\n--- Processing {memory_type} type: {len(type_nodes)} -> {target_for_type} ---"
+        )
 
         if len(type_nodes) <= target_for_type:
             selected_nodes.extend(type_nodes)
-
+            logger.info(f" Select all: {len(type_nodes)} nodes")
         else:
             # Use enhanced subtree quality sampling
             type_selected = sample_by_enhanced_subtree_quality(type_nodes, edges, target_for_type)
             selected_nodes.extend(type_selected)
-
+            logger.info(f" Sampled selection: {len(type_selected)} nodes")
 
     # Filter edges
     selected_node_ids = {node["id"] for node in selected_nodes}
@@ -319,8 +321,8 @@ def sample_nodes_with_type_balance(
         if edge["source"] in selected_node_ids and edge["target"] in selected_node_ids
     ]
 
-
-
+    logger.info(f"\nFinal selected nodes: {len(selected_nodes)}")
+    logger.info(f"Final edges: {len(filtered_edges)}")
 
     # Verify final type distribution
     final_type_counts = {}
@@ -328,11 +330,11 @@ def sample_nodes_with_type_balance(
         memory_type = node.get("metadata", {}).get("memory_type", "Unknown")
         final_type_counts[memory_type] = final_type_counts.get(memory_type, 0) + 1
 
-
+    logger.info(f"Final type distribution: {final_type_counts}")
    for memory_type, count in final_type_counts.items():
         percentage = count / len(selected_nodes) * 100
         target_percentage = type_ratios.get(memory_type, 0) * 100
-
+        logger.info(
            f" {memory_type}: {count} nodes ({percentage:.1f}%, target: {target_percentage:.1f}%)"
        )
 
@@ -358,9 +360,9 @@ def sample_by_enhanced_subtree_quality(
         subtree_analysis.items(), key=lambda x: x[1]["quality_score"], reverse=True
     )
 
-
+    logger.info(" Subtree quality ranking:")
     for i, (root_id, analysis) in enumerate(sorted_subtrees[:5]):
-
+        logger.info(
             f"  #{i + 1} Root node {root_id}: Quality={analysis['quality_score']:.2f}, "
             f"Depth={analysis['max_depth']}, Branches={analysis['branch_nodes']}, "
             f"Leaves={analysis['leaf_count']}, Max Width={analysis['max_width']}"
@@ -386,7 +388,7 @@ def sample_by_enhanced_subtree_quality(
                 if node:
                     selected_nodes.append(node)
                     selected_node_ids.add(node_id)
-
+            logger.info(f" Select entire subtree {root_id}: +{len(new_nodes)} nodes")
         else:
             # Subtree too large, need partial selection
             if analysis["quality_score"] > 5:  # Only partial selection for high-quality subtrees
@@ -398,7 +400,7 @@ def sample_by_enhanced_subtree_quality(
                 selected_nodes.extend(partial_selection)
                 for node in partial_selection:
                     selected_node_ids.add(node["id"])
-
+                logger.info(
                     f" Partial selection of subtree {root_id}: +{len(partial_selection)} nodes"
                 )
 
@@ -411,7 +413,7 @@ def sample_by_enhanced_subtree_quality(
         remaining_count = target_count - len(selected_nodes)
         additional = sample_nodes_by_importance(remaining_nodes, edges, remaining_count)
         selected_nodes.extend(additional)
-
+        logger.info(f" Supplementary selection: +{len(additional)} nodes")
 
     return selected_nodes
 
@@ -493,7 +495,7 @@ def sample_nodes_by_importance(
 # Modified main function to use new sampling strategy
 def convert_graph_to_tree_forworkmem(
     json_data: dict[str, Any],
-    target_node_count: int =
+    target_node_count: int = 200,
     type_ratios: dict[str, float] | None = None,
 ) -> dict[str, Any]:
     """
@@ -502,8 +504,8 @@ def convert_graph_to_tree_forworkmem(
     original_nodes = json_data.get("nodes", [])
     original_edges = json_data.get("edges", [])
 
-
-
+    logger.info(f"Original node count: {len(original_nodes)}")
+    logger.info(f"Target node count: {target_node_count}")
     filter_original_edges = []
     for original_edge in original_edges:
         if original_edge["type"] == "PARENT":
@@ -531,7 +533,7 @@ def convert_graph_to_tree_forworkmem(
         node_name = extract_node_name(memory)
         memory_key = node.get("metadata", {}).get("key", node_name)
         usage = node.get("metadata", {}).get("usage", [])
-        frequency = len(usage)
+        frequency = len(usage) if len(usage) < 100 else 100
         node_map[node["id"]] = {
             "id": node["id"],
             "value": memory,
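The one functional change in this hunk caps the usage-derived frequency at 100, which is the clamp idiom below (an equivalent rewrite for clarity, not the code the package ships):

frequency = min(len(usage), 100)  # heavily used nodes no longer dominate the weighting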
@@ -633,7 +635,7 @@ def convert_graph_to_tree_forworkmem(
 
 
 def print_tree_structure(node: dict[str, Any], level: int = 0, max_level: int = 5):
-    """
+    """logger.info the first few layers of tree structure for easy viewing"""
     if level > max_level:
         return
 
@@ -647,21 +649,21 @@ def print_tree_structure(node: dict[str, Any], level: int = 0, max_level: int =
     children = node.get("children", [])
     if children:
         # Intermediate node, display name, type and child count
-
-
+        logger.info(f"{indent}- {node_name} [{memory_type}] ({len(children)} children)")
+        logger.info(f"{indent} ID: {node_id}")
         display_value = node_value[:80] + "..." if len(node_value) > 80 else node_value
-
+        logger.info(f"{indent} Value: {display_value}")
 
         if level < max_level:
             for child in children:
                 print_tree_structure(child, level + 1, max_level)
         elif level == max_level:
-
+            logger.info(f"{indent} ... (expansion limited)")
     else:
         # Leaf node, display name, type and value
         display_value = node_value[:80] + "..." if len(node_value) > 80 else node_value
-
-
+        logger.info(f"{indent}- {node_name} [{memory_type}]: {display_value}")
+        logger.info(f"{indent} ID: {node_id}")
 
 
 def analyze_final_tree_quality(tree_data: dict[str, Any]) -> dict:
@@ -856,107 +858,107 @@ def analyze_final_tree_quality(tree_data: dict[str, Any]) -> dict:
 
 
 def print_tree_analysis(tree_data: dict[str, Any]):
-    """
+    """logger.info enhanced tree analysis results"""
     stats = analyze_final_tree_quality(tree_data)
 
-
-
-
+    logger.info("\n" + "=" * 60)
+    logger.info("🌳 Enhanced Tree Structure Quality Analysis Report")
+    logger.info("=" * 60)
 
     # Basic statistics
-
-
-
-
+    logger.info("\n📊 Basic Statistics:")
+    logger.info(f" Total nodes: {stats['total_nodes']}")
+    logger.info(f" Max depth: {stats['max_depth']}")
+    logger.info(
         f" Leaf nodes: {stats['total_leaves']} ({stats['total_leaves'] / stats['total_nodes'] * 100:.1f}%)"
     )
-
+    logger.info(
         f" Branch nodes: {stats['total_branches']} ({stats['total_branches'] / stats['total_nodes'] * 100:.1f}%)"
     )
 
     # Structure quality assessment
     structure = stats.get("structure_quality", {})
     if structure:
-
-
+        logger.info("\n🏗️ Structure Quality Assessment:")
+        logger.info(
             f" Branch density: {structure['branch_density']:.3f} ({'✅ Good' if 0.2 <= structure['branch_density'] <= 0.6 else '⚠️ Needs improvement'})"
         )
-
+        logger.info(
             f" Leaf ratio: {structure['leaf_ratio']:.3f} ({'✅ Good' if 0.3 <= structure['leaf_ratio'] <= 0.7 else '⚠️ Needs improvement'})"
         )
-
-
+        logger.info(f" Max width: {structure['max_width']}")
+        logger.info(
             f" Depth-width ratio: {structure['depth_width_ratio']:.2f} ({'✅ Good' if structure['depth_width_ratio'] <= 3 else '⚠️ Too thin'})"
         )
-
+        logger.info(
             f" Overall balance: {'✅ Good' if structure['is_well_balanced'] else '⚠️ Needs improvement'}"
         )
 
     # Single chain analysis
     chain_analysis = stats.get("chain_analysis", {})
     if chain_analysis:
-
-
-
-
+        logger.info("\n🔗 Single Chain Structure Analysis:")
+        logger.info(f" Longest chain: {chain_analysis.get('max_chain_length', 0)} layers")
+        logger.info(f" Single chain subtrees: {chain_analysis.get('single_chain_subtrees', 0)}")
+        logger.info(
             f" Single chain subtree ratio: {chain_analysis.get('chain_subtree_ratio', 0) * 100:.1f}%"
         )
 
         if chain_analysis.get("max_chain_length", 0) > 5:
-
+            logger.info(" ⚠️ Warning: Overly long single chain structure may affect display")
        elif chain_analysis.get("chain_subtree_ratio", 0) > 0.3:
-
+            logger.info(
                 " ⚠️ Warning: Too many single chain subtrees, suggest increasing branch structure"
             )
         else:
-
+            logger.info(" ✅ Single chain structure well controlled")
 
     # Type diversity
     type_div = stats.get("type_diversity", {})
     if type_div:
-
-
-
-
-
+        logger.info("\n🎨 Type Diversity Analysis:")
+        logger.info(f" Total types: {type_div['total_types']}")
+        logger.info(f" Diversity index: {type_div['shannon_diversity']:.3f}")
+        logger.info(f" Normalized diversity: {type_div['normalized_diversity']:.3f}")
+        logger.info(f" Distribution balance: {type_div['distribution_balance']:.3f}")
 
     # Type distribution
-
+    logger.info("\n📋 Type Distribution Details:")
     for mem_type, count in sorted(stats["by_type"].items(), key=lambda x: x[1], reverse=True):
         percentage = count / stats["total_nodes"] * 100
-
+        logger.info(f" {mem_type}: {count} nodes ({percentage:.1f}%)")
 
     # Depth distribution
-
+    logger.info("\n📏 Depth Distribution:")
     for depth in sorted(stats["by_depth"].keys()):
         count = stats["by_depth"][depth]
-
+        logger.info(f" Depth {depth}: {count} nodes")
 
     # Major subtree analysis
     if stats["subtrees"]:
-
+        logger.info("\n🌲 Major Subtree Analysis (sorted by quality):")
         sorted_subtrees = sorted(
             stats["subtrees"], key=lambda x: x.get("quality_score", 0), reverse=True
         )
         for i, subtree in enumerate(sorted_subtrees[:8]):  # Show first 8
             quality = subtree.get("quality_score", 0)
-
-
-
+            logger.info(f" #{i + 1} {subtree['root']} [{subtree['type']}]:")
+            logger.info(f" Quality score: {quality:.2f}")
+            logger.info(
                 f" Structure: Depth={subtree['depth']}, Branches={subtree['branches']}, Leaves={subtree['leaves']}"
             )
-
+            logger.info(
                 f" Density: Branch density={subtree.get('branch_density', 0):.3f}, Leaf ratio={subtree.get('leaf_ratio', 0):.3f}"
             )
 
             if quality > 15:
-
+                logger.info(" ✅ High quality subtree")
             elif quality > 8:
-
+                logger.info(" 🟡 Medium quality subtree")
             else:
-
+                logger.info(" 🔴 Low quality subtree")
 
-
+    logger.info("\n" + "=" * 60)
 
 
 def remove_embedding_recursive(memory_info: dict) -> Any:
@@ -1152,3 +1154,248 @@ def convert_activation_memory_summary(act_mem_items: list[KVCacheItem]) -> dict[
         "total_parameters": total_parameters,
         "summary": f"Activation memory contains {total_items} items with {total_layers} layers and approximately {total_parameters:,} parameters",
     }
+
+
+def detect_and_remove_duplicate_ids(tree_node: dict[str, Any]) -> dict[str, Any]:
+    """
+    Detect and remove duplicate IDs in tree structure by skipping duplicate nodes.
+    First occurrence of each ID is kept, subsequent duplicates are removed.
+
+    Args:
+        tree_node: Tree node (dictionary format)
+
+    Returns:
+        dict: Fixed tree node with duplicate nodes removed
+    """
+    used_ids = set()
+    removed_count = 0
+
+    def remove_duplicates_recursive(
+        node: dict[str, Any], parent_path: str = ""
+    ) -> dict[str, Any] | None:
+        """Recursively remove duplicate IDs by skipping duplicate nodes"""
+        nonlocal removed_count
+
+        if not isinstance(node, dict):
+            return node
+
+        # Create node copy
+        fixed_node = node.copy()
+
+        # Handle current node ID
+        current_id = fixed_node.get("id", "")
+        if current_id in used_ids and current_id not in ["root", "WorkingMemory"]:
+            # Skip this duplicate node
+            logger.info(f"Skipping duplicate node: {current_id} (path: {parent_path})")
+            removed_count += 1
+            return None  # Return None to indicate this node should be removed
+        else:
+            used_ids.add(current_id)
+
+        # Recursively process child nodes
+        if "children" in fixed_node and isinstance(fixed_node["children"], list):
+            fixed_children = []
+            for i, child in enumerate(fixed_node["children"]):
+                child_path = f"{parent_path}/{fixed_node.get('node_name', 'unknown')}[{i}]"
+                fixed_child = remove_duplicates_recursive(child, child_path)
+                if fixed_child is not None:  # Only add non-None children
+                    fixed_children.append(fixed_child)
+            fixed_node["children"] = fixed_children
+
+        return fixed_node
+
+    result = remove_duplicates_recursive(tree_node)
+    if result is not None:
+        logger.info(f"Removed {removed_count} duplicate nodes")
+        return result
+    else:
+        # If root node itself was removed (shouldn't happen), return empty root
+        return {
+            "id": "root",
+            "node_name": "root",
+            "value": "root",
+            "memory_type": "Root",
+            "children": [],
+        }
+
+
+def validate_tree_structure(tree_node: dict[str, Any]) -> dict[str, Any]:
+    """
+    Validate tree structure integrity, including ID uniqueness check
+
+    Args:
+        tree_node: Tree node (dictionary format)
+
+    Returns:
+        dict: Validation result containing error messages and fix suggestions
+    """
+    validation_result = {
+        "is_valid": True,
+        "errors": [],
+        "warnings": [],
+        "total_nodes": 0,
+        "unique_ids": set(),
+        "duplicate_ids": set(),
+        "missing_ids": set(),
+        "invalid_structure": [],
+    }
+
+    def validate_recursive(node: dict[str, Any], path: str = "", depth: int = 0):
+        """Recursively validate tree structure"""
+        if not isinstance(node, dict):
+            validation_result["errors"].append(f"Node is not a dictionary: {path}")
+            validation_result["is_valid"] = False
+            return
+
+        validation_result["total_nodes"] += 1
+
+        # Check required fields
+        if "id" not in node:
+            validation_result["errors"].append(f"Node missing ID field: {path}")
+            validation_result["missing_ids"].add(path)
+            validation_result["is_valid"] = False
+        else:
+            node_id = node["id"]
+            if node_id in validation_result["unique_ids"]:
+                validation_result["errors"].append(f"Duplicate node ID: {node_id} (path: {path})")
+                validation_result["duplicate_ids"].add(node_id)
+                validation_result["is_valid"] = False
+            else:
+                validation_result["unique_ids"].add(node_id)
+
+        # Check other required fields
+        required_fields = ["node_name", "value", "memory_type"]
+        for field in required_fields:
+            if field not in node:
+                validation_result["warnings"].append(f"Node missing field '{field}': {path}")
+
+        # Recursively validate child nodes
+        if "children" in node:
+            if not isinstance(node["children"], list):
+                validation_result["errors"].append(f"Children field is not a list: {path}")
+                validation_result["is_valid"] = False
+            else:
+                for i, child in enumerate(node["children"]):
+                    child_path = f"{path}/children[{i}]"
+                    validate_recursive(child, child_path, depth + 1)
+
+        # Check depth limit
+        if depth > 20:
+            validation_result["warnings"].append(f"Tree depth too deep ({depth}): {path}")
+
+    validate_recursive(tree_node)
+
+    # Generate fix suggestions
+    if validation_result["duplicate_ids"]:
+        validation_result["fix_suggestion"] = (
+            "Use detect_and_fix_duplicate_ids() function to fix duplicate IDs"
+        )
+
+    return validation_result
+
+
+def ensure_unique_tree_ids(tree_result: dict[str, Any]) -> dict[str, Any]:
+    """
+    Ensure all node IDs in tree structure are unique by removing duplicate nodes,
+    this is a post-processing function for convert_graph_to_tree_forworkmem
+
+    Args:
+        tree_result: Tree structure returned by convert_graph_to_tree_forworkmem
+
+    Returns:
+        dict: Fixed tree structure with duplicate nodes removed
+    """
+    logger.info("🔍 Starting duplicate ID check in tree structure...")
+
+    # First validate tree structure
+    validation = validate_tree_structure(tree_result)
+
+    if validation["is_valid"]:
+        logger.info("Tree structure validation passed, no duplicate IDs found")
+        return tree_result
+
+    # Report issues
+    logger.info(f"Found {len(validation['errors'])} errors:")
+    for error in validation["errors"][:5]:  # Only show first 5 errors
+        logger.info(f" - {error}")
+
+    if len(validation["errors"]) > 5:
+        logger.info(f" ... and {len(validation['errors']) - 5} more errors")
+
+    logger.info("Statistics:")
+    logger.info(f" - Total nodes: {validation['total_nodes']}")
+    logger.info(f" - Unique IDs: {len(validation['unique_ids'])}")
+    logger.info(f" - Duplicate IDs: {len(validation['duplicate_ids'])}")
+
+    # Remove duplicate nodes
+    logger.info(" Starting duplicate node removal...")
+    fixed_tree = detect_and_remove_duplicate_ids(tree_result)
+
+    # Validate again
+    post_validation = validate_tree_structure(fixed_tree)
+    if post_validation["is_valid"]:
+        logger.info("Removal completed, tree structure is now valid")
+        logger.info(f"Final node count: {post_validation['total_nodes']}")
+    else:
+        logger.info("Issues remain after removal, please check code logic")
+        for error in post_validation["errors"][:3]:
+            logger.info(f" - {error}")
+
+    return fixed_tree
+
+
+def clean_json_response(response: str) -> str:
+    """
+    Remove markdown JSON code block formatting from LLM response.
+
+    Args:
+        response: Raw response string that may contain ```json and ```
+
+    Returns:
+        str: Clean JSON string without markdown formatting
+    """
+    return response.replace("```json", "").replace("```", "").strip()
+
+
+def split_continuous_references(text: str) -> str:
+    """
+    Split continuous reference tags into individual reference tags.
+
+    Converts patterns like [1:92ff35fb, 4:bfe6f044] to [1:92ff35fb] [4:bfe6f044]
+
+    Only processes text if:
+    1. '[' appears exactly once
+    2. ']' appears exactly once
+    3. Contains commas between '[' and ']'
+
+    Args:
+        text (str): Text containing reference tags
+
+    Returns:
+        str: Text with split reference tags, or original text if conditions not met
+    """
+    # Early return if text is empty
+    if not text:
+        return text
+    # Check if '[' appears exactly once
+    if text.count("[") != 1:
+        return text
+    # Check if ']' appears exactly once
+    if text.count("]") != 1:
+        return text
+    # Find positions of brackets
+    open_bracket_pos = text.find("[")
+    close_bracket_pos = text.find("]")
+
+    # Check if brackets are in correct order
+    if open_bracket_pos >= close_bracket_pos:
+        return text
+    # Extract content between brackets
+    content_between_brackets = text[open_bracket_pos + 1 : close_bracket_pos]
+    # Check if there's a comma between brackets
+    if "," not in content_between_brackets:
+        return text
+    text = text.replace(content_between_brackets, content_between_brackets.replace(", ", "]["))
+    text = text.replace(content_between_brackets, content_between_brackets.replace(",", "]["))
+
+    return text
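The functions added in this hunk form a small post-processing toolkit: validate_tree_structure reports duplicate or missing IDs, detect_and_remove_duplicate_ids drops repeated nodes (keeping the first occurrence), ensure_unique_tree_ids chains the two, and clean_json_response / split_continuous_references tidy LLM output. A minimal usage sketch, with invented sample inputs (graph_json stands in for a real graph export):

# Strip markdown fences from an LLM reply before json.loads().
raw = '```json\n{"refs": "[1:92ff35fb, 4:bfe6f044]"}\n```'
payload = clean_json_response(raw)  # '{"refs": "[1:92ff35fb, 4:bfe6f044]"}'

# Split a combined citation into individual tags.
refs = split_continuous_references("[1:92ff35fb, 4:bfe6f044]")  # '[1:92ff35fb][4:bfe6f044]'

# De-duplicate a converted tree before handing it to the UI.
tree = convert_graph_to_tree_forworkmem(graph_json, target_node_count=200)
tree = ensure_unique_tree_ids(tree)  # validates first, removes duplicates only if needed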
memos/mem_reader/simple_struct.py
@@ -58,9 +58,13 @@ class SimpleStructMemReader(BaseMemReader, ABC):
                 metadata=TreeNodeTextualMemoryMetadata(
                     user_id=info.get("user_id"),
                     session_id=info.get("session_id"),
-                    memory_type=memory_i_raw.get("memory_type", "")
+                    memory_type=memory_i_raw.get("memory_type", "")
+                    .replace("长期记忆", "LongTermMemory")
+                    .replace("用户记忆", "UserMemory"),
                     status="activated",
-                    tags=memory_i_raw.get("tags",
+                    tags=memory_i_raw.get("tags", [])
+                    if type(memory_i_raw.get("tags", [])) is list
+                    else [],
                     key=memory_i_raw.get("key", ""),
                     embedding=self.embedder.embed([memory_i_raw.get("value", "")])[0],
                     usage=[],
@@ -176,8 +180,12 @@ class SimpleStructMemReader(BaseMemReader, ABC):
         elif type == "doc":
             for item in scene_data:
                 try:
-
-
+                    if not isinstance(item, str):
+                        parsed_text = parser.parse(item)
+                        results.append({"file": "pure_text", "text": parsed_text})
+                    else:
+                        parsed_text = item
+                        results.append({"file": item, "text": parsed_text})
                 except Exception as e:
                     print(f"Error parsing file {item}: {e!s}")
 
@@ -214,7 +222,7 @@ class SimpleStructMemReader(BaseMemReader, ABC):
                     session_id=info.get("session_id"),
                     memory_type="LongTermMemory",
                     status="activated",
-                    tags=chunk_res["tags"],
+                    tags=chunk_res["tags"] if type(chunk_res["tags"]) is list else [],
                     key=chunk_res["key"],
                     embedding=self.embedder.embed([chunk_res["value"]])[0],
                     usage=[],