claude-self-reflect 4.0.3 → 5.0.2
@@ -5,11 +5,22 @@ import sys
 import importlib
 import logging
 from pathlib import Path
-from typing import Dict, List, Optional
+from typing import Dict, List, Optional
 from fastmcp import Context
 from pydantic import Field
 import hashlib
 import json
+import asyncio
+
+# Import security module - handle both relative and absolute imports
+try:
+    from .security_patches import ModuleWhitelist
+except ImportError:
+    try:
+        from security_patches import ModuleWhitelist
+    except ImportError:
+        # Security module is required - fail closed, not open
+        raise RuntimeError("Security module 'security_patches' is required for code reload functionality")
 
 logger = logging.getLogger(__name__)
 
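The security_patches module is not part of this diff, so only the is_allowed_module call further down is visible. A minimal sketch of a fail-closed whitelist consistent with that call (the class body and the allowed names are assumptions, not the real module):

    # Hypothetical stand-in for security_patches.ModuleWhitelist
    class ModuleWhitelist:
        # Illustrative allow-list; the real entries are not shown in this diff
        _ALLOWED = frozenset({"src.code_reload", "src.search_tools", "src.safe_getters"})

        @classmethod
        def is_allowed_module(cls, module_name: str) -> bool:
            # Fail closed: anything not explicitly listed is rejected
            return module_name in cls._ALLOWED

The nested try/except keeps the import working both package-relative and as a flat script import, and the final RuntimeError guarantees the reloader cannot start without the whitelist.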
@@ -19,20 +30,36 @@ class CodeReloader:
 
     def __init__(self):
         """Initialize the code reloader."""
-        self.module_hashes: Dict[str, str] = {}
-        self.reload_history: List[Dict] = []
         self.cache_dir = Path.home() / '.claude-self-reflect' / 'reload_cache'
         self.cache_dir.mkdir(parents=True, exist_ok=True)
-
-
+        self.hash_file = self.cache_dir / 'module_hashes.json'
+        self._lock = asyncio.Lock()  # Thread safety for async operations
+
+        # Load persisted hashes from disk with error handling
+        if self.hash_file.exists():
+            try:
+                with open(self.hash_file, 'r') as f:
+                    self.module_hashes: Dict[str, str] = json.load(f)
+            except (json.JSONDecodeError, IOError) as e:
+                logger.error(f"Failed to load module hashes: {e}. Starting fresh.")
+                self.module_hashes: Dict[str, str] = {}
+        else:
+            self.module_hashes: Dict[str, str] = {}
+
+        self.reload_history: List[Dict] = []
+        logger.info(f"CodeReloader initialized with {len(self.module_hashes)} cached hashes")
 
     def _get_file_hash(self, filepath: Path) -> str:
         """Get SHA256 hash of a file."""
         with open(filepath, 'rb') as f:
             return hashlib.sha256(f.read()).hexdigest()
 
-    def
-        """Detect which modules have changed since last check.
+    def _detect_changed_modules(self) -> List[str]:
+        """Detect which modules have changed since last check.
+
+        This method ONLY detects changes, it does NOT update the stored hashes.
+        Use _update_module_hashes() to update hashes after successful reload.
+        """
         changed = []
         src_dir = Path(__file__).parent
 
@@ -43,13 +70,61 @@ class CodeReloader:
             module_name = f"src.{py_file.stem}"
             current_hash = self._get_file_hash(py_file)
 
+            # Only detect changes, DO NOT update hashes here
             if module_name in self.module_hashes:
                 if self.module_hashes[module_name] != current_hash:
                     changed.append(module_name)
+                    logger.debug(f"Change detected in {module_name}: {self.module_hashes[module_name][:8]} -> {current_hash[:8]}")
+            else:
+                # New module not seen before
+                changed.append(module_name)
+                logger.debug(f"New module detected: {module_name}")
+
+        return changed
+
+    def _update_module_hashes(self, modules: Optional[List[str]] = None) -> None:
+        """Update the stored hashes for specified modules or all modules.
+
+        This should be called AFTER successful reload to mark modules as up-to-date.
+
+        Args:
+            modules: List of module names to update. If None, updates all modules.
+        """
+        src_dir = Path(__file__).parent
+        updated = []
+
+        for py_file in src_dir.glob("*.py"):
+            if py_file.name == "__pycache__":
+                continue
 
+            module_name = f"src.{py_file.stem}"
+
+            # If specific modules provided, only update those
+            if modules is not None and module_name not in modules:
+                continue
+
+            current_hash = self._get_file_hash(py_file)
+            old_hash = self.module_hashes.get(module_name, "new")
             self.module_hashes[module_name] = current_hash
+
+            if old_hash != current_hash:
+                updated.append(module_name)
+                logger.debug(f"Updated hash for {module_name}: {old_hash[:8] if old_hash != 'new' else 'new'} -> {current_hash[:8]}")
 
-
+        # Persist the updated hashes to disk using atomic write
+        temp_file = Path(str(self.hash_file) + '.tmp')
+        try:
+            with open(temp_file, 'w') as f:
+                json.dump(self.module_hashes, f, indent=2)
+            # Atomic rename on POSIX systems
+            temp_file.replace(self.hash_file)
+        except Exception as e:
+            logger.error(f"Failed to persist module hashes: {e}")
+            if temp_file.exists():
+                temp_file.unlink()  # Clean up temp file on failure
+
+        if updated:
+            logger.info(f"Updated hashes for {len(updated)} modules: {', '.join(updated)}")
 
     async def reload_modules(
         self,
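The persistence block above uses the standard write-to-temp-then-rename idiom: Path.replace calls os.replace, which renames atomically on POSIX filesystems, so a concurrent reader of module_hashes.json sees either the old or the new content, never a torn write. The same pattern in isolation (file name and data are illustrative):

    import json
    from pathlib import Path

    def atomic_write_json(target: Path, data: dict) -> None:
        # Write to a sibling temp file, then atomically swap it into place
        tmp = Path(str(target) + '.tmp')
        tmp.write_text(json.dumps(data, indent=2))
        tmp.replace(target)  # os.replace under the hood; atomic on POSIX

    atomic_write_json(Path('module_hashes.json'), {'src.example': 'deadbeef'})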
@@ -61,93 +136,98 @@ class CodeReloader:
 
         await ctx.debug("Starting code reload process...")
 
-        [old reload_modules implementation (lines 64-150) not preserved in this view, apart from a truncated "response +=" fragment]
+        async with self._lock:  # Ensure thread safety for reload operations
+            try:
+                # Track what we're reloading
+                reload_targets = []
+
+                if auto_detect:
+                    # Detect changed modules (without updating hashes)
+                    changed = self._detect_changed_modules()
+                    if changed:
+                        reload_targets.extend(changed)
+                        await ctx.debug(f"Auto-detected changes in: {changed}")
+
+                if modules:
+                    # Add explicitly requested modules
+                    reload_targets.extend(modules)
+
+                if not reload_targets:
+                    return "📊 No modules to reload. All code is up to date!"
+
+                # Perform the reload
+                reloaded = []
+                failed = []
+
+                for module_name in reload_targets:
+                    try:
+                        # SECURITY FIX: Validate module is in whitelist
+                        if not ModuleWhitelist.is_allowed_module(module_name):
+                            logger.warning(f"Module not in whitelist, skipping: {module_name}")
+                            failed.append((module_name, "Module not in whitelist"))
+                            continue
+
+                        if module_name in sys.modules:
+                            # Store old module reference for rollback
+                            old_module = sys.modules[module_name]
+
+                            # Reload the module
+                            logger.info(f"Reloading module: {module_name}")
+                            reloaded_module = importlib.reload(sys.modules[module_name])
+
+                            # Update any global references if needed
+                            self._update_global_references(module_name, reloaded_module)
+
+                            reloaded.append(module_name)
+                            await ctx.debug(f"✅ Reloaded: {module_name}")
+                        else:
+                            # Module not loaded yet, import it
+                            importlib.import_module(module_name)
+                            reloaded.append(module_name)
+                            await ctx.debug(f"✅ Imported: {module_name}")
+
+                    except Exception as e:
+                        logger.error(f"Failed to reload {module_name}: {e}", exc_info=True)
+                        failed.append((module_name, str(e)))
+                        await ctx.debug(f"❌ Failed: {module_name} - {e}")
+
+                # Update hashes ONLY for successfully reloaded modules
+                if reloaded:
+                    self._update_module_hashes(reloaded)
+                    await ctx.debug(f"Updated hashes for {len(reloaded)} successfully reloaded modules")
+
+                # Record reload history
+                self.reload_history.append({
+                    "timestamp": os.environ.get('MCP_REQUEST_ID', 'unknown'),
+                    "reloaded": reloaded,
+                    "failed": failed
+                })
+
+                # Build response
+                response = "🔄 **Code Reload Results**\n\n"
+
+                if reloaded:
+                    response += f"**Successfully Reloaded ({len(reloaded)}):**\n"
+                    for module in reloaded:
+                        response += f"- ✅ {module}\n"
+                    response += "\n"
+
+                if failed:
+                    response += f"**Failed to Reload ({len(failed)}):**\n"
+                    for module, error in failed:
+                        response += f"- ❌ {module}: {error}\n"
+                    response += "\n"
+
+                response += "**Important Notes:**\n"
+                response += "- Class instances created before reload keep old code\n"
+                response += "- New requests will use the reloaded code\n"
+                response += "- Some changes may require full restart (e.g., new tools)\n"
+
+                return response
+
+            except Exception as e:
+                logger.error(f"Code reload failed: {e}", exc_info=True)
+                return f"❌ Code reload failed: {str(e)}"
 
     def _update_global_references(self, module_name: str, new_module):
         """Update global references after module reload."""
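The "Important Notes" lines reflect a standard importlib.reload caveat: reloading rebinds the names inside the module object, but instances created before the reload still reference the old class objects. A small illustration (mymodule and Widget are hypothetical):

    import importlib
    import sys

    import mymodule                    # hypothetical module defining class Widget
    w_old = mymodule.Widget()

    importlib.reload(sys.modules['mymodule'])

    w_new = mymodule.Widget()
    print(type(w_old) is type(w_new))  # False: w_old still uses the pre-reload class

This is also why the hunk stores old_module before reloading: keeping a reference to the previous module object makes a rollback possible if the reloaded code misbehaves.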
@@ -171,8 +251,8 @@ class CodeReloader:
         """Get the current reload status and history."""
 
         try:
-            # Check for changed files
-            changed = self.
+            # Check for changed files (WITHOUT updating hashes)
+            changed = self._detect_changed_modules()
 
             response = "📊 **Code Reload Status**\n\n"
 
@@ -224,6 +304,24 @@ class CodeReloader:
             logger.error(f"Failed to clear cache: {e}", exc_info=True)
             return f"❌ Failed to clear cache: {str(e)}"
 
+    async def force_update_hashes(self, ctx: Context) -> str:
+        """Force update all module hashes to current state.
+
+        This is useful when you want to mark all current code as 'baseline'
+        without actually reloading anything.
+        """
+        try:
+            await ctx.debug("Force updating all module hashes...")
+
+            # Update all module hashes
+            self._update_module_hashes(modules=None)
+
+            return f"✅ Force updated hashes for all {len(self.module_hashes)} tracked modules"
+
+        except Exception as e:
+            logger.error(f"Failed to force update hashes: {e}", exc_info=True)
+            return f"❌ Failed to force update hashes: {str(e)}"
+
 
 def register_code_reload_tool(mcp, get_embedding_manager):
     """Register the code reloading tool with the MCP server."""
@@ -257,6 +355,8 @@ def register_code_reload_tool(mcp, get_embedding_manager):
 
         Shows which files have been modified since last reload and
         the history of recent reload operations.
+
+        Note: This only checks for changes, it does not update the stored hashes.
         """
         return await reloader.get_reload_status(ctx)
 
@@ -267,5 +367,14 @@ def register_code_reload_tool(mcp, get_embedding_manager):
         Useful when reload isn't working due to cached bytecode.
         """
         return await reloader.clear_python_cache(ctx)
+
+    @mcp.tool()
+    async def force_update_module_hashes(ctx: Context) -> str:
+        """Force update all module hashes to mark current code as baseline.
+
+        Use this when you want to ignore current changes and treat
+        the current state as the new baseline without reloading.
+        """
+        return await reloader.force_update_hashes(ctx)
 
-logger.info("Code reload tools registered successfully")
+logger.info("Code reload tools registered successfully")
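A sketch of driving the new baseline method directly, outside the MCP server, with a stub standing in for FastMCP's Context (the stub and the module name in the import are assumptions; these methods only await ctx.debug):

    import asyncio
    from code_reload import CodeReloader  # module name assumed; the diff does not show file names

    class StubCtx:
        async def debug(self, msg: str) -> None:
            print(f"[debug] {msg}")

    async def main() -> None:
        reloader = CodeReloader()
        # Mark everything currently on disk as the baseline without reloading
        print(await reloader.force_update_hashes(StubCtx()))

    asyncio.run(main())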
@@ -8,6 +8,7 @@ import time
 from typing import List, Dict, Any, Optional, Tuple
 from datetime import datetime
 import logging
+from .safe_getters import safe_get_list, safe_get_str
 
 logger = logging.getLogger(__name__)
 
@@ -176,9 +177,9 @@ async def search_single_collection(
                     'collection_name': collection_name,
                     'raw_payload': point.payload,  # Renamed from 'payload' for consistency
                     'code_patterns': point.payload.get('code_patterns'),
-                    'files_analyzed': point.payload
-                    'tools_used':
-                    'concepts': point.payload
+                    'files_analyzed': safe_get_list(point.payload, 'files_analyzed'),
+                    'tools_used': safe_get_list(point.payload, 'tools_used'),
+                    'concepts': safe_get_list(point.payload, 'concepts')
                 }
                 results.append(search_result)
             else:
@@ -219,9 +220,9 @@ async def search_single_collection(
                     'collection_name': collection_name,
                     'raw_payload': point.payload,
                     'code_patterns': point.payload.get('code_patterns'),
-                    'files_analyzed': point.payload
-                    'tools_used':
-                    'concepts': point.payload
+                    'files_analyzed': safe_get_list(point.payload, 'files_analyzed'),
+                    'tools_used': safe_get_list(point.payload, 'tools_used'),
+                    'concepts': safe_get_list(point.payload, 'concepts')
                 }
                 results.append(search_result)
 
@@ -5,6 +5,7 @@ import time
 from datetime import datetime, timezone
 from typing import List, Dict, Any, Optional
 import logging
+from .safe_getters import safe_get_list, safe_get_str
 
 logger = logging.getLogger(__name__)
 
@@ -114,16 +115,19 @@ def format_search_results_rich(
     concept_frequency = {}
 
     for result in results:
-        # Count file modifications
-        [old loop line not preserved]
+        # Count file modifications - using safe_get_list for consistency
+        files = safe_get_list(result, 'files_analyzed')
+        for file in files:
             file_frequency[file] = file_frequency.get(file, 0) + 1
 
-        # Count tool usage
-        [old loop line not preserved]
+        # Count tool usage - using safe_get_list for consistency
+        tools = safe_get_list(result, 'tools_used')
+        for tool in tools:
            tool_frequency[tool] = tool_frequency.get(tool, 0) + 1
 
-        # Count concepts
-        [old loop line not preserved]
+        # Count concepts - using safe_get_list for consistency
+        concepts = safe_get_list(result, 'concepts')
+        for concept in concepts:
             concept_frequency[concept] = concept_frequency.get(concept, 0) + 1
 
     # Show most frequently modified files
@@ -0,0 +1,217 @@
+"""Safe getter utilities for handling None values consistently."""
+
+import logging
+from typing import Any, Dict, List, Optional, Set, Union
+
+logger = logging.getLogger(__name__)
+
+
+def safe_get_list(
+    data: Optional[Dict[str, Any]],
+    key: str,
+    default: Optional[List] = None
+) -> List[Any]:
+    """
+    Safely get a list field from a dictionary, handling None and non-list values.
+
+    Args:
+        data: Dictionary to get value from (can be None)
+        key: Key to retrieve
+        default: Default value if key not found or value is None
+
+    Returns:
+        A list, either the value, converted value, or default/empty list
+    """
+    if data is None:
+        return default if default is not None else []
+
+    value = data.get(key)
+
+    if value is None:
+        return default if default is not None else []
+
+    # Handle sets and tuples by converting to list
+    if isinstance(value, (set, tuple)):
+        return list(value)
+
+    # If it's already a list, return it
+    if isinstance(value, list):
+        return value
+
+    # If it's not a list-like type, log warning and return empty list
+    logger.warning(
+        f"Expected list-like type for key '{key}', got {type(value).__name__}. "
+        f"Value: {repr(value)[:100]}"
+    )
+    return default if default is not None else []
+
+
+def safe_get_str(
+    data: Optional[Dict[str, Any]],
+    key: str,
+    default: str = ""
+) -> str:
+    """
+    Safely get a string field from a dictionary.
+
+    Args:
+        data: Dictionary to get value from (can be None)
+        key: Key to retrieve
+        default: Default value if key not found or value is None
+
+    Returns:
+        A string, either the value or the default
+    """
+    if data is None:
+        return default
+
+    value = data.get(key)
+
+    if value is None:
+        return default
+
+    # Convert to string if needed
+    return str(value)
+
+
+def safe_get_dict(
+    data: Optional[Dict[str, Any]],
+    key: str,
+    default: Optional[Dict] = None
+) -> Dict[str, Any]:
+    """
+    Safely get a dictionary field from another dictionary.
+
+    Args:
+        data: Dictionary to get value from (can be None)
+        key: Key to retrieve
+        default: Default value if key not found or value is None
+
+    Returns:
+        A dictionary, either the value or the default/empty dict
+    """
+    if data is None:
+        return default if default is not None else {}
+
+    value = data.get(key)
+
+    if value is None:
+        return default if default is not None else {}
+
+    if isinstance(value, dict):
+        return value
+
+    logger.warning(
+        f"Expected dict for key '{key}', got {type(value).__name__}. "
+        f"Value: {repr(value)[:100]}"
+    )
+    return default if default is not None else {}
+
+
+def safe_get_float(
+    data: Optional[Dict[str, Any]],
+    key: str,
+    default: float = 0.0
+) -> float:
+    """
+    Safely get a float field from a dictionary.
+
+    Args:
+        data: Dictionary to get value from (can be None)
+        key: Key to retrieve
+        default: Default value if key not found or value is None/non-numeric
+
+    Returns:
+        A float, either the converted value or the default
+    """
+    if data is None:
+        return default
+
+    value = data.get(key)
+
+    if value is None:
+        return default
+
+    try:
+        return float(value)
+    except (TypeError, ValueError) as e:
+        logger.warning(
+            f"Could not convert key '{key}' value to float: {repr(value)[:100]}. "
+            f"Error: {e}"
+        )
+        return default
+
+
+def safe_get_int(
+    data: Optional[Dict[str, Any]],
+    key: str,
+    default: int = 0
+) -> int:
+    """
+    Safely get an integer field from a dictionary.
+
+    Args:
+        data: Dictionary to get value from (can be None)
+        key: Key to retrieve
+        default: Default value if key not found or value is None/non-numeric
+
+    Returns:
+        An integer, either the converted value or the default
+    """
+    if data is None:
+        return default
+
+    value = data.get(key)
+
+    if value is None:
+        return default
+
+    try:
+        return int(value)
+    except (TypeError, ValueError) as e:
+        logger.warning(
+            f"Could not convert key '{key}' value to int: {repr(value)[:100]}. "
+            f"Error: {e}"
+        )
+        return default
+
+
+def safe_get_bool(
+    data: Optional[Dict[str, Any]],
+    key: str,
+    default: bool = False
+) -> bool:
+    """
+    Safely get a boolean field from a dictionary.
+
+    Args:
+        data: Dictionary to get value from (can be None)
+        key: Key to retrieve
+        default: Default value if key not found or value is None
+
+    Returns:
+        A boolean, either the value or the default
+    """
+    if data is None:
+        return default
+
+    value = data.get(key)
+
+    if value is None:
+        return default
+
+    if isinstance(value, bool):
+        return value
+
+    # Handle string booleans
+    if isinstance(value, str):
+        return value.lower() in ('true', '1', 'yes', 'on')
+
+    # Handle numeric booleans
+    try:
+        return bool(int(value))
+    except (TypeError, ValueError):
+        logger.warning(
+            f"Could not convert key '{key}' value to bool: {repr(value)[:100]}"
+        )
+        return default
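A quick usage sketch of the new helpers against a payload mixing missing, None, and wrongly-typed fields (the payload is made up; inside the package the import is relative):

    from safe_getters import safe_get_list, safe_get_str, safe_get_bool

    payload = {'tools_used': None, 'concepts': ('a', 'b'), 'score': 42}

    safe_get_list(payload, 'tools_used')      # [] - None collapses to the default
    safe_get_list(payload, 'concepts')        # ['a', 'b'] - tuple converted to list
    safe_get_list(payload, 'files_analyzed')  # [] - missing key
    safe_get_str(payload, 'score')            # '42' - coerced to str
    safe_get_bool({'flag': 'yes'}, 'flag')    # True - string booleans recognized
    safe_get_list(None, 'anything')           # [] - a None payload is safe too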
@@ -20,6 +20,26 @@ from .rich_formatting import format_search_results_rich
 logger = logging.getLogger(__name__)
 
 
+def is_searchable_collection(name: str) -> bool:
+    """
+    Check if collection name matches searchable patterns.
+    Supports both v3 and v4 collection naming conventions.
+    """
+    return (
+        # v3 patterns
+        name.endswith('_local')
+        or name.endswith('_voyage')
+        # v4 patterns
+        or name.endswith('_384d')   # Local v4 collections
+        or name.endswith('_1024d')  # Cloud v4 collections
+        or '_cloud_' in name        # Cloud v4 intermediate naming
+        # Reflections
+        or name.startswith('reflections')
+        # CSR prefixed collections
+        or name.startswith('csr_')
+    )
+
+
 class SearchTools:
     """Handles all search operations for the MCP server."""
 
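The helper replaces a name filter that the removed lines below show was duplicated across four call sites. For example (collection names are illustrative):

    is_searchable_collection('conv_abc_local')      # True  (v3 local)
    is_searchable_collection('conv_abc_384d')       # True  (v4 local)
    is_searchable_collection('reflections_voyage')  # True  (reflections)
    is_searchable_collection('csr_proj_1024d')      # True  (csr_ prefix)
    is_searchable_collection('internal_metadata')   # False (no pattern matches)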
@@ -114,6 +134,11 @@
         # Convert results to dict format
         results = []
         for result in search_results:
+            # Guard against None payload
+            if result.payload is None:
+                logger.warning(f"Result in {collection_name} has None payload, skipping")
+                continue
+
             results.append({
                 'conversation_id': result.payload.get('conversation_id'),
                 'timestamp': result.payload.get('timestamp'),
@@ -274,10 +299,10 @@
             return "<search_results><message>No collections available</message></search_results>"
 
         # Include both conversation collections and reflection collections
+        # Use module-level function for consistency
        filtered_collections = [
             c for c in collections
-            if (c.name
-                c.name.startswith('reflections'))
+            if is_searchable_collection(c.name)
         ]
         await ctx.debug(f"Searching across {len(filtered_collections)} collections")
 
@@ -403,8 +428,7 @@
         # Include both conversation collections and reflection collections
         filtered_collections = [
             c for c in collections
-            if (c.name
-                c.name.startswith('reflections'))
+            if is_searchable_collection(c.name)
         ]
 
         # Quick PARALLEL count across collections
@@ -493,8 +517,7 @@
         # Include both conversation collections and reflection collections
         filtered_collections = [
             c for c in collections
-            if (c.name
-                c.name.startswith('reflections'))
+            if is_searchable_collection(c.name)
         ]
 
         # Gather results for summary using PARALLEL search
@@ -590,8 +613,7 @@
         # Include both conversation collections and reflection collections
         filtered_collections = [
             c for c in collections
-            if (c.name
-                c.name.startswith('reflections'))
+            if is_searchable_collection(c.name)
         ]
 
         # Gather all results using PARALLEL search