claude-self-reflect 5.0.2 → 5.0.5

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,262 @@
+ """
+ Metadata extractor using message processors to reduce complexity.
+ Refactored from extract_metadata_single_pass function.
+ """
+
+ import json
+ import os
+ import logging
+ from pathlib import Path
+ from typing import Dict, Any, Tuple, Optional
+ from datetime import datetime
+
+ from message_processors import (
+     MessageProcessorFactory,
+     extract_concepts,
+     MAX_CONCEPT_MESSAGES,
+     MAX_FILES_ANALYZED,
+     MAX_FILES_EDITED,
+     MAX_TOOLS_USED,
+     MAX_AST_ELEMENTS
+ )
+
+ logger = logging.getLogger(__name__)
+
+
+ class MetadataExtractor:
+     """Extract metadata from JSONL conversation files."""
+
+     def __init__(self):
+         self.processor_factory = MessageProcessorFactory()
+
+     def extract_metadata_from_file(self, file_path: str) -> Tuple[Dict[str, Any], str, int]:
+         """
+         Extract metadata from a JSONL file in a single pass.
+         Returns: (metadata, first_timestamp, message_count)
+         """
+         metadata = self._initialize_metadata()
+         first_timestamp = None
+         message_count = 0
+         all_text = []
+
+         try:
+             with open(file_path, 'r', encoding='utf-8') as f:
+                 for line in f:
+                     if not line.strip():
+                         continue
+
+                     result = self._process_line(line, metadata)
+                     if result:
+                         text_content, is_message = result
+
+                         # Update timestamp and counts
+                         if first_timestamp is None:
+                             first_timestamp = self._extract_timestamp(line)
+
+                         if is_message:
+                             message_count += 1
+
+                         if text_content:
+                             # Limit text accumulation to prevent memory issues
+                             if len(all_text) < MAX_CONCEPT_MESSAGES:
+                                 all_text.append(text_content[:1000])
+
+         except (IOError, OSError) as e:
+             logger.warning(f"Error reading file {file_path}: {e}")
+         except (json.JSONDecodeError, ValueError) as e:
+             logger.warning(f"Error parsing JSON in {file_path}: {e}")
+         except Exception as e:
+             logger.error(f"Unexpected error extracting metadata from {file_path}: {e}")
+
+         # Post-process collected data
+         self._post_process_metadata(metadata, all_text, file_path)
+
+         # Apply limits to arrays
+         self._apply_metadata_limits(metadata)
+
+         return metadata, first_timestamp or datetime.now().isoformat(), message_count
+
+     def _initialize_metadata(self) -> Dict[str, Any]:
+         """Initialize empty metadata structure."""
+         return {
+             "files_analyzed": [],
+             "files_edited": [],
+             "tools_used": [],
+             "concepts": [],
+             "ast_elements": [],
+             "has_code_blocks": False,
+             "total_messages": 0,
+             "project_path": None,
+             "pattern_analysis": {},
+             "avg_quality_score": 0.0
+         }
+
+     def _process_line(self, line: str, metadata: Dict[str, Any]) -> Optional[Tuple[str, bool]]:
+         """
+         Process a single line from the JSONL file.
+         Returns: (text_content, is_message) or None
+         """
+         try:
+             data = json.loads(line)
+
+             # Extract project path from cwd
+             if metadata["project_path"] is None and 'cwd' in data:
+                 metadata["project_path"] = data.get('cwd')
+
+             # Handle message entries
+             if 'message' in data and data['message']:
+                 return self._process_message_entry(data['message'], metadata)
+
+             # Handle top-level tool entries
+             entry_type = data.get('type')
+             if entry_type in ('tool_result', 'tool_use'):
+                 return self._process_tool_entry(data, metadata)
+
+         except json.JSONDecodeError:
+             # Expected for non-JSON lines, skip silently
+             pass
+         except (KeyError, TypeError, ValueError) as e:
+             # Log specific parsing errors for debugging
+             logger.debug(f"Error parsing line: {e}")
+
+         return None
+
+     def _process_message_entry(self, message: Dict[str, Any], metadata: Dict[str, Any]) -> Optional[Tuple[str, bool]]:
+         """Process a message entry."""
+         role = message.get('role')
+         content = message.get('content')
+
+         if not role or not content:
+             return None
+
+         # Check if it's a countable message
+         is_user_or_assistant = role in ['user', 'assistant']
+
+         # Process content
+         text_content = self.processor_factory.process_content(content, metadata)
+
+         return text_content, is_user_or_assistant
+
+     def _process_tool_entry(self, data: Dict[str, Any], metadata: Dict[str, Any]) -> Optional[Tuple[str, bool]]:
+         """Process a top-level tool entry."""
+         entry_type = data.get('type')
+         text_parts = []
+
+         if entry_type == 'tool_use':
+             tool_name = data.get('name', 'unknown')
+             tool_input = str(data.get('input', ''))[:500]
+             text_parts.append(f"[Tool: {tool_name}] {tool_input}")
+
+             # Track tool usage
+             if tool_name and tool_name not in metadata['tools_used']:
+                 metadata['tools_used'].append(tool_name)
+
+         elif entry_type == 'tool_result':
+             result_content = self._extract_tool_result_content(data)
+             text_parts.append(f"[Result] {result_content[:1000]}")
+
+         content = "\n".join(text_parts)
+         # Tool entries should not count as messages (only user/assistant messages count)
+         return (content, False) if content else None
+
+     def _extract_tool_result_content(self, data: Dict[str, Any]) -> str:
+         """Extract content from tool result data."""
+         result_content = data.get('content')
+
+         if isinstance(result_content, list):
+             flat = []
+             for item in result_content:
+                 if isinstance(item, dict) and item.get('type') == 'text':
+                     flat.append(item.get('text', ''))
+                 elif isinstance(item, str):
+                     flat.append(item)
+             result_content = "\n".join(flat)
+
+         if not result_content:
+             result_content = data.get('result', '')
+
+         return str(result_content)
+
+     def _extract_timestamp(self, line: str) -> Optional[str]:
+         """Extract timestamp from a line if present."""
+         try:
+             data = json.loads(line)
+             return data.get('timestamp')
+         except (json.JSONDecodeError, TypeError) as e:
+             logger.debug(f"Failed to extract timestamp: {e}")
+             return None
+
+     def _post_process_metadata(self, metadata: Dict[str, Any], all_text: list, file_path: str):
+         """Post-process collected metadata."""
+         # Extract concepts from collected text
+         if all_text:
+             combined_text = ' '.join(all_text[:MAX_CONCEPT_MESSAGES])
+             metadata['concepts'] = extract_concepts(combined_text)
+
+         # Run AST-GREP pattern analysis if available
+         self._run_pattern_analysis(metadata)
+
+     def _run_pattern_analysis(self, metadata: Dict[str, Any]):
+         """Run AST-GREP pattern analysis on mentioned files."""
+         pattern_quality = {}
+         avg_quality_score = 0.0
+
+         try:
+             # Update patterns first
+             from update_patterns import check_and_update_patterns
+             check_and_update_patterns()
+
+             # Import analyzer
+             from ast_grep_final_analyzer import FinalASTGrepAnalyzer
+             analyzer = FinalASTGrepAnalyzer()
+
+             # Analyze files
+             files_to_analyze = list(set(
+                 metadata['files_edited'] + metadata['files_analyzed'][:10]
+             ))
+             quality_scores = []
+
+             for file_path in files_to_analyze:
+                 # Expand file path for proper checking
+                 expanded_path = os.path.expanduser(file_path) if file_path.startswith('~') else file_path
+                 if self._is_code_file(expanded_path) and os.path.exists(expanded_path):
+                     try:
+                         result = analyzer.analyze_file(expanded_path)
+                         metrics = result['quality_metrics']
+                         pattern_quality[file_path] = {
+                             'score': metrics['quality_score'],
+                             'good_patterns': metrics['good_patterns_found'],
+                             'bad_patterns': metrics['bad_patterns_found'],
+                             'issues': metrics['total_issues']
+                         }
+                         quality_scores.append(metrics['quality_score'])
+                     except (IOError, OSError) as e:
+                         logger.debug(f"Could not read file {file_path}: {e}")
+                     except (KeyError, ValueError) as e:
+                         logger.debug(f"Error parsing AST results for {file_path}: {e}")
+                     except Exception as e:
+                         logger.warning(f"Unexpected error analyzing {file_path}: {e}")
+
+             # Calculate average quality
+             if quality_scores:
+                 avg_quality_score = sum(quality_scores) / len(quality_scores)
+
+         except Exception as e:
+             logger.debug(f"AST analysis not available: {e}")
+
+         metadata['pattern_analysis'] = pattern_quality
+         metadata['avg_quality_score'] = round(avg_quality_score, 3)
+
+     def _is_code_file(self, file_path: str) -> bool:
+         """Check if file is a code file."""
+         if not file_path:
+             return False
+         extensions = ['.py', '.ts', '.js', '.tsx', '.jsx']
+         return any(file_path.endswith(ext) for ext in extensions)
+
+     def _apply_metadata_limits(self, metadata: Dict[str, Any]):
+         """Apply size limits to metadata arrays."""
+         metadata['files_analyzed'] = metadata['files_analyzed'][:MAX_FILES_ANALYZED]
+         metadata['files_edited'] = metadata['files_edited'][:MAX_FILES_EDITED]
+         metadata['tools_used'] = metadata['tools_used'][:MAX_TOOLS_USED]
+         metadata['ast_elements'] = metadata['ast_elements'][:MAX_AST_ELEMENTS]
@@ -647,6 +647,8 @@ if __name__ == "__main__":
      parser.add_argument('--project-name', help='Name of the project for cache file')
      parser.add_argument('--use-tracker', action='store_true',
                          help='Use session edit tracker for analysis')
+     parser.add_argument('--update-cache-only', action='store_true',
+                         help='Only update cache without printing report')
      args = parser.parse_args()

      # If external project specified, change to that directory
@@ -658,4 +660,12 @@ if __name__ == "__main__":
          # This will be used in the main() function for cache naming
          os.environ['QUALITY_PROJECT_NAME'] = args.project_name

+     # For cache-only mode, suppress output
+     if args.update_cache_only:
+         # Redirect logger to null
+         import os
+         import sys
+         sys.stdout = open(os.devnull, 'w')
+         sys.stderr = open(os.devnull, 'w')
+
      main(use_tracker=args.use_tracker)
@@ -21,7 +21,7 @@ import logging
  import sys
  from pathlib import Path
  from datetime import datetime, timedelta, timezone
- from typing import Dict, Any, Optional, List, Set
+ from typing import Dict, Any, Optional, List, Set, Union
  from contextlib import contextmanager

  # Try to import filelock, fall back to platform-specific implementation
@@ -62,14 +62,17 @@ class UnifiedStateManager:
      LOCK_TIMEOUT = 5.0
      LOCK_EXPIRY = timedelta(seconds=30)

-     def __init__(self, state_file: Optional[Path] = None):
+     def __init__(self, state_file: Optional[Union[Path, str]] = None):
          """
          Initialize the unified state manager.

          Args:
              state_file: Path to the state file (defaults to ~/.claude-self-reflect/config/unified-state.json)
          """
-         self.state_file = state_file or Path.home() / ".claude-self-reflect" / "config" / "unified-state.json"
+         if state_file:
+             self.state_file = Path(state_file) if isinstance(state_file, str) else state_file
+         else:
+             self.state_file = Path.home() / ".claude-self-reflect" / "config" / "unified-state.json"
          self.lock_file = self.state_file.with_suffix('.lock')
          self.temp_file = self.state_file.with_suffix('.tmp')
          self._file_lock = None
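The signature change above widens `state_file` to accept either a `str` or a `Path`; both are normalized to a `Path` before the lock and temp file paths are derived. A small sketch of the calling convention, assuming an importable module name (not shown in this hunk):

```python
# Sketch only; the import path is an assumption for illustration.
from pathlib import Path
from unified_state_manager import UnifiedStateManager  # hypothetical module name

# A plain string and a Path now behave the same way.
mgr_from_str = UnifiedStateManager("/tmp/unified-state.json")
mgr_from_path = UnifiedStateManager(Path("/tmp/unified-state.json"))

# Omitting the argument keeps the documented default location.
mgr_default = UnifiedStateManager()
assert mgr_default.state_file.name == "unified-state.json"
```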
@@ -127,7 +130,7 @@ class UnifiedStateManager:
          if HAS_FILELOCK:
              lock = filelock.FileLock(str(self.lock_file), timeout=timeout)
              try:
-                 with lock.acquire(timeout=timeout):
+                 with lock:
                      yield lock
              except filelock.Timeout:
                  raise TimeoutError(f"Could not acquire lock within {timeout} seconds")
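The change above drops the redundant `acquire(timeout=timeout)` call: the `FileLock` was already constructed with that timeout, so a bare `with lock:` acquires with the same value and still raises `filelock.Timeout` on failure, which the surrounding code converts to `TimeoutError`. A standalone sketch of the same filelock pattern, independent of this class:

```python
# Sketch of the filelock usage pattern, not package code.
import filelock

lock = filelock.FileLock("/tmp/example.lock", timeout=5.0)
try:
    with lock:  # acquires using the timeout passed at construction
        pass    # critical section goes here
except filelock.Timeout:
    raise TimeoutError("Could not acquire lock within 5.0 seconds")
```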
@@ -1,153 +0,0 @@
- #!/usr/bin/env python3
- """
- Test file with intentional quality issues for testing quality-fixer agent.
- This file contains patterns that should be fixed:
- - sync file operations that should be async
- - global variables
- - print statements
- - long functions
- """
-
- import os
- import json
- import asyncio
- import logging
- import aiofiles
- from typing import List, Dict, Any
-
- # Set up logger instead of print statements
- logger = logging.getLogger(__name__)
-
- # Configuration management class instead of global variables
- class ConfigManager:
-     def __init__(self):
-         self.config = None
-         self.counter = 0
-
- async def load_config(config_manager: ConfigManager) -> Dict[str, Any]:
-     """Load config using async file operations."""
-     # Async file operation using aiofiles
-     async with aiofiles.open("config.json", "r") as f:
-         content = await f.read()
-         config_manager.config = json.loads(content)
-
-     logger.info(f"Config loaded: {config_manager.config}")
-     return config_manager.config
-
- async def save_data(data: Dict[str, Any], config_manager: ConfigManager) -> None:
-     """Save data using async operations."""
-     config_manager.counter += 1
-
-     # Async file operation using aiofiles
-     async with aiofiles.open("data.json", "w") as f:
-         await f.write(json.dumps(data))
-
-     logger.info(f"Data saved, counter: {config_manager.counter}")
-
- def validate_items(items: List[str]) -> List[str]:
-     """Validate input items."""
-     valid_items = []
-     for item in items:
-         if not item:
-             logger.warning(f"Invalid item: {item}")
-             continue
-         valid_items.append(item)
-     return valid_items
-
- def process_items(items: List[str]) -> List[str]:
-     """Process each item."""
-     return [item.upper() for item in items]
-
- def filter_results(results: List[str]) -> List[str]:
-     """Filter results by length."""
-     return [result for result in results if len(result) > 3]
-
- def create_summary(items: List[str], results: List[str], filtered: List[str]) -> Dict[str, int]:
-     """Create processing summary."""
-     return {
-         "total": len(items),
-         "processed": len(results),
-         "filtered": len(filtered)
-     }
-
- async def save_results(filtered: List[str]) -> None:
-     """Save results to file asynchronously."""
-     async with aiofiles.open("results.txt", "w") as f:
-         for item in filtered:
-             await f.write(f"{item}\n")
-
- async def process_items_improved(items: List[str], config_manager: ConfigManager) -> Dict[str, Any]:
-     """Improved function broken down into smaller functions."""
-     # Step 1: Validate items
-     valid_items = validate_items(items)
-
-     # Step 2: Process each item
-     results = process_items(valid_items)
-
-     # Step 3: Filter results
-     filtered = filter_results(results)
-
-     # Step 4: Sort results
-     filtered.sort()
-
-     # Step 5: Create summary
-     summary = create_summary(items, results, filtered)
-
-     # Step 6: Log summary
-     logger.info(f"Processing complete: {summary}")
-
-     # Step 7: Save results asynchronously
-     await save_results(filtered)
-
-     # Step 8: Update counter
-     config_manager.counter += len(filtered)
-
-     # Step 9: Create report
-     report = {
-         "summary": summary,
-         "results": filtered,
-         "counter": config_manager.counter
-     }
-
-     return report
-
- async def debug_function() -> None:
-     """Function with debug statements."""
-     logger.debug("Debug: Starting function")
-
-     # Reading file asynchronously
-     if os.path.exists("debug.log"):
-         async with aiofiles.open("debug.log", "r") as f:
-             log_data = await f.read()
-             logger.debug(f"Log data: {log_data}")
-
-     logger.debug("Debug: Function complete")
-
- # Using var instead of let/const (for JS patterns if analyzed)
- var_example = "This would be flagged in JS"
-
- async def main() -> None:
-     """Main execution function."""
-     # Set up logging
-     logging.basicConfig(level=logging.INFO)
-
-     # Initialize config manager
-     config_manager = ConfigManager()
-
-     logger.info("Starting application...")
-
-     try:
-         # Note: These operations would fail without actual files, but structure is correct
-         await load_config(config_manager)
-         await process_items_improved(["test", "data", "example"], config_manager)
-         await debug_function()
-     except FileNotFoundError:
-         logger.warning("Required files not found - this is expected in test context")
-     except Exception as e:
-         logger.error(f"Application error: {e}")
-
-     logger.info("Application complete!")
-
- if __name__ == "__main__":
-     # Run async main function
-     asyncio.run(main())