claude-self-reflect 3.2.4 → 3.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (33)
  1. package/.claude/agents/claude-self-reflect-test.md +595 -528
  2. package/.claude/agents/reflection-specialist.md +59 -3
  3. package/README.md +14 -5
  4. package/mcp-server/run-mcp.sh +49 -5
  5. package/mcp-server/src/app_context.py +64 -0
  6. package/mcp-server/src/config.py +57 -0
  7. package/mcp-server/src/connection_pool.py +286 -0
  8. package/mcp-server/src/decay_manager.py +106 -0
  9. package/mcp-server/src/embedding_manager.py +64 -40
  10. package/mcp-server/src/embeddings_old.py +141 -0
  11. package/mcp-server/src/models.py +64 -0
  12. package/mcp-server/src/parallel_search.py +371 -0
  13. package/mcp-server/src/project_resolver.py +5 -0
  14. package/mcp-server/src/reflection_tools.py +206 -0
  15. package/mcp-server/src/rich_formatting.py +196 -0
  16. package/mcp-server/src/search_tools.py +826 -0
  17. package/mcp-server/src/server.py +127 -1720
  18. package/mcp-server/src/temporal_design.py +132 -0
  19. package/mcp-server/src/temporal_tools.py +597 -0
  20. package/mcp-server/src/temporal_utils.py +384 -0
  21. package/mcp-server/src/utils.py +150 -67
  22. package/package.json +10 -1
  23. package/scripts/add-timestamp-indexes.py +134 -0
  24. package/scripts/check-collections.py +29 -0
  25. package/scripts/debug-august-parsing.py +76 -0
  26. package/scripts/debug-import-single.py +91 -0
  27. package/scripts/debug-project-resolver.py +82 -0
  28. package/scripts/debug-temporal-tools.py +135 -0
  29. package/scripts/delta-metadata-update.py +547 -0
  30. package/scripts/import-conversations-unified.py +53 -2
  31. package/scripts/precompact-hook.sh +33 -0
  32. package/scripts/streaming-watcher.py +1443 -0
  33. package/scripts/utils.py +39 -0
@@ -0,0 +1,826 @@
1
+ """Search tools for Claude Self Reflect MCP server."""
2
+
3
+ import os
4
+ import json
5
+ import logging
6
+ import time
7
+ from typing import Optional, List, Dict, Any
8
+ from datetime import datetime, timezone
9
+ from pathlib import Path
10
+
11
+ from fastmcp import Context
12
+ from pydantic import Field
13
+ from qdrant_client import AsyncQdrantClient
14
+ from qdrant_client.models import PointStruct
15
+
16
+ from .parallel_search import parallel_search_collections
17
+ from .rich_formatting import format_search_results_rich
18
+
19
+ logger = logging.getLogger(__name__)
20
+
21
+
22
class SearchTools:
    """Handles all search operations for the MCP server.

    Acts as a dependency container: every collaborator (Qdrant client,
    embedding manager factory, decay settings, project resolver) is injected
    at construction time so the tool methods stay free of globals.
    """

    def __init__(
        self,
        qdrant_client: AsyncQdrantClient,
        qdrant_url: str,
        get_embedding_manager,
        normalize_project_name,
        enable_memory_decay: bool,
        decay_weight: float,
        decay_scale_days: float,
        use_native_decay: bool,
        native_decay_available: bool,
        decay_manager=None,
        project_resolver=None  # Add project resolver
    ):
        """Initialize search tools with dependencies.

        Args:
            qdrant_client: Async client used for all vector-store operations.
            qdrant_url: Base URL of the Qdrant instance.
            get_embedding_manager: Zero-arg callable returning the embedding manager.
            normalize_project_name: Callable that canonicalizes project names.
            enable_memory_decay: Whether time-based score decay is applied at all.
            decay_weight: Blend weight (0-1) of the decay factor vs. the raw score.
            decay_scale_days: Half-life of the exponential decay, in days.
            use_native_decay: Prefer Qdrant-native decay scoring when requested.
            native_decay_available: Whether the connected server supports native decay.
            decay_manager: Optional helper managing decay configuration.
            project_resolver: Optional resolver mapping a project name to its
                Qdrant collection names (used to scope searches).
        """
        self.qdrant_client = qdrant_client
        self.qdrant_url = qdrant_url
        self.get_embedding_manager = get_embedding_manager
        self.normalize_project_name = normalize_project_name
        self.enable_memory_decay = enable_memory_decay
        self.decay_weight = decay_weight
        self.decay_scale_days = decay_scale_days
        self.use_native_decay = use_native_decay
        self.native_decay_available = native_decay_available
        self.decay_manager = decay_manager
        self.project_resolver = project_resolver

    # Helper functions will be implemented as methods
53
+
54
+ def get_project_from_cwd(self, cwd: str) -> Optional[str]:
55
+ """Extract project name from current working directory."""
56
+ from pathlib import Path
57
+
58
+ path_parts = Path(cwd).parts
59
+ if 'projects' in path_parts:
60
+ idx = path_parts.index('projects')
61
+ if idx + 1 < len(path_parts):
62
+ return path_parts[idx + 1]
63
+ elif '.claude' in path_parts:
64
+ # If we're in a .claude directory, go up to find project
65
+ for i, part in enumerate(path_parts):
66
+ if part == '.claude' and i > 0:
67
+ return path_parts[i - 1]
68
+
69
+ # If still no project detected, use the last directory name
70
+ return Path(cwd).name
71
+
72
+ async def perform_search(
73
+ self,
74
+ ctx: Context,
75
+ query: str,
76
+ collection_name: str,
77
+ limit: int,
78
+ min_score: float
79
+ ) -> List[Dict[str, Any]]:
80
+ """Perform semantic search on a single collection."""
81
+ try:
82
+ # Generate embedding for query
83
+ embedding_manager = self.get_embedding_manager()
84
+
85
+ # Determine embedding type based on collection name
86
+ embedding_type = 'voyage' if collection_name.endswith('_voyage') else 'local'
87
+ query_embedding = await embedding_manager.generate_embedding(query, force_type=embedding_type)
88
+
89
+ # Search the collection
90
+ search_results = await self.qdrant_client.search(
91
+ collection_name=collection_name,
92
+ query_vector=query_embedding,
93
+ limit=limit,
94
+ score_threshold=min_score
95
+ )
96
+
97
+ # Convert results to dict format
98
+ results = []
99
+ for result in search_results:
100
+ results.append({
101
+ 'conversation_id': result.payload.get('conversation_id'),
102
+ 'timestamp': result.payload.get('timestamp'),
103
+ 'content': result.payload.get('content', ''),
104
+ 'score': result.score,
105
+ 'collection': collection_name,
106
+ 'payload': result.payload
107
+ })
108
+
109
+ return results
110
+
111
+ except Exception as e:
112
+ await ctx.debug(f"Error searching {collection_name}: {e}")
113
+ return []
114
+
115
+ def apply_decay_to_results(self, results: List[Dict], current_time: datetime) -> List[Dict]:
116
+ """Apply time-based decay to search results."""
117
+ if not self.enable_memory_decay:
118
+ return results
119
+
120
+ for result in results:
121
+ try:
122
+ # Parse timestamp
123
+ timestamp_str = result.get('timestamp')
124
+ if timestamp_str:
125
+ from datetime import datetime, timezone
126
+ timestamp = datetime.fromisoformat(timestamp_str.replace('Z', '+00:00'))
127
+
128
+ # Calculate age in days
129
+ age = (current_time - timestamp).total_seconds() / 86400
130
+
131
+ # Apply exponential decay
132
+ decay_factor = pow(2, -age / self.decay_scale_days)
133
+
134
+ # Adjust score
135
+ original_score = result['score']
136
+ result['score'] = original_score * (1 - self.decay_weight) + decay_factor * self.decay_weight
137
+ result['original_score'] = original_score
138
+ result['decay_factor'] = decay_factor
139
+
140
+ except Exception as e:
141
+ logger.warning(f"Error applying decay to result: {e}")
142
+
143
+ return results
144
+
145
+ def format_search_results(
146
+ self,
147
+ results: List[Dict],
148
+ query: str,
149
+ brief: bool = False,
150
+ include_raw: bool = False,
151
+ response_format: str = "xml"
152
+ ) -> str:
153
+ """Format search results for display."""
154
+ if not results:
155
+ return "<search_results><message>No matching conversations found</message></search_results>"
156
+
157
+ if response_format == "markdown":
158
+ output = f"# Search Results for: {query}\n\n"
159
+ for i, result in enumerate(results, 1):
160
+ output += f"## Result {i}\n"
161
+ output += f"**Score:** {result['score']:.3f}\n"
162
+ output += f"**Timestamp:** {result.get('timestamp', 'N/A')}\n"
163
+ output += f"**Conversation ID:** {result.get('conversation_id', 'N/A')}\n\n"
164
+ if not brief:
165
+ # Handle both 'content' and 'excerpt' fields
166
+ content = result.get('content', result.get('excerpt', ''))
167
+ output += f"**Content:**\n```\n{content[:500]}{'...' if len(content) > 500 else ''}\n```\n\n"
168
+ if include_raw:
169
+ output += f"**Raw Payload:**\n```json\n{json.dumps(result.get('payload', {}), indent=2)}\n```\n\n"
170
+ else:
171
+ # XML format (default)
172
+ output = f"<search_results>\n<query>{query}</query>\n<count>{len(results)}</count>\n"
173
+ for i, result in enumerate(results, 1):
174
+ output += f"<result index=\"{i}\">\n"
175
+ output += f" <score>{result['score']:.3f}</score>\n"
176
+ output += f" <timestamp>{result.get('timestamp', 'N/A')}</timestamp>\n"
177
+ output += f" <conversation_id>{result.get('conversation_id', 'N/A')}</conversation_id>\n"
178
+ if not brief:
179
+ # Handle both 'content' and 'excerpt' fields
180
+ content = result.get('content', result.get('excerpt', ''))
181
+ truncated = content[:500] + ('...' if len(content) > 500 else '')
182
+ output += f" <content><![CDATA[{truncated}]]></content>\n"
183
+ if include_raw:
184
+ output += f" <raw_payload>{json.dumps(result.get('payload', {}))}</raw_payload>\n"
185
+ output += "</result>\n"
186
+ output += "</search_results>"
187
+
188
+ return output
189
+
190
    async def reflect_on_past(
        self,
        ctx: Context,
        query: str,
        limit: int = 5,
        min_score: float = 0.3,
        use_decay: int = -1,
        project: Optional[str] = None,
        mode: str = "full",
        brief: bool = False,
        include_raw: bool = False,
        response_format: str = "xml"
    ) -> str:
        """Search for relevant past conversations using semantic search with optional time decay.

        Args:
            ctx: MCP request context (used for debug logging).
            query: Natural-language search query.
            limit: Maximum number of results to return after merging.
            min_score: Minimum similarity score per result.
            use_decay: 1 = apply decay, 0 = don't, -1 = environment default.
            project: Explicit project scope; None infers from CWD, 'all'
                searches every project.
            mode: 'full' (default), 'quick' (delegates to quick_search),
                or 'summary' (delegates to search_summary).
            brief: Minimal output for faster responses.
            include_raw: Include raw Qdrant payloads (debugging).
            response_format: 'xml' or 'markdown'.

        Returns:
            Formatted search results (XML or markdown), or an XML error blob.
        """

        await ctx.debug(f"Searching for: {query}, project={project}, mode={mode}, decay={use_decay}")

        try:
            # Track timing for performance metrics
            start_time = time.time()
            timing_info = {}

            # Determine project scope: explicit argument wins, otherwise
            # infer from the client's working directory.
            target_project = project
            if project is None:
                cwd = os.environ.get('MCP_CLIENT_CWD', os.getcwd())
                target_project = self.get_project_from_cwd(cwd)
                await ctx.debug(f"Inferred project from CWD: {target_project}")

            # Lightweight modes are handled by dedicated methods.
            if mode == "quick":
                return await self.quick_search(ctx, query, min_score, target_project)
            elif mode == "summary":
                return await self.search_summary(ctx, query, target_project)

            # Get relevant collections based on project
            await ctx.debug(f"Project resolver: {self.project_resolver is not None}, Target project: '{target_project}'")
            if self.project_resolver and target_project and target_project != 'all':
                # Use ProjectResolver to find matching collections
                collection_names = self.project_resolver.find_collections_for_project(target_project)
                await ctx.debug(f"ProjectResolver found {len(collection_names)} collections for '{target_project}'")

                # Intersect resolver output with collections that actually exist.
                collections_response = await self.qdrant_client.get_collections()
                all_collections = collections_response.collections
                filtered_collections = [
                    c for c in all_collections
                    if c.name in collection_names
                ]
                await ctx.debug(f"Filtered to {len(filtered_collections)} collections from {len(all_collections)} total")
            else:
                # No resolver / 'all' scope: every collection except the
                # reflections store.
                collections_response = await self.qdrant_client.get_collections()
                collections = collections_response.collections
                filtered_collections = [
                    c for c in collections
                    if not c.name.startswith('reflections')
                ]
                await ctx.debug(f"Searching across {len(filtered_collections)} collections")

            if not filtered_collections:
                return "<search_results><message>No collections found for the specified project</message></search_results>"

            # Perform PARALLEL search across collections to avoid freeze
            collection_names = [c.name for c in filtered_collections]
            await ctx.debug(f"Starting parallel search across {len(collection_names)} collections")

            # Closure adapter: parallel_search_collections expects a plain
            # async embedding function, not the manager object.
            embedding_manager = self.get_embedding_manager()
            async def generate_embedding_func(text: str, force_type: str = 'local'):
                return await embedding_manager.generate_embedding(text, force_type=force_type)

            # Track embedding generation timing
            timing_info['embedding_start'] = time.time()

            # Use parallel search to avoid sequential processing freeze
            all_results, search_timing = await parallel_search_collections(
                collections_to_search=collection_names,
                query=query,
                qdrant_client=self.qdrant_client,
                ctx=ctx,
                limit=limit * 2,  # Over-fetch so post-merge truncation still fills `limit`
                min_score=min_score,
                should_use_decay=use_decay == 1,
                target_project=target_project,
                generate_embedding_func=generate_embedding_func,
                constants={'DECAY_SCALE_DAYS': self.decay_scale_days},
                max_concurrent=10  # Limit concurrent searches to avoid overload
            )

            # Update timing info with search timing. Embeddings are generated
            # inside parallel_search, so embedding/search phases overlap here.
            timing_info['embedding_end'] = time.time()
            timing_info['search_all_start'] = timing_info.get('embedding_start', time.time())
            timing_info['search_all_end'] = time.time()
            # search_timing is a list of collection timings, not a dict

            await ctx.debug(f"Parallel search completed with {len(all_results)} total results")

            # Debug: Log some details about results
            if all_results:
                await ctx.debug(f"Top result score: {all_results[0]['score']:.4f}")
            else:
                await ctx.debug(f"No results found. Timing info: {timing_info}")

            if not all_results:
                return "<search_results><message>No matching conversations found</message></search_results>"

            # Merge: best-scored results across all collections, capped at `limit`.
            all_results.sort(key=lambda x: x['score'], reverse=True)
            final_results = all_results[:limit]

            # Use rich formatting for default XML format
            if response_format == "xml" and not brief:
                # Try to get indexing status for rich display
                indexing_status = None
                # TODO: Add indexing status retrieval here if needed

                return format_search_results_rich(
                    results=final_results,
                    query=query,
                    target_project=target_project,
                    collections_searched=len(collection_names),
                    timing_info=timing_info,
                    start_time=start_time,
                    brief=brief,
                    include_raw=include_raw,
                    indexing_status=indexing_status
                )
            else:
                # Fall back to standard formatting for markdown or brief mode
                return self.format_search_results(
                    final_results,
                    query,
                    brief=brief,
                    include_raw=include_raw,
                    response_format=response_format
                )

        except Exception as e:
            logger.error(f"Search failed: {e}", exc_info=True)
            return f"<search_results><error>Search failed: {str(e)}</error></search_results>"
331
+
332
    async def quick_search(
        self,
        ctx: Context,
        query: str,
        min_score: float = 0.3,
        project: Optional[str] = None
    ) -> str:
        """Quick search that returns only the count and top result for fast overview.

        Args:
            ctx: MCP request context (used for debug logging).
            query: Natural-language search query.
            min_score: Minimum similarity score to count as a match.
            project: Project scope; None infers from CWD, 'all' searches everything.

        Returns:
            A compact ``<quick_search>`` XML snippet with a collection-match
            count and a preview of the single best result.
        """

        await ctx.debug(f"Quick search for: {query}, project={project}")

        try:
            # Determine project scope: explicit argument wins, otherwise
            # infer from the client's working directory.
            target_project = project
            if project is None:
                cwd = os.environ.get('MCP_CLIENT_CWD', os.getcwd())
                target_project = self.get_project_from_cwd(cwd)

            # Get collections based on project
            if self.project_resolver and target_project and target_project != 'all':
                # Use ProjectResolver to find matching collections
                collection_names = self.project_resolver.find_collections_for_project(target_project)
                collections_response = await self.qdrant_client.get_collections()
                all_collections = collections_response.collections
                filtered_collections = [
                    c for c in all_collections
                    if c.name in collection_names
                ]
            else:
                # Use all collections except reflections
                collections_response = await self.qdrant_client.get_collections()
                collections = collections_response.collections
                filtered_collections = [
                    c for c in collections
                    if not c.name.startswith('reflections')
                ]

            # Quick PARALLEL count across collections
            collection_names = [c.name for c in filtered_collections]

            # Closure adapter for the parallel search helper.
            embedding_manager = self.get_embedding_manager()
            async def generate_embedding_func(text: str, force_type: str = 'local'):
                return await embedding_manager.generate_embedding(text, force_type=force_type)

            # Use parallel search for quick check
            all_results, _ = await parallel_search_collections(
                collections_to_search=collection_names,
                query=query,
                qdrant_client=self.qdrant_client,
                ctx=ctx,
                limit=1,  # Only need top result from each collection
                min_score=min_score,
                should_use_decay=False,  # Quick search doesn't use decay
                target_project=target_project,
                generate_embedding_func=generate_embedding_func,
                constants={'DECAY_SCALE_DAYS': self.decay_scale_days},
                max_concurrent=20  # Higher concurrency for quick search
            )

            # Count distinct collections that produced a hit (results may carry
            # either 'collection_name' or 'collection'), then pick the single
            # best-scoring result overall.
            collections_with_matches = len(set(r.get('collection_name', r.get('collection', '')) for r in all_results))
            top_result = max(all_results, key=lambda x: x.get('score', 0)) if all_results else None
            top_score = top_result.get('score', 0) if top_result else 0  # NOTE(review): currently unused

            # Format quick search response
            if not top_result:
                return "<quick_search><count>0</count><message>No matches found</message></quick_search>"

            return f"""<quick_search>
<count>{collections_with_matches} collections with matches</count>
<top_result>
<score>{top_result['score']:.3f}</score>
<timestamp>{top_result.get('timestamp', 'N/A')}</timestamp>
<preview>{top_result.get('excerpt', top_result.get('content', ''))[:200]}...</preview>
</top_result>
</quick_search>"""

        except Exception as e:
            logger.error(f"Quick search failed: {e}", exc_info=True)
            return f"<quick_search><error>Quick search failed: {str(e)}</error></quick_search>"
413
+
414
+ async def search_summary(
415
+ self,
416
+ ctx: Context,
417
+ query: str,
418
+ project: Optional[str] = None
419
+ ) -> str:
420
+ """Get aggregated insights from search results without individual result details."""
421
+
422
+ await ctx.debug(f"Getting search summary for: {query}, project={project}")
423
+
424
+ try:
425
+ # Determine project scope
426
+ target_project = project
427
+ if project is None:
428
+ cwd = os.environ.get('MCP_CLIENT_CWD', os.getcwd())
429
+ target_project = self.get_project_from_cwd(cwd)
430
+
431
+ # Get collections based on project
432
+ if self.project_resolver and target_project and target_project != 'all':
433
+ # Use ProjectResolver to find matching collections
434
+ collection_names = self.project_resolver.find_collections_for_project(target_project)
435
+ collections_response = await self.qdrant_client.get_collections()
436
+ all_collections = collections_response.collections
437
+ filtered_collections = [
438
+ c for c in all_collections
439
+ if c.name in collection_names
440
+ ]
441
+ else:
442
+ # Use all collections except reflections
443
+ collections_response = await self.qdrant_client.get_collections()
444
+ collections = collections_response.collections
445
+ filtered_collections = [
446
+ c for c in collections
447
+ if not c.name.startswith('reflections')
448
+ ]
449
+
450
+ # Gather results for summary using PARALLEL search
451
+ collection_names = [c.name for c in filtered_collections]
452
+
453
+ # Create embedding function wrapper
454
+ embedding_manager = self.get_embedding_manager()
455
+ async def generate_embedding_func(text: str, force_type: str = 'local'):
456
+ return await embedding_manager.generate_embedding(text, force_type=force_type)
457
+
458
+ # Use parallel search for summary
459
+ all_results, _ = await parallel_search_collections(
460
+ collections_to_search=collection_names,
461
+ query=query,
462
+ qdrant_client=self.qdrant_client,
463
+ ctx=ctx,
464
+ limit=10, # Get more results for summary
465
+ min_score=0.0, # Get all results for aggregation
466
+ should_use_decay=False, # Summary doesn't use decay
467
+ target_project=target_project,
468
+ generate_embedding_func=generate_embedding_func,
469
+ constants={'DECAY_SCALE_DAYS': self.decay_scale_days},
470
+ max_concurrent=15 # Balanced concurrency
471
+ )
472
+
473
+ if not all_results:
474
+ return "<search_summary><message>No matches found</message></search_summary>"
475
+
476
+ # Sort and get top results
477
+ all_results.sort(key=lambda x: x['score'], reverse=True)
478
+ top_results = all_results[:10]
479
+
480
+ # Analyze patterns
481
+ avg_score = sum(r['score'] for r in top_results) / len(top_results)
482
+ collections_found = len(set(r.get('collection_name', r.get('collection', '')) for r in top_results))
483
+
484
+ # Extract common concepts if available
485
+ all_concepts = []
486
+ for r in top_results:
487
+ if 'payload' in r and 'concepts' in r['payload']:
488
+ all_concepts.extend(r['payload']['concepts'])
489
+
490
+ from collections import Counter
491
+ concept_counts = Counter(all_concepts).most_common(5)
492
+
493
+ return f"""<search_summary>
494
+ <query>{query}</query>
495
+ <total_matches>{len(all_results)}</total_matches>
496
+ <average_score>{avg_score:.3f}</average_score>
497
+ <collections_matched>{collections_found}</collections_matched>
498
+ <top_concepts>{', '.join([c[0] for c in concept_counts]) if concept_counts else 'N/A'}</top_concepts>
499
+ <insight>Found {len(all_results)} matches across {collections_found} collections with average relevance of {avg_score:.3f}</insight>
500
+ </search_summary>"""
501
+
502
+ except Exception as e:
503
+ logger.error(f"Search summary failed: {e}", exc_info=True)
504
+ return f"<search_summary><error>Search summary failed: {str(e)}</error></search_summary>"
505
+
506
    async def get_more_results(
        self,
        ctx: Context,
        query: str,
        offset: int = 3,
        limit: int = 3,
        min_score: float = 0.3,
        project: Optional[str] = None
    ) -> str:
        """Get additional search results after an initial search (pagination support).

        Re-runs the search and slices ``[offset:offset + limit]`` from the
        merged, score-sorted results. Stateless: no cursor is kept between
        calls, so results may shift if the index changes between pages.

        Args:
            ctx: MCP request context (used for debug logging).
            query: The original search query.
            offset: Number of top results to skip.
            limit: Number of additional results to return.
            min_score: Minimum similarity score per result.
            project: Project scope; None infers from CWD, 'all' searches everything.

        Returns:
            A ``<more_results>`` XML page, or an XML error blob.
        """

        await ctx.debug(f"Getting more results for: {query}, offset={offset}, limit={limit}")

        try:
            # Determine project scope: explicit argument wins, otherwise
            # infer from the client's working directory.
            target_project = project
            if project is None:
                cwd = os.environ.get('MCP_CLIENT_CWD', os.getcwd())
                target_project = self.get_project_from_cwd(cwd)

            # Get collections based on project
            if self.project_resolver and target_project and target_project != 'all':
                # Use ProjectResolver to find matching collections
                collection_names = self.project_resolver.find_collections_for_project(target_project)
                collections_response = await self.qdrant_client.get_collections()
                all_collections = collections_response.collections
                filtered_collections = [
                    c for c in all_collections
                    if c.name in collection_names
                ]
            else:
                # Use all collections except reflections
                collections_response = await self.qdrant_client.get_collections()
                collections = collections_response.collections
                filtered_collections = [
                    c for c in collections
                    if not c.name.startswith('reflections')
                ]

            # Gather all results using PARALLEL search
            collection_names = [c.name for c in filtered_collections]

            # Closure adapter for the parallel search helper.
            embedding_manager = self.get_embedding_manager()
            async def generate_embedding_func(text: str, force_type: str = 'local'):
                return await embedding_manager.generate_embedding(text, force_type=force_type)

            # Use parallel search for pagination. Note: the limit here is
            # per-collection, so `total_available` below can exceed what a
            # single-collection search would report.
            all_results, _ = await parallel_search_collections(
                collections_to_search=collection_names,
                query=query,
                qdrant_client=self.qdrant_client,
                ctx=ctx,
                limit=offset + limit,  # Get more results than needed to handle offset
                min_score=min_score,
                should_use_decay=False,  # Pagination doesn't use decay
                target_project=target_project,
                generate_embedding_func=generate_embedding_func,
                constants={'DECAY_SCALE_DAYS': self.decay_scale_days},
                max_concurrent=10  # Standard concurrency
            )

            if not all_results:
                return "<more_results><message>No more results found</message></more_results>"

            # Sort all results by score
            all_results.sort(key=lambda x: x['score'], reverse=True)

            # Apply offset and limit
            paginated_results = all_results[offset:offset + limit]

            if not paginated_results:
                return f"<more_results><message>No results at offset {offset}</message></more_results>"

            # Format paginated results
            output = f"<more_results>\n<query>{query}</query>\n"
            output += f"<offset>{offset}</offset>\n"
            output += f"<limit>{limit}</limit>\n"
            output += f"<total_available>{len(all_results)}</total_available>\n"
            output += f"<results_returned>{len(paginated_results)}</results_returned>\n"

            for i, result in enumerate(paginated_results, 1):
                # index is absolute (offset + i) so pages number contiguously.
                output += f"<result index=\"{offset + i}\">\n"
                output += f" <score>{result['score']:.3f}</score>\n"
                output += f" <timestamp>{result.get('timestamp', 'N/A')}</timestamp>\n"
                output += f" <preview>{result.get('content', '')[:200]}...</preview>\n"
                output += "</result>\n"

            output += "</more_results>"
            return output

        except Exception as e:
            logger.error(f"Get more results failed: {e}", exc_info=True)
            return f"<more_results><error>Failed to get more results: {str(e)}</error></more_results>"
600
+
601
+ async def search_by_file(
602
+ self,
603
+ ctx: Context,
604
+ file_path: str,
605
+ limit: int = 10,
606
+ project: Optional[str] = None
607
+ ) -> str:
608
+ """Search for conversations that analyzed a specific file."""
609
+
610
+ await ctx.debug(f"Searching for file: {file_path}, project={project}")
611
+
612
+ try:
613
+ # Normalize file path
614
+ normalized_path = str(Path(file_path).resolve())
615
+
616
+ # Search for file mentions in metadata
617
+ collections_response = await self.qdrant_client.get_collections()
618
+ collections = collections_response.collections
619
+
620
+ # Define async function to search a single collection
621
+ async def search_collection(collection_name: str):
622
+ try:
623
+ # Search by payload filter
624
+ search_results = await self.qdrant_client.search(
625
+ collection_name=collection_name,
626
+ query_vector=[0] * 384, # Dummy vector for metadata search
627
+ limit=limit,
628
+ query_filter={
629
+ "must": [
630
+ {
631
+ "key": "files_analyzed",
632
+ "match": {"any": [normalized_path]}
633
+ }
634
+ ]
635
+ }
636
+ )
637
+
638
+ results = []
639
+ for result in search_results:
640
+ results.append({
641
+ 'conversation_id': result.payload.get('conversation_id'),
642
+ 'timestamp': result.payload.get('timestamp'),
643
+ 'content': result.payload.get('content', ''),
644
+ 'files_analyzed': result.payload.get('files_analyzed', []),
645
+ 'score': result.score
646
+ })
647
+ return results
648
+
649
+ except Exception as e:
650
+ await ctx.debug(f"Error searching {collection_name}: {e}")
651
+ return []
652
+
653
+ # Use asyncio.gather for PARALLEL search across all collections
654
+ import asyncio
655
+ search_tasks = [search_collection(c.name) for c in collections]
656
+
657
+ # Limit concurrent searches to avoid overload
658
+ batch_size = 20
659
+ all_results = []
660
+ for i in range(0, len(search_tasks), batch_size):
661
+ batch = search_tasks[i:i+batch_size]
662
+ batch_results = await asyncio.gather(*batch)
663
+ for results in batch_results:
664
+ all_results.extend(results)
665
+
666
+ # Format results
667
+ if not all_results:
668
+ return f"<file_search><message>No conversations found analyzing {file_path}</message></file_search>"
669
+
670
+ return self.format_search_results(all_results, f"file:{file_path}")
671
+
672
+ except Exception as e:
673
+ logger.error(f"File search failed: {e}", exc_info=True)
674
+ return f"<file_search><error>File search failed: {str(e)}</error></file_search>"
675
+
676
+ async def search_by_concept(
677
+ self,
678
+ ctx: Context,
679
+ concept: str,
680
+ limit: int = 10,
681
+ project: Optional[str] = None,
682
+ include_files: bool = True
683
+ ) -> str:
684
+ """Search for conversations about a specific development concept."""
685
+
686
+ await ctx.debug(f"Searching for concept: {concept}, project={project}")
687
+
688
+ try:
689
+ # Search using concept as query with semantic search
690
+ results = await self.reflect_on_past(
691
+ ctx, concept, limit=limit, project=project
692
+ )
693
+
694
+ # Enhance results with concept-specific formatting
695
+ # This is a simplified version - actual implementation would analyze concepts
696
+ return results
697
+
698
+ except Exception as e:
699
+ logger.error(f"Concept search failed: {e}", exc_info=True)
700
+ return f"<concept_search><error>Concept search failed: {str(e)}</error></concept_search>"
701
+
702
+ async def get_next_results(
703
+ self,
704
+ ctx: Context,
705
+ query: str,
706
+ offset: int = 3,
707
+ limit: int = 3,
708
+ min_score: float = 0.3,
709
+ project: Optional[str] = None
710
+ ) -> str:
711
+ """Get additional search results after an initial search (pagination support)."""
712
+ # This is an alias for get_more_results
713
+ return await self.get_more_results(ctx, query, offset, limit, min_score, project)
714
+
715
+
716
def register_search_tools(
    mcp,
    qdrant_client: AsyncQdrantClient,
    qdrant_url: str,
    get_embedding_manager,
    normalize_project_name,
    enable_memory_decay: bool,
    decay_weight: float,
    decay_scale_days: float,
    use_native_decay: bool,
    native_decay_available: bool,
    decay_manager=None,
    project_resolver=None  # Add project resolver
):
    """Register search tools with the MCP server.

    Builds a single SearchTools instance from the injected dependencies and
    exposes its methods as MCP tools. Each decorated wrapper only supplies
    Field metadata for the MCP schema and delegates to the matching
    SearchTools method; all real logic lives on the class.
    """

    # One shared instance backs every registered tool.
    tools = SearchTools(
        qdrant_client,
        qdrant_url,
        get_embedding_manager,
        normalize_project_name,
        enable_memory_decay,
        decay_weight,
        decay_scale_days,
        use_native_decay,
        native_decay_available,
        decay_manager,
        project_resolver  # Pass the resolver
    )

    @mcp.tool()
    async def reflect_on_past(
        ctx: Context,
        query: str = Field(description="The search query to find semantically similar conversations"),
        limit: int = Field(default=5, description="Maximum number of results to return"),
        min_score: float = Field(default=0.3, description="Minimum similarity score (0-1)"),
        use_decay: int = Field(default=-1, description="Apply time-based decay: 1=enable, 0=disable, -1=use environment default (accepts int or str)"),
        project: Optional[str] = Field(default=None, description="Search specific project only. If not provided, searches current project based on working directory. Use 'all' to search across all projects."),
        mode: str = Field(default="full", description="Search mode: 'full' (all results with details), 'quick' (count + top result only), 'summary' (aggregated insights without individual results)"),
        brief: bool = Field(default=False, description="Brief mode: returns minimal information for faster response"),
        include_raw: bool = Field(default=False, description="Include raw Qdrant payload data for debugging (increases response size)"),
        response_format: str = Field(default="xml", description="Response format: 'xml' or 'markdown'")
    ) -> str:
        """Search for relevant past conversations using semantic search with optional time decay."""
        return await tools.reflect_on_past(ctx, query, limit, min_score, use_decay, project, mode, brief, include_raw, response_format)

    @mcp.tool()
    async def quick_search(
        ctx: Context,
        query: str = Field(description="The search query to find semantically similar conversations"),
        min_score: float = Field(default=0.3, description="Minimum similarity score (0-1)"),
        project: Optional[str] = Field(default=None, description="Search specific project only. If not provided, searches current project based on working directory. Use 'all' to search across all projects.")
    ) -> str:
        """Quick search that returns only the count and top result for fast overview."""
        return await tools.quick_search(ctx, query, min_score, project)

    @mcp.tool()
    async def search_summary(
        ctx: Context,
        query: str = Field(description="The search query to find semantically similar conversations"),
        project: Optional[str] = Field(default=None, description="Search specific project only. If not provided, searches current project based on working directory. Use 'all' to search across all projects.")
    ) -> str:
        """Get aggregated insights from search results without individual result details."""
        return await tools.search_summary(ctx, query, project)

    @mcp.tool()
    async def get_more_results(
        ctx: Context,
        query: str = Field(description="The original search query"),
        offset: int = Field(default=3, description="Number of results to skip (for pagination)"),
        limit: int = Field(default=3, description="Number of additional results to return"),
        min_score: float = Field(default=0.3, description="Minimum similarity score (0-1)"),
        project: Optional[str] = Field(default=None, description="Search specific project only")
    ) -> str:
        """Get additional search results after an initial search (pagination support)."""
        return await tools.get_more_results(ctx, query, offset, limit, min_score, project)

    @mcp.tool()
    async def search_by_file(
        ctx: Context,
        file_path: str = Field(description="The file path to search for in conversations"),
        limit: int = Field(default=10, description="Maximum number of results to return"),
        project: Optional[str] = Field(default=None, description="Search specific project only. Use 'all' to search across all projects.")
    ) -> str:
        """Search for conversations that analyzed a specific file."""
        return await tools.search_by_file(ctx, file_path, limit, project)

    @mcp.tool()
    async def search_by_concept(
        ctx: Context,
        concept: str = Field(description="The concept to search for (e.g., 'security', 'docker', 'testing')"),
        limit: int = Field(default=10, description="Maximum number of results to return"),
        project: Optional[str] = Field(default=None, description="Search specific project only. Use 'all' to search across all projects."),
        include_files: bool = Field(default=True, description="Include file information in results")
    ) -> str:
        """Search for conversations about a specific development concept."""
        return await tools.search_by_concept(ctx, concept, limit, project, include_files)

    # NOTE: get_next_results is a registered alias of get_more_results.
    @mcp.tool()
    async def get_next_results(
        ctx: Context,
        query: str = Field(description="The original search query"),
        offset: int = Field(default=3, description="Number of results to skip (for pagination)"),
        limit: int = Field(default=3, description="Number of additional results to return"),
        min_score: float = Field(default=0.3, description="Minimum similarity score (0-1)"),
        project: Optional[str] = Field(default=None, description="Search specific project only")
    ) -> str:
        """Get additional search results after an initial search (pagination support)."""
        return await tools.get_next_results(ctx, query, offset, limit, min_score, project)

    logger.info("Search tools registered successfully")