PyPI - ragtime-cli - Versions diffs - 0.2.10__py3-none-any.whl → 0.2.11__py3-none-any.whl - Mend

ragtime-cli 0.2.10__py3-none-any.whl → 0.2.11__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (11)

{ragtime_cli-0.2.10.dist-info → ragtime_cli-0.2.11.dist-info}/METADATA +21 -3
{ragtime_cli-0.2.10.dist-info → ragtime_cli-0.2.11.dist-info}/RECORD +11 -11
src/cli.py +10 -2
src/config.py +4 -3
src/db.py +23 -2
src/mcp_server.py +9 -3
src/memory.py +33 -14
{ragtime_cli-0.2.10.dist-info → ragtime_cli-0.2.11.dist-info}/WHEEL +0 -0
{ragtime_cli-0.2.10.dist-info → ragtime_cli-0.2.11.dist-info}/entry_points.txt +0 -0
{ragtime_cli-0.2.10.dist-info → ragtime_cli-0.2.11.dist-info}/licenses/LICENSE +0 -0
{ragtime_cli-0.2.10.dist-info → ragtime_cli-0.2.11.dist-info}/top_level.txt +0 -0

{ragtime_cli-0.2.10.dist-info → ragtime_cli-0.2.11.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: ragtime-cli
-Version: 0.2.10
+Version: 0.2.11
 Summary: Local-first memory and RAG system for Claude Code - semantic search over code, docs, and team knowledge
 Author-email: Bret Martineau <bretwardjames@gmail.com>
 License-Expression: MIT
@@ -121,6 +121,10 @@ ragtime search "useAsyncState" --type code
 # Search only docs
 ragtime search "authentication" --type docs --namespace app
+# Hybrid search: semantic + keyword filtering
+# Use -r/--require to ensure terms appear in results
+ragtime search "error handling" -r mobile -r dart
 # Reindex memory files
 ragtime reindex
@@ -233,9 +237,9 @@ ragtime setup-ghp
 ```yaml
 docs:
-  paths: ["docs", ".ragtime"]
+  paths: ["docs"]
   patterns: ["**/*.md"]
-  exclude: ["**/node_modules/**"]
+  exclude: ["**/node_modules/**", "**/.ragtime/**"]
 code:
   paths: ["."]
@@ -259,6 +263,20 @@ This is intentional - embeddings work better on focused summaries than large cod
 For Claude/MCP usage: The search tool description instructs Claude to read returned file paths for full implementations before making code changes.
+### Hybrid Search
+Semantic search can lose qualifiers - "error handling in mobile app" might return web app results because "error handling" dominates the embedding. Use `require_terms` to ensure specific words appear:
+```bash
+# CLI
+ragtime search "error handling" -r mobile -r dart
+# MCP
+search(query="error handling", require_terms=["mobile", "dart"])
+```
+This combines semantic similarity (finds conceptually related content) with keyword filtering (ensures qualifiers aren't ignored).
 ## Code Indexing
 The code indexer extracts meaningful symbols from your codebase:

{ragtime_cli-0.2.10.dist-info → ragtime_cli-0.2.11.dist-info}/RECORD RENAMED Viewed

@@ -1,10 +1,10 @@
-ragtime_cli-0.2.10.dist-info/licenses/LICENSE,sha256=9A0wJs2PRDciGRH4F8JUJ-aMKYQyq_gVu2ixrXs-l5A,1070
+ragtime_cli-0.2.11.dist-info/licenses/LICENSE,sha256=9A0wJs2PRDciGRH4F8JUJ-aMKYQyq_gVu2ixrXs-l5A,1070
 src/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-src/cli.py,sha256=3Cn4D1W4Wok0mJB1fiBdynnCaDo4FWJo8Zay3Tp_ycQ,73978
-src/config.py,sha256=qyn5ADjPwvQlhwSJHwzat1v449b7MKEzIHr37Q5qhCc,4497
-src/db.py,sha256=dxdGNhM-0Ke8yjcp69LTPS4L5vpGue-_2HwBPNvD2bg,7101
-src/mcp_server.py,sha256=l834kmwumb9egzz5Sscfm8DdpPJLcqK7qX6a3sZ3EVk,21036
-src/memory.py,sha256=qd-29w2rfkDzr1qIzxRgi9cr7skxjw8nSKhj7qjt1v4,14506
+src/cli.py,sha256=HDZNFg5shUU1s6JLi9Wn_TydEXx-92JCginJYgH3BlE,74375
+src/config.py,sha256=tQ6gPLr4ksn2bJPIUjtELFr-k01Eg4g-LDo3GNE6P0Q,4600
+src/db.py,sha256=ueSThFXkhI5MFwXICkNW3zqCawGDi3kqFQnbm4st_Ew,8186
+src/mcp_server.py,sha256=SvkoGkBqoaZkW3KXiE5qHbbkTIjby94mcxMXgJKv8ik,21559
+src/memory.py,sha256=lmDgC9AH24dog6dvbGgHt95TANUgdBZSnLcqM0isx10,15639
 src/commands/audit.md,sha256=Xkucm-gfBIMalK9wf7NBbyejpsqBTUAGGlb7GxMtMPY,5137
 src/commands/create-pr.md,sha256=u6-jVkDP_6bJQp6ImK039eY9F6B9E2KlAVlvLY-WV6Q,9483
 src/commands/generate-docs.md,sha256=9W2Yy-PDyC3p5k39uEb31z5YAHkSKsQLg6gV3tLgSnQ,7015
@@ -18,8 +18,8 @@ src/commands/start.md,sha256=qoqhkMgET74DBx8YPIT1-wqCiVBUDxlmevigsCinHSY,6506
 src/indexers/__init__.py,sha256=MYoCPZUpHakMX1s2vWnc9shjWfx_X1_0JzUhpKhnKUQ,454
 src/indexers/code.py,sha256=G2TbiKbWj0e7DV5KsU8-Ggw6ziDb4zTuZ4Bu3ryV4g8,18059
 src/indexers/docs.py,sha256=nyewQ4Ug4SCuhne4TuLDlUDzz9GH2STInddj81ocz50,3555
-ragtime_cli-0.2.10.dist-info/METADATA,sha256=UeWRU7V51UjtrulR1sNF1CsH2gMA3fjn9FMtMRjOqrw,10619
-ragtime_cli-0.2.10.dist-info/WHEEL,sha256=wUyA8OaulRlbfwMtmQsvNngGrxQHAvkKcvRmdizlJi0,92
-ragtime_cli-0.2.10.dist-info/entry_points.txt,sha256=cWLbeyMxZNbew-THS3bHXTpCRXt1EaUy5QUOXGXLjl4,75
-ragtime_cli-0.2.10.dist-info/top_level.txt,sha256=74rtVfumQlgAPzR5_2CgYN24MB0XARCg0t-gzk6gTrM,4
-ragtime_cli-0.2.10.dist-info/RECORD,,
+ragtime_cli-0.2.11.dist-info/METADATA,sha256=M0M_WyDQE5zDvpoMeo3RG18NJNRUw6IMOVqKh4mexVY,11269
+ragtime_cli-0.2.11.dist-info/WHEEL,sha256=wUyA8OaulRlbfwMtmQsvNngGrxQHAvkKcvRmdizlJi0,92
+ragtime_cli-0.2.11.dist-info/entry_points.txt,sha256=cWLbeyMxZNbew-THS3bHXTpCRXt1EaUy5QUOXGXLjl4,75
+ragtime_cli-0.2.11.dist-info/top_level.txt,sha256=74rtVfumQlgAPzR5_2CgYN24MB0XARCg0t-gzk6gTrM,4
+ragtime_cli-0.2.11.dist-info/RECORD,,

src/cli.py CHANGED Viewed

@@ -469,12 +469,19 @@ def index(path: Path, index_type: str, clear: bool):
 @click.option("--path", type=click.Path(exists=True, path_type=Path), default=".")
 @click.option("--type", "type_filter", type=click.Choice(["all", "docs", "code"]), default="all")
 @click.option("--namespace", "-n", help="Filter by namespace")
+@click.option("--require", "-r", "require_terms", multiple=True,
+              help="Terms that MUST appear in results (repeatable)")
 @click.option("--include-archive", is_flag=True, help="Also search archived branches")
 @click.option("--limit", "-l", default=5, help="Max results")
 @click.option("--verbose", "-v", is_flag=True, help="Show full content")
 def search(query: str, path: Path, type_filter: str, namespace: str,
-           include_archive: bool, limit: int, verbose: bool):
-    """Search indexed content."""
+           require_terms: tuple, include_archive: bool, limit: int, verbose: bool):
+    """
+    Hybrid search: semantic similarity + keyword filtering.
+    Use --require/-r to ensure specific terms appear in results.
+    Example: ragtime search "error handling" -r mobile -r dart
+    """
     path = Path(path).resolve()
     db = get_db(path)
@@ -485,6 +492,7 @@ def search(query: str, path: Path, type_filter: str, namespace: str,
         limit=limit,
         type_filter=type_arg,
         namespace=namespace,
+        require_terms=list(require_terms) if require_terms else None,
     )
     if not results:

src/config.py CHANGED Viewed

@@ -12,13 +12,14 @@ import yaml
 @dataclass
 class DocsConfig:
     """Configuration for docs indexing."""
-    paths: list[str] = field(default_factory=lambda: ["docs", ".ragtime"])
+    # Note: .ragtime/ is NOT included here - memories are indexed separately via 'reindex'
+    # to avoid duplicate entries (same file indexed as both doc and memory)
+    paths: list[str] = field(default_factory=lambda: ["docs"])
     patterns: list[str] = field(default_factory=lambda: ["**/*.md"])
     exclude: list[str] = field(default_factory=lambda: [
         "**/node_modules/**",
         "**/.git/**",
-        "**/.ragtime/index/**",
-        "**/.ragtime/branches/.*",  # Exclude synced (dot-prefixed) branches
+        "**/.ragtime/**",  # Memories indexed separately
     ])

src/db.py CHANGED Viewed

@@ -84,16 +84,20 @@ class RagtimeDB:
         limit: int = 10,
         type_filter: str | None = None,
         namespace: str | None = None,
+        require_terms: list[str] | None = None,
         **filters,
     ) -> list[dict]:
         """
-        Semantic search over indexed content.
+        Hybrid search: semantic similarity + keyword filtering.
         Args:
             query: Natural language search query
             limit: Max results to return
             type_filter: "code" or "docs" (None = both)
             namespace: Filter by namespace (for docs)
+            require_terms: List of terms that MUST appear in results (case-insensitive).
+                          Use for scoped queries like "error handling in mobile" with
+                          require_terms=["mobile"] to ensure "mobile" isn't ignored.
             **filters: Additional metadata filters (None values are ignored)
         Returns:
@@ -121,9 +125,12 @@ class RagtimeDB:
         else:
             where = {"$and": conditions}
+        # When using require_terms, fetch more results since we'll filter some out
+        fetch_limit = limit * 5 if require_terms else limit
         results = self.collection.query(
             query_texts=[query],
-            n_results=limit,
+            n_results=fetch_limit,
             where=where,
         )
@@ -131,12 +138,26 @@ class RagtimeDB:
         output = []
         if results["documents"] and results["documents"][0]:
             for i, doc in enumerate(results["documents"][0]):
+                # Hybrid filtering: ensure required terms appear
+                if require_terms:
+                    doc_lower = doc.lower()
+                    # Also check file path in metadata for code/file matches
+                    file_path = (results["metadatas"][0][i].get("file", "") or "").lower()
+                    combined_text = f"{doc_lower} {file_path}"
+                    if not all(term.lower() in combined_text for term in require_terms):
+                        continue
                 output.append({
                     "content": doc,
                     "metadata": results["metadatas"][0][i] if results["metadatas"] else {},
                     "distance": results["distances"][0][i] if results["distances"] else None,
                 })
+                # Stop once we have enough
+                if len(output) >= limit:
+                    break
         return output
     def delete(self, ids: list[str]) -> None:

src/mcp_server.py CHANGED Viewed

@@ -132,7 +132,7 @@ class RagtimeMCPServer:
             },
             {
                 "name": "search",
-                "description": "Semantic search over indexed code and docs. Returns function signatures, class definitions, and doc summaries with file paths and line numbers. IMPORTANT: Results are summaries only - use the Read tool on returned file paths to see full implementations before making code changes or decisions.",
+                "description": "Hybrid search over indexed code and docs (semantic + keyword). Returns function signatures, class definitions, and doc summaries with file paths and line numbers. IMPORTANT: Results are summaries only - use the Read tool on returned file paths to see full implementations before making code changes or decisions.",
                 "inputSchema": {
                     "type": "object",
                     "properties": {
@@ -152,6 +152,11 @@ class RagtimeMCPServer:
                             "type": "string",
                             "description": "Filter by component"
                         },
+                        "require_terms": {
+                            "type": "array",
+                            "items": {"type": "string"},
+                            "description": "Terms that MUST appear in results (case-insensitive). Use for scoped queries like 'error handling in mobile' with require_terms=['mobile'] to ensure the qualifier isn't lost in semantic search."
+                        },
                         "limit": {
                             "type": "integer",
                             "default": 10,
@@ -333,13 +338,14 @@ class RagtimeMCPServer:
         }
     def _search(self, args: dict) -> dict:
-        """Search indexed content."""
+        """Search indexed content with hybrid semantic + keyword matching."""
         results = self.db.search(
             query=args["query"],
             limit=args.get("limit", 10),
             namespace=args.get("namespace"),
             type_filter=args.get("type"),
             component=args.get("component"),
+            require_terms=args.get("require_terms"),
         )
         return {
@@ -487,7 +493,7 @@ class RagtimeMCPServer:
                         "protocolVersion": "2024-11-05",
                         "serverInfo": {
                             "name": "ragtime",
-                            "version": "0.2.10",
+                            "version": "0.2.11",
                         },
                         "capabilities": {
                             "tools": {},

src/memory.py CHANGED Viewed

@@ -207,25 +207,41 @@ class MemoryStore:
     def get(self, memory_id: str) -> Optional[Memory]:
         """Get a memory by ID."""
-        # Search in ChromaDB to find the file
-        results = self.db.collection.get(ids=[memory_id])
+        # Search in ChromaDB to find the memory
+        results = self.db.collection.get(ids=[memory_id], include=["documents", "metadatas"])
         if not results["ids"]:
             return None
         metadata = results["metadatas"][0]
+        content = results["documents"][0] if results["documents"] else ""
         file_rel_path = metadata.get("file", "")
-        if not file_rel_path:
-            return None
-        file_path = self.memory_dir / file_rel_path
-        if file_path.exists():
-            # Pass relative_to so the memory preserves its actual file path
-            return Memory.from_file(file_path, relative_to=self.memory_dir)
+        # Try to read from file first (has full frontmatter data)
+        if file_rel_path:
+            file_path = self.memory_dir / file_rel_path
+            if file_path.exists():
+                return Memory.from_file(file_path, relative_to=self.memory_dir)
-        return None
+        # Fall back to constructing from ChromaDB data
+        # This handles cases where file path is wrong or file was deleted
+        return Memory(
+            id=memory_id,
+            content=content,
+            namespace=metadata.get("namespace", "unknown"),
+            type=metadata.get("type", "unknown"),
+            component=metadata.get("component"),
+            confidence=metadata.get("confidence", "medium"),
+            confidence_reason=metadata.get("confidence_reason"),
+            source=metadata.get("source", "unknown"),
+            status=metadata.get("status", "active"),
+            added=metadata.get("added", ""),
+            author=metadata.get("author"),
+            issue=metadata.get("issue"),
+            epic=metadata.get("epic"),
+            branch=metadata.get("branch"),
+            _file_path=file_rel_path,
+        )
     def delete(self, memory_id: str) -> bool:
         """Delete a memory by ID."""
@@ -322,10 +338,13 @@ class MemoryStore:
         if component:
             conditions.append({"component": component})
+        # Exclude docs/code entries - they use type="docs" or type="code"
+        # while memories use types like "architecture", "feature", etc.
+        # This is especially important for wildcard queries
+        conditions.append({"type": {"$nin": ["docs", "code"]}})
         # Build where clause with $and if multiple conditions
-        if len(conditions) == 0:
-            where = None
-        elif len(conditions) == 1:
+        if len(conditions) == 1:
             where = conditions[0]
         else:
             where = {"$and": conditions}

{ragtime_cli-0.2.10.dist-info → ragtime_cli-0.2.11.dist-info}/WHEEL RENAMED Viewed

File without changes

{ragtime_cli-0.2.10.dist-info → ragtime_cli-0.2.11.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{ragtime_cli-0.2.10.dist-info → ragtime_cli-0.2.11.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

{ragtime_cli-0.2.10.dist-info → ragtime_cli-0.2.11.dist-info}/top_level.txt RENAMED Viewed

File without changes

ragtime-cli 0.2.10__py3-none-any.whl → 0.2.11__py3-none-any.whl

ragtime-cli 0.2.10__py3-none-any.whl → 0.2.11__py3-none-any.whl