alma-memory 0.4.0__py3-none-any.whl → 0.5.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (94)
  1. alma/__init__.py +121 -45
  2. alma/confidence/__init__.py +1 -1
  3. alma/confidence/engine.py +92 -58
  4. alma/confidence/types.py +34 -14
  5. alma/config/loader.py +3 -2
  6. alma/consolidation/__init__.py +23 -0
  7. alma/consolidation/engine.py +678 -0
  8. alma/consolidation/prompts.py +84 -0
  9. alma/core.py +136 -28
  10. alma/domains/__init__.py +6 -6
  11. alma/domains/factory.py +12 -9
  12. alma/domains/schemas.py +17 -3
  13. alma/domains/types.py +8 -4
  14. alma/events/__init__.py +75 -0
  15. alma/events/emitter.py +284 -0
  16. alma/events/storage_mixin.py +246 -0
  17. alma/events/types.py +126 -0
  18. alma/events/webhook.py +425 -0
  19. alma/exceptions.py +49 -0
  20. alma/extraction/__init__.py +31 -0
  21. alma/extraction/auto_learner.py +265 -0
  22. alma/extraction/extractor.py +420 -0
  23. alma/graph/__init__.py +106 -0
  24. alma/graph/backends/__init__.py +32 -0
  25. alma/graph/backends/kuzu.py +624 -0
  26. alma/graph/backends/memgraph.py +432 -0
  27. alma/graph/backends/memory.py +236 -0
  28. alma/graph/backends/neo4j.py +417 -0
  29. alma/graph/base.py +159 -0
  30. alma/graph/extraction.py +198 -0
  31. alma/graph/store.py +860 -0
  32. alma/harness/__init__.py +4 -4
  33. alma/harness/base.py +18 -9
  34. alma/harness/domains.py +27 -11
  35. alma/initializer/__init__.py +1 -1
  36. alma/initializer/initializer.py +51 -43
  37. alma/initializer/types.py +25 -17
  38. alma/integration/__init__.py +9 -9
  39. alma/integration/claude_agents.py +32 -20
  40. alma/integration/helena.py +32 -22
  41. alma/integration/victor.py +57 -33
  42. alma/learning/__init__.py +27 -27
  43. alma/learning/forgetting.py +198 -148
  44. alma/learning/heuristic_extractor.py +40 -24
  45. alma/learning/protocols.py +65 -17
  46. alma/learning/validation.py +7 -2
  47. alma/mcp/__init__.py +4 -4
  48. alma/mcp/__main__.py +2 -1
  49. alma/mcp/resources.py +17 -16
  50. alma/mcp/server.py +102 -44
  51. alma/mcp/tools.py +180 -45
  52. alma/observability/__init__.py +84 -0
  53. alma/observability/config.py +302 -0
  54. alma/observability/logging.py +424 -0
  55. alma/observability/metrics.py +583 -0
  56. alma/observability/tracing.py +440 -0
  57. alma/progress/__init__.py +3 -3
  58. alma/progress/tracker.py +26 -20
  59. alma/progress/types.py +8 -12
  60. alma/py.typed +0 -0
  61. alma/retrieval/__init__.py +11 -11
  62. alma/retrieval/cache.py +20 -21
  63. alma/retrieval/embeddings.py +4 -4
  64. alma/retrieval/engine.py +179 -39
  65. alma/retrieval/scoring.py +73 -63
  66. alma/session/__init__.py +2 -2
  67. alma/session/manager.py +5 -5
  68. alma/session/types.py +5 -4
  69. alma/storage/__init__.py +70 -0
  70. alma/storage/azure_cosmos.py +414 -133
  71. alma/storage/base.py +215 -4
  72. alma/storage/chroma.py +1443 -0
  73. alma/storage/constants.py +103 -0
  74. alma/storage/file_based.py +59 -28
  75. alma/storage/migrations/__init__.py +21 -0
  76. alma/storage/migrations/base.py +321 -0
  77. alma/storage/migrations/runner.py +323 -0
  78. alma/storage/migrations/version_stores.py +337 -0
  79. alma/storage/migrations/versions/__init__.py +11 -0
  80. alma/storage/migrations/versions/v1_0_0.py +373 -0
  81. alma/storage/pinecone.py +1080 -0
  82. alma/storage/postgresql.py +1559 -0
  83. alma/storage/qdrant.py +1306 -0
  84. alma/storage/sqlite_local.py +504 -60
  85. alma/testing/__init__.py +46 -0
  86. alma/testing/factories.py +301 -0
  87. alma/testing/mocks.py +389 -0
  88. alma/types.py +62 -14
  89. alma_memory-0.5.1.dist-info/METADATA +939 -0
  90. alma_memory-0.5.1.dist-info/RECORD +93 -0
  91. {alma_memory-0.4.0.dist-info → alma_memory-0.5.1.dist-info}/WHEEL +1 -1
  92. alma_memory-0.4.0.dist-info/METADATA +0 -488
  93. alma_memory-0.4.0.dist-info/RECORD +0 -52
  94. {alma_memory-0.4.0.dist-info → alma_memory-0.5.1.dist-info}/top_level.txt +0 -0
alma/storage/sqlite_local.py

@@ -6,28 +6,31 @@ This is the recommended backend for local development and testing.
 """
 
 import json
-import sqlite3
 import logging
-import numpy as np
-from pathlib import Path
-from datetime import datetime, timezone
-from typing import Optional, List, Dict, Any, Tuple
+import sqlite3
 from contextlib import contextmanager
+from datetime import datetime, timezone
+from pathlib import Path
+from typing import Any, Dict, List, Optional, Tuple
 
+import numpy as np
+
+from alma.storage.base import StorageBackend
+from alma.storage.constants import SQLITE_TABLE_NAMES, MemoryType
 from alma.types import (
+    AntiPattern,
+    DomainKnowledge,
     Heuristic,
     Outcome,
     UserPreference,
-    DomainKnowledge,
-    AntiPattern,
 )
-from alma.storage.base import StorageBackend
 
 logger = logging.getLogger(__name__)
 
 # Try to import FAISS, fall back to numpy-based search if not available
 try:
     import faiss
+
     FAISS_AVAILABLE = True
 except ImportError:
     FAISS_AVAILABLE = False
@@ -54,6 +57,7 @@ class SQLiteStorage(StorageBackend):
         self,
         db_path: Path,
         embedding_dim: int = 384,  # Default for all-MiniLM-L6-v2
+        auto_migrate: bool = True,
     ):
         """
         Initialize SQLite storage.
@@ -61,19 +65,29 @@ class SQLiteStorage(StorageBackend):
         Args:
             db_path: Path to SQLite database file
             embedding_dim: Dimension of embedding vectors
+            auto_migrate: If True, automatically apply pending migrations on startup
         """
         self.db_path = Path(db_path)
         self.db_path.parent.mkdir(parents=True, exist_ok=True)
         self.embedding_dim = embedding_dim
 
+        # Migration support (lazy-loaded)
+        self._migration_runner = None
+        self._version_store = None
+
         # Initialize database
         self._init_database()
 
         # Initialize FAISS indices (one per memory type)
         self._indices: Dict[str, Any] = {}
         self._id_maps: Dict[str, List[str]] = {}  # memory_type -> [memory_ids]
+        self._index_dirty: Dict[str, bool] = {}  # Track which indexes need rebuilding
         self._load_faiss_indices()
 
+        # Auto-migrate if enabled
+        if auto_migrate:
+            self._ensure_migrated()
+
     @classmethod
     def from_config(cls, config: Dict[str, Any]) -> "SQLiteStorage":
         """Create instance from configuration."""
@@ -149,6 +163,10 @@ class SQLiteStorage(StorageBackend):
             "CREATE INDEX IF NOT EXISTS idx_outcomes_task_type "
             "ON outcomes(project_id, agent, task_type)"
         )
+        cursor.execute(
+            "CREATE INDEX IF NOT EXISTS idx_outcomes_timestamp "
+            "ON outcomes(project_id, timestamp)"
+        )
 
         # User preferences table
         cursor.execute("""
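The new idx_outcomes_timestamp index backs the ORDER BY timestamp DESC queries added further down in this diff. A quick way to confirm SQLite actually picks it up, using only the standard sqlite3 module against a database created by this backend (illustrative; output wording varies by SQLite version):

    import sqlite3

    conn = sqlite3.connect("alma.db")
    plan = conn.execute(
        "EXPLAIN QUERY PLAN "
        "SELECT * FROM outcomes WHERE project_id = ? ORDER BY timestamp DESC LIMIT 5",
        ("proj-1",),
    ).fetchall()
    # Expect something like:
    #   SEARCH outcomes USING INDEX idx_outcomes_timestamp (project_id=?)
    print(plan)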
@@ -222,9 +240,14 @@ class SQLiteStorage(StorageBackend):
             "ON embeddings(memory_type)"
         )
 
-    def _load_faiss_indices(self):
-        """Load or create FAISS indices for each memory type."""
-        memory_types = ["heuristics", "outcomes", "domain_knowledge", "anti_patterns"]
+    def _load_faiss_indices(self, memory_types: Optional[List[str]] = None):
+        """Load or create FAISS indices for specified memory types.
+
+        Args:
+            memory_types: List of memory types to load. If None, loads all types.
+        """
+        if memory_types is None:
+            memory_types = list(MemoryType.VECTOR_ENABLED)
 
         for memory_type in memory_types:
             if FAISS_AVAILABLE:
@@ -235,6 +258,7 @@ class SQLiteStorage(StorageBackend):
                 self._indices[memory_type] = []
 
             self._id_maps[memory_type] = []
+            self._index_dirty[memory_type] = False  # Mark as fresh after rebuild
 
             # Load existing embeddings
             with self._get_connection() as conn:
@@ -257,6 +281,19 @@ class SQLiteStorage(StorageBackend):
                 else:
                     self._indices[memory_type].append(embedding)
 
+    def _ensure_index_fresh(self, memory_type: str) -> None:
+        """Rebuild index for a memory type if it has been marked dirty.
+
+        This implements lazy rebuilding - indexes are only rebuilt when
+        actually needed for search, not immediately on every delete.
+
+        Args:
+            memory_type: The type of memory index to check/rebuild.
+        """
+        if self._index_dirty.get(memory_type, False):
+            logger.debug(f"Rebuilding dirty index for {memory_type}")
+            self._load_faiss_indices([memory_type])
+
     def _add_to_index(
         self,
         memory_type: str,
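_ensure_index_fresh is the read side of a dirty-flag scheme: the delete methods later in this diff only flip a boolean, and the O(n) index rebuild is deferred until a search actually needs it. The same idea in miniature, with a hypothetical LazyIndex standing in for SQLiteStorage (not ALMA's API):

    class LazyIndex:
        """Toy dirty-flag rebuild; rows play the SQL tables, index plays FAISS."""

        def __init__(self, rows: list[str]):
            self._rows = rows             # authoritative store
            self._index: list[str] = []   # derived search structure
            self._dirty = True            # force a build on first search

        def delete(self, row: str) -> None:
            self._rows.remove(row)        # cheap store update...
            self._dirty = True            # ...index is merely marked stale

        def search(self, query: str) -> list[str]:
            if self._dirty:               # pay the rebuild cost here, at most once
                self._index = sorted(self._rows)
                self._dirty = False
            return [r for r in self._index if query in r]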
@@ -296,6 +333,9 @@ class SQLiteStorage(StorageBackend):
         top_k: int,
     ) -> List[Tuple[str, float]]:
         """Search FAISS index for similar embeddings."""
+        # Ensure index is up-to-date before searching (lazy rebuild)
+        self._ensure_index_fresh(memory_type)
+
         if not self._id_maps[memory_type]:
             return []
 
@@ -304,10 +344,12 @@ class SQLiteStorage(StorageBackend):
         if FAISS_AVAILABLE:
             # Normalize for cosine similarity (IndexFlatIP)
             faiss.normalize_L2(query)
-            scores, indices = self._indices[memory_type].search(query, min(top_k, len(self._id_maps[memory_type])))
+            scores, indices = self._indices[memory_type].search(
+                query, min(top_k, len(self._id_maps[memory_type]))
+            )
 
             results = []
-            for score, idx in zip(scores[0], indices[0]):
+            for score, idx in zip(scores[0], indices[0], strict=False):
                 if idx >= 0 and idx < len(self._id_maps[memory_type]):
                     results.append((self._id_maps[memory_type][idx], float(score)))
             return results
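normalize_L2 followed by an inner-product search (IndexFlatIP) is the usual FAISS route to cosine similarity: once vectors are unit length, their dot product equals the cosine of the angle between them. The identity, checked with plain numpy (this mirrors the idea, not ALMA's exact code path):

    import numpy as np

    rng = np.random.default_rng(0)
    a = rng.random(384).astype("float32")
    b = rng.random(384).astype("float32")

    cosine = a @ b / (np.linalg.norm(a) * np.linalg.norm(b))

    a_unit = a / np.linalg.norm(a)   # what faiss.normalize_L2 does in place
    b_unit = b / np.linalg.norm(b)
    inner = a_unit @ b_unit          # what IndexFlatIP scores

    assert np.isclose(cosine, inner)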
@@ -354,14 +396,18 @@ class SQLiteStorage(StorageBackend):
                 heuristic.confidence,
                 heuristic.occurrence_count,
                 heuristic.success_count,
-                heuristic.last_validated.isoformat() if heuristic.last_validated else None,
+                (
+                    heuristic.last_validated.isoformat()
+                    if heuristic.last_validated
+                    else None
+                ),
                 heuristic.created_at.isoformat() if heuristic.created_at else None,
                 json.dumps(heuristic.metadata) if heuristic.metadata else None,
             ),
         )
 
         # Add embedding to index
-        self._add_to_index("heuristics", heuristic.id, heuristic.embedding)
+        self._add_to_index(MemoryType.HEURISTICS, heuristic.id, heuristic.embedding)
         logger.debug(f"Saved heuristic: {heuristic.id}")
         return heuristic.id
 
@@ -393,7 +439,7 @@ class SQLiteStorage(StorageBackend):
         )
 
         # Add embedding to index
-        self._add_to_index("outcomes", outcome.id, outcome.embedding)
+        self._add_to_index(MemoryType.OUTCOMES, outcome.id, outcome.embedding)
         logger.debug(f"Saved outcome: {outcome.id}")
         return outcome.id
 
@@ -439,13 +485,19 @@ class SQLiteStorage(StorageBackend):
                 knowledge.fact,
                 knowledge.source,
                 knowledge.confidence,
-                knowledge.last_verified.isoformat() if knowledge.last_verified else None,
+                (
+                    knowledge.last_verified.isoformat()
+                    if knowledge.last_verified
+                    else None
+                ),
                 json.dumps(knowledge.metadata) if knowledge.metadata else None,
             ),
         )
 
         # Add embedding to index
-        self._add_to_index("domain_knowledge", knowledge.id, knowledge.embedding)
+        self._add_to_index(
+            MemoryType.DOMAIN_KNOWLEDGE, knowledge.id, knowledge.embedding
+        )
         logger.debug(f"Saved domain knowledge: {knowledge.id}")
         return knowledge.id
 
@@ -468,17 +520,150 @@ class SQLiteStorage(StorageBackend):
                 anti_pattern.why_bad,
                 anti_pattern.better_alternative,
                 anti_pattern.occurrence_count,
-                anti_pattern.last_seen.isoformat() if anti_pattern.last_seen else None,
-                anti_pattern.created_at.isoformat() if anti_pattern.created_at else None,
-                json.dumps(anti_pattern.metadata) if anti_pattern.metadata else None,
+                (
+                    anti_pattern.last_seen.isoformat()
+                    if anti_pattern.last_seen
+                    else None
+                ),
+                (
+                    anti_pattern.created_at.isoformat()
+                    if anti_pattern.created_at
+                    else None
+                ),
+                (
+                    json.dumps(anti_pattern.metadata)
+                    if anti_pattern.metadata
+                    else None
+                ),
             ),
         )
 
         # Add embedding to index
-        self._add_to_index("anti_patterns", anti_pattern.id, anti_pattern.embedding)
+        self._add_to_index(
+            MemoryType.ANTI_PATTERNS, anti_pattern.id, anti_pattern.embedding
+        )
         logger.debug(f"Saved anti-pattern: {anti_pattern.id}")
         return anti_pattern.id
 
+    # ==================== BATCH WRITE OPERATIONS ====================
+
+    def save_heuristics(self, heuristics: List[Heuristic]) -> List[str]:
+        """Save multiple heuristics in a batch using executemany."""
+        if not heuristics:
+            return []
+
+        with self._get_connection() as conn:
+            cursor = conn.cursor()
+            cursor.executemany(
+                """
+                INSERT OR REPLACE INTO heuristics
+                (id, agent, project_id, condition, strategy, confidence,
+                 occurrence_count, success_count, last_validated, created_at, metadata)
+                VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
+                """,
+                [
+                    (
+                        h.id,
+                        h.agent,
+                        h.project_id,
+                        h.condition,
+                        h.strategy,
+                        h.confidence,
+                        h.occurrence_count,
+                        h.success_count,
+                        h.last_validated.isoformat() if h.last_validated else None,
+                        h.created_at.isoformat() if h.created_at else None,
+                        json.dumps(h.metadata) if h.metadata else None,
+                    )
+                    for h in heuristics
+                ],
+            )
+
+        # Add embeddings to index
+        for h in heuristics:
+            self._add_to_index(MemoryType.HEURISTICS, h.id, h.embedding)
+
+        logger.debug(f"Batch saved {len(heuristics)} heuristics")
+        return [h.id for h in heuristics]
+
+    def save_outcomes(self, outcomes: List[Outcome]) -> List[str]:
+        """Save multiple outcomes in a batch using executemany."""
+        if not outcomes:
+            return []
+
+        with self._get_connection() as conn:
+            cursor = conn.cursor()
+            cursor.executemany(
+                """
+                INSERT OR REPLACE INTO outcomes
+                (id, agent, project_id, task_type, task_description, success,
+                 strategy_used, duration_ms, error_message, user_feedback, timestamp, metadata)
+                VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?, ?)
+                """,
+                [
+                    (
+                        o.id,
+                        o.agent,
+                        o.project_id,
+                        o.task_type,
+                        o.task_description,
+                        1 if o.success else 0,
+                        o.strategy_used,
+                        o.duration_ms,
+                        o.error_message,
+                        o.user_feedback,
+                        o.timestamp.isoformat() if o.timestamp else None,
+                        json.dumps(o.metadata) if o.metadata else None,
+                    )
+                    for o in outcomes
+                ],
+            )
+
+        # Add embeddings to index
+        for o in outcomes:
+            self._add_to_index(MemoryType.OUTCOMES, o.id, o.embedding)
+
+        logger.debug(f"Batch saved {len(outcomes)} outcomes")
+        return [o.id for o in outcomes]
+
+    def save_domain_knowledge_batch(
+        self, knowledge_items: List[DomainKnowledge]
+    ) -> List[str]:
+        """Save multiple domain knowledge items in a batch using executemany."""
+        if not knowledge_items:
+            return []
+
+        with self._get_connection() as conn:
+            cursor = conn.cursor()
+            cursor.executemany(
+                """
+                INSERT OR REPLACE INTO domain_knowledge
+                (id, agent, project_id, domain, fact, source, confidence, last_verified, metadata)
+                VALUES (?, ?, ?, ?, ?, ?, ?, ?, ?)
+                """,
+                [
+                    (
+                        k.id,
+                        k.agent,
+                        k.project_id,
+                        k.domain,
+                        k.fact,
+                        k.source,
+                        k.confidence,
+                        k.last_verified.isoformat() if k.last_verified else None,
+                        json.dumps(k.metadata) if k.metadata else None,
+                    )
+                    for k in knowledge_items
+                ],
+            )
+
+        # Add embeddings to index
+        for k in knowledge_items:
+            self._add_to_index(MemoryType.DOMAIN_KNOWLEDGE, k.id, k.embedding)
+
+        logger.debug(f"Batch saved {len(knowledge_items)} domain knowledge items")
+        return [k.id for k in knowledge_items]
+
     # ==================== READ OPERATIONS ====================
 
     def get_heuristics(
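The point of the new batch writers is that executemany pushes the whole list through one prepared statement inside a single transaction, instead of paying per-call overhead row by row. The shape of the call, reduced to a self-contained toy schema (not ALMA's):

    import sqlite3

    conn = sqlite3.connect(":memory:")
    conn.execute("CREATE TABLE kv (id TEXT PRIMARY KEY, val TEXT)")

    rows = [(f"id-{i}", f"val-{i}") for i in range(1000)]

    # One statement, many parameter tuples - same pattern as save_heuristics().
    conn.executemany("INSERT OR REPLACE INTO kv (id, val) VALUES (?, ?)", rows)
    conn.commit()

    print(conn.execute("SELECT COUNT(*) FROM kv").fetchone()[0])  # -> 1000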
@@ -493,7 +678,9 @@ class SQLiteStorage(StorageBackend):
         # If embedding provided, use vector search to get candidate IDs
         candidate_ids = None
         if embedding:
-            search_results = self._search_index("heuristics", embedding, top_k * 2)
+            search_results = self._search_index(
+                MemoryType.HEURISTICS, embedding, top_k * 2
+            )
             candidate_ids = [id for id, _ in search_results]
 
         with self._get_connection() as conn:
@@ -531,7 +718,9 @@ class SQLiteStorage(StorageBackend):
         """Get outcomes with optional vector search."""
         candidate_ids = None
         if embedding:
-            search_results = self._search_index("outcomes", embedding, top_k * 2)
+            search_results = self._search_index(
+                MemoryType.OUTCOMES, embedding, top_k * 2
+            )
             candidate_ids = [id for id, _ in search_results]
 
         with self._get_connection() as conn:
@@ -596,7 +785,9 @@ class SQLiteStorage(StorageBackend):
         """Get domain knowledge with optional vector search."""
         candidate_ids = None
         if embedding:
-            search_results = self._search_index("domain_knowledge", embedding, top_k * 2)
+            search_results = self._search_index(
+                MemoryType.DOMAIN_KNOWLEDGE, embedding, top_k * 2
+            )
             candidate_ids = [id for id, _ in search_results]
 
         with self._get_connection() as conn:
@@ -636,7 +827,9 @@ class SQLiteStorage(StorageBackend):
         """Get anti-patterns with optional vector search."""
         candidate_ids = None
         if embedding:
-            search_results = self._search_index("anti_patterns", embedding, top_k * 2)
+            search_results = self._search_index(
+                MemoryType.ANTI_PATTERNS, embedding, top_k * 2
+            )
             candidate_ids = [id for id, _ in search_results]
 
         with self._get_connection() as conn:
@@ -662,6 +855,175 @@ class SQLiteStorage(StorageBackend):
 
         return [self._row_to_anti_pattern(row) for row in rows]
 
+    # ==================== MULTI-AGENT MEMORY SHARING ====================
+
+    def get_heuristics_for_agents(
+        self,
+        project_id: str,
+        agents: List[str],
+        embedding: Optional[List[float]] = None,
+        top_k: int = 5,
+        min_confidence: float = 0.0,
+    ) -> List[Heuristic]:
+        """Get heuristics from multiple agents using optimized IN query."""
+        if not agents:
+            return []
+
+        candidate_ids = None
+        if embedding:
+            search_results = self._search_index(
+                MemoryType.HEURISTICS, embedding, top_k * 2 * len(agents)
+            )
+            candidate_ids = [id for id, _ in search_results]
+
+        with self._get_connection() as conn:
+            cursor = conn.cursor()
+
+            placeholders = ",".join("?" * len(agents))
+            query = f"SELECT * FROM heuristics WHERE project_id = ? AND confidence >= ? AND agent IN ({placeholders})"
+            params: List[Any] = [project_id, min_confidence] + list(agents)
+
+            if candidate_ids is not None:
+                id_placeholders = ",".join("?" * len(candidate_ids))
+                query += f" AND id IN ({id_placeholders})"
+                params.extend(candidate_ids)
+
+            query += " ORDER BY confidence DESC LIMIT ?"
+            params.append(top_k * len(agents))
+
+            cursor.execute(query, params)
+            rows = cursor.fetchall()
+
+        return [self._row_to_heuristic(row) for row in rows]
+
+    def get_outcomes_for_agents(
+        self,
+        project_id: str,
+        agents: List[str],
+        task_type: Optional[str] = None,
+        embedding: Optional[List[float]] = None,
+        top_k: int = 5,
+        success_only: bool = False,
+    ) -> List[Outcome]:
+        """Get outcomes from multiple agents using optimized IN query."""
+        if not agents:
+            return []
+
+        candidate_ids = None
+        if embedding:
+            search_results = self._search_index(
+                MemoryType.OUTCOMES, embedding, top_k * 2 * len(agents)
+            )
+            candidate_ids = [id for id, _ in search_results]
+
+        with self._get_connection() as conn:
+            cursor = conn.cursor()
+
+            placeholders = ",".join("?" * len(agents))
+            query = f"SELECT * FROM outcomes WHERE project_id = ? AND agent IN ({placeholders})"
+            params: List[Any] = [project_id] + list(agents)
+
+            if task_type:
+                query += " AND task_type = ?"
+                params.append(task_type)
+
+            if success_only:
+                query += " AND success = 1"
+
+            if candidate_ids is not None:
+                id_placeholders = ",".join("?" * len(candidate_ids))
+                query += f" AND id IN ({id_placeholders})"
+                params.extend(candidate_ids)
+
+            query += " ORDER BY timestamp DESC LIMIT ?"
+            params.append(top_k * len(agents))
+
+            cursor.execute(query, params)
+            rows = cursor.fetchall()
+
+        return [self._row_to_outcome(row) for row in rows]
+
+    def get_domain_knowledge_for_agents(
+        self,
+        project_id: str,
+        agents: List[str],
+        domain: Optional[str] = None,
+        embedding: Optional[List[float]] = None,
+        top_k: int = 5,
+    ) -> List[DomainKnowledge]:
+        """Get domain knowledge from multiple agents using optimized IN query."""
+        if not agents:
+            return []
+
+        candidate_ids = None
+        if embedding:
+            search_results = self._search_index(
+                MemoryType.DOMAIN_KNOWLEDGE, embedding, top_k * 2 * len(agents)
+            )
+            candidate_ids = [id for id, _ in search_results]
+
+        with self._get_connection() as conn:
+            cursor = conn.cursor()
+
+            placeholders = ",".join("?" * len(agents))
+            query = f"SELECT * FROM domain_knowledge WHERE project_id = ? AND agent IN ({placeholders})"
+            params: List[Any] = [project_id] + list(agents)
+
+            if domain:
+                query += " AND domain = ?"
+                params.append(domain)
+
+            if candidate_ids is not None:
+                id_placeholders = ",".join("?" * len(candidate_ids))
+                query += f" AND id IN ({id_placeholders})"
+                params.extend(candidate_ids)
+
+            query += " ORDER BY confidence DESC LIMIT ?"
+            params.append(top_k * len(agents))
+
+            cursor.execute(query, params)
+            rows = cursor.fetchall()
+
+        return [self._row_to_domain_knowledge(row) for row in rows]
+
+    def get_anti_patterns_for_agents(
+        self,
+        project_id: str,
+        agents: List[str],
+        embedding: Optional[List[float]] = None,
+        top_k: int = 5,
+    ) -> List[AntiPattern]:
+        """Get anti-patterns from multiple agents using optimized IN query."""
+        if not agents:
+            return []
+
+        candidate_ids = None
+        if embedding:
+            search_results = self._search_index(
+                MemoryType.ANTI_PATTERNS, embedding, top_k * 2 * len(agents)
+            )
+            candidate_ids = [id for id, _ in search_results]
+
+        with self._get_connection() as conn:
+            cursor = conn.cursor()
+
+            placeholders = ",".join("?" * len(agents))
+            query = f"SELECT * FROM anti_patterns WHERE project_id = ? AND agent IN ({placeholders})"
+            params: List[Any] = [project_id] + list(agents)
+
+            if candidate_ids is not None:
+                id_placeholders = ",".join("?" * len(candidate_ids))
+                query += f" AND id IN ({id_placeholders})"
+                params.extend(candidate_ids)
+
+            query += " ORDER BY occurrence_count DESC LIMIT ?"
+            params.append(top_k * len(agents))
+
+            cursor.execute(query, params)
+            rows = cursor.fetchall()
+
+        return [self._row_to_anti_pattern(row) for row in rows]
+
     # ==================== UPDATE OPERATIONS ====================
 
     def update_heuristic(
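All four _for_agents methods build their IN clause by joining "?" placeholders, so agent names (and candidate IDs) stay bound parameters; only the placeholder count is formatted into the SQL string. The pattern in isolation, against a throwaway table:

    import sqlite3

    conn = sqlite3.connect(":memory:")
    conn.execute("CREATE TABLE heur (id TEXT, agent TEXT, confidence REAL)")
    conn.executemany(
        "INSERT INTO heur VALUES (?, ?, ?)",
        [("h1", "helena", 0.9), ("h2", "victor", 0.7), ("h3", "other", 0.5)],
    )

    agents = ["helena", "victor"]
    placeholders = ",".join("?" * len(agents))  # -> "?,?"
    query = (
        f"SELECT id FROM heur WHERE agent IN ({placeholders}) "
        "ORDER BY confidence DESC"
    )
    print(conn.execute(query, agents).fetchall())  # [('h1',), ('h2',)]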
@@ -792,19 +1154,22 @@ class SQLiteStorage(StorageBackend):
         with self._get_connection() as conn:
             cursor = conn.cursor()
 
-            tables = ["heuristics", "outcomes", "domain_knowledge", "anti_patterns"]
-            for table in tables:
-                query = f"SELECT COUNT(*) FROM {table} WHERE project_id = ?"
-                params: List[Any] = [project_id]
-                if agent:
-                    query += " AND agent = ?"
-                    params.append(agent)
-                cursor.execute(query, params)
-                stats[f"{table}_count"] = cursor.fetchone()[0]
-
-            # Preferences don't have project_id
-            cursor.execute("SELECT COUNT(*) FROM preferences")
-            stats["preferences_count"] = cursor.fetchone()[0]
+            # Use canonical memory types for stats
+            for memory_type in MemoryType.ALL:
+                if memory_type == MemoryType.PREFERENCES:
+                    # Preferences don't have project_id
+                    cursor.execute(
+                        f"SELECT COUNT(*) FROM {SQLITE_TABLE_NAMES[memory_type]}"
+                    )
+                    stats[f"{memory_type}_count"] = cursor.fetchone()[0]
+                else:
+                    query = f"SELECT COUNT(*) FROM {SQLITE_TABLE_NAMES[memory_type]} WHERE project_id = ?"
+                    params: List[Any] = [project_id]
+                    if agent:
+                        query += " AND agent = ?"
+                        params.append(agent)
+                    cursor.execute(query, params)
+                    stats[f"{memory_type}_count"] = cursor.fetchone()[0]
 
             # Embedding counts
             cursor.execute("SELECT COUNT(*) FROM embeddings")
@@ -944,17 +1309,16 @@ class SQLiteStorage(StorageBackend):
         with self._get_connection() as conn:
             # Also remove from embedding index
             conn.execute(
-                "DELETE FROM embeddings WHERE memory_type = 'heuristic' AND memory_id = ?",
-                (heuristic_id,),
+                "DELETE FROM embeddings WHERE memory_type = ? AND memory_id = ?",
+                (MemoryType.HEURISTICS, heuristic_id),
             )
             cursor = conn.execute(
-                "DELETE FROM heuristics WHERE id = ?",
+                f"DELETE FROM {SQLITE_TABLE_NAMES[MemoryType.HEURISTICS]} WHERE id = ?",
                 (heuristic_id,),
             )
             if cursor.rowcount > 0:
-                # Rebuild index if we had one
-                if "heuristic" in self._indices:
-                    self._load_faiss_indices()
+                # Mark index as dirty for lazy rebuild on next search
+                self._index_dirty[MemoryType.HEURISTICS] = True
                 return True
             return False
 
@@ -963,16 +1327,16 @@ class SQLiteStorage(StorageBackend):
         with self._get_connection() as conn:
             # Also remove from embedding index
             conn.execute(
-                "DELETE FROM embeddings WHERE memory_type = 'outcome' AND memory_id = ?",
-                (outcome_id,),
+                "DELETE FROM embeddings WHERE memory_type = ? AND memory_id = ?",
+                (MemoryType.OUTCOMES, outcome_id),
            )
             cursor = conn.execute(
-                "DELETE FROM outcomes WHERE id = ?",
+                f"DELETE FROM {SQLITE_TABLE_NAMES[MemoryType.OUTCOMES]} WHERE id = ?",
                 (outcome_id,),
             )
             if cursor.rowcount > 0:
-                if "outcome" in self._indices:
-                    self._load_faiss_indices()
+                # Mark index as dirty for lazy rebuild on next search
+                self._index_dirty[MemoryType.OUTCOMES] = True
                 return True
             return False
 
@@ -981,16 +1345,16 @@ class SQLiteStorage(StorageBackend):
         with self._get_connection() as conn:
             # Also remove from embedding index
             conn.execute(
-                "DELETE FROM embeddings WHERE memory_type = 'domain_knowledge' AND memory_id = ?",
-                (knowledge_id,),
+                "DELETE FROM embeddings WHERE memory_type = ? AND memory_id = ?",
+                (MemoryType.DOMAIN_KNOWLEDGE, knowledge_id),
             )
             cursor = conn.execute(
-                "DELETE FROM domain_knowledge WHERE id = ?",
+                f"DELETE FROM {SQLITE_TABLE_NAMES[MemoryType.DOMAIN_KNOWLEDGE]} WHERE id = ?",
                 (knowledge_id,),
             )
             if cursor.rowcount > 0:
-                if "domain_knowledge" in self._indices:
-                    self._load_faiss_indices()
+                # Mark index as dirty for lazy rebuild on next search
+                self._index_dirty[MemoryType.DOMAIN_KNOWLEDGE] = True
                 return True
             return False
 
@@ -999,15 +1363,95 @@ class SQLiteStorage(StorageBackend):
         with self._get_connection() as conn:
             # Also remove from embedding index
             conn.execute(
-                "DELETE FROM embeddings WHERE memory_type = 'anti_pattern' AND memory_id = ?",
-                (anti_pattern_id,),
+                "DELETE FROM embeddings WHERE memory_type = ? AND memory_id = ?",
+                (MemoryType.ANTI_PATTERNS, anti_pattern_id),
             )
             cursor = conn.execute(
-                "DELETE FROM anti_patterns WHERE id = ?",
+                f"DELETE FROM {SQLITE_TABLE_NAMES[MemoryType.ANTI_PATTERNS]} WHERE id = ?",
                 (anti_pattern_id,),
             )
             if cursor.rowcount > 0:
-                if "anti_pattern" in self._indices:
-                    self._load_faiss_indices()
+                # Mark index as dirty for lazy rebuild on next search
+                self._index_dirty[MemoryType.ANTI_PATTERNS] = True
                 return True
             return False
+
+    # ==================== MIGRATION SUPPORT ====================
+
+    def _get_version_store(self):
+        """Get or create the version store."""
+        if self._version_store is None:
+            from alma.storage.migrations.version_stores import SQLiteVersionStore
+
+            self._version_store = SQLiteVersionStore(self.db_path)
+        return self._version_store
+
+    def _get_migration_runner(self):
+        """Get or create the migration runner."""
+        if self._migration_runner is None:
+            from alma.storage.migrations.runner import MigrationRunner
+            from alma.storage.migrations.versions import v1_0_0  # noqa: F401
+
+            self._migration_runner = MigrationRunner(
+                version_store=self._get_version_store(),
+                backend="sqlite",
+            )
+        return self._migration_runner
+
+    def _ensure_migrated(self) -> None:
+        """Ensure database is migrated to latest version."""
+        runner = self._get_migration_runner()
+        if runner.needs_migration():
+            with self._get_connection() as conn:
+                applied = runner.migrate(conn)
+                if applied:
+                    logger.info(f"Applied {len(applied)} migrations: {applied}")
+
+    def get_schema_version(self) -> Optional[str]:
+        """Get the current schema version."""
+        return self._get_version_store().get_current_version()
+
+    def get_migration_status(self) -> Dict[str, Any]:
+        """Get migration status information."""
+        runner = self._get_migration_runner()
+        status = runner.get_status()
+        status["migration_supported"] = True
+        return status
+
+    def migrate(
+        self,
+        target_version: Optional[str] = None,
+        dry_run: bool = False,
+    ) -> List[str]:
+        """
+        Apply pending schema migrations.
+
+        Args:
+            target_version: Optional target version (applies all if not specified)
+            dry_run: If True, show what would be done without making changes
+
+        Returns:
+            List of applied migration versions
+        """
+        runner = self._get_migration_runner()
+        with self._get_connection() as conn:
+            return runner.migrate(conn, target_version=target_version, dry_run=dry_run)
+
+    def rollback(
+        self,
+        target_version: str,
+        dry_run: bool = False,
+    ) -> List[str]:
+        """
+        Roll back schema to a previous version.
+
+        Args:
+            target_version: Version to roll back to
+            dry_run: If True, show what would be done without making changes
+
+        Returns:
+            List of rolled back migration versions
+        """
+        runner = self._get_migration_runner()
+        with self._get_connection() as conn:
+            return runner.rollback(conn, target_version=target_version, dry_run=dry_run)
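Together, migrate() and rollback() give the backend a small Alembic-style surface. A hedged usage sketch: the "1.0.0" version string is inferred from the v1_0_0 module this release ships, and dry_run is read here as returning the versions that would be touched, per the docstrings above:

    from pathlib import Path

    from alma.storage.sqlite_local import SQLiteStorage

    storage = SQLiteStorage(db_path=Path("alma.db"), auto_migrate=False)

    print("would apply:", storage.migrate(dry_run=True))  # preview, no writes
    storage.migrate()                                     # bring schema up to date
    print("now at:", storage.get_schema_version())

    print("would roll back:", storage.rollback("1.0.0", dry_run=True))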