alma-memory 0.5.1__py3-none-any.whl → 0.7.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (111) hide show
  1. alma/__init__.py +296 -226
  2. alma/compression/__init__.py +33 -0
  3. alma/compression/pipeline.py +980 -0
  4. alma/confidence/__init__.py +47 -47
  5. alma/confidence/engine.py +540 -540
  6. alma/confidence/types.py +351 -351
  7. alma/config/loader.py +157 -157
  8. alma/consolidation/__init__.py +23 -23
  9. alma/consolidation/engine.py +678 -678
  10. alma/consolidation/prompts.py +84 -84
  11. alma/core.py +1189 -430
  12. alma/domains/__init__.py +30 -30
  13. alma/domains/factory.py +359 -359
  14. alma/domains/schemas.py +448 -448
  15. alma/domains/types.py +272 -272
  16. alma/events/__init__.py +75 -75
  17. alma/events/emitter.py +285 -284
  18. alma/events/storage_mixin.py +246 -246
  19. alma/events/types.py +126 -126
  20. alma/events/webhook.py +425 -425
  21. alma/exceptions.py +49 -49
  22. alma/extraction/__init__.py +31 -31
  23. alma/extraction/auto_learner.py +265 -265
  24. alma/extraction/extractor.py +420 -420
  25. alma/graph/__init__.py +106 -106
  26. alma/graph/backends/__init__.py +32 -32
  27. alma/graph/backends/kuzu.py +624 -624
  28. alma/graph/backends/memgraph.py +432 -432
  29. alma/graph/backends/memory.py +236 -236
  30. alma/graph/backends/neo4j.py +417 -417
  31. alma/graph/base.py +159 -159
  32. alma/graph/extraction.py +198 -198
  33. alma/graph/store.py +860 -860
  34. alma/harness/__init__.py +35 -35
  35. alma/harness/base.py +386 -386
  36. alma/harness/domains.py +705 -705
  37. alma/initializer/__init__.py +37 -37
  38. alma/initializer/initializer.py +418 -418
  39. alma/initializer/types.py +250 -250
  40. alma/integration/__init__.py +62 -62
  41. alma/integration/claude_agents.py +444 -444
  42. alma/integration/helena.py +423 -423
  43. alma/integration/victor.py +471 -471
  44. alma/learning/__init__.py +101 -86
  45. alma/learning/decay.py +878 -0
  46. alma/learning/forgetting.py +1446 -1446
  47. alma/learning/heuristic_extractor.py +390 -390
  48. alma/learning/protocols.py +374 -374
  49. alma/learning/validation.py +346 -346
  50. alma/mcp/__init__.py +123 -45
  51. alma/mcp/__main__.py +156 -156
  52. alma/mcp/resources.py +122 -122
  53. alma/mcp/server.py +955 -591
  54. alma/mcp/tools.py +3254 -509
  55. alma/observability/__init__.py +91 -84
  56. alma/observability/config.py +302 -302
  57. alma/observability/guidelines.py +170 -0
  58. alma/observability/logging.py +424 -424
  59. alma/observability/metrics.py +583 -583
  60. alma/observability/tracing.py +440 -440
  61. alma/progress/__init__.py +21 -21
  62. alma/progress/tracker.py +607 -607
  63. alma/progress/types.py +250 -250
  64. alma/retrieval/__init__.py +134 -53
  65. alma/retrieval/budget.py +525 -0
  66. alma/retrieval/cache.py +1304 -1061
  67. alma/retrieval/embeddings.py +202 -202
  68. alma/retrieval/engine.py +850 -427
  69. alma/retrieval/modes.py +365 -0
  70. alma/retrieval/progressive.py +560 -0
  71. alma/retrieval/scoring.py +344 -344
  72. alma/retrieval/trust_scoring.py +637 -0
  73. alma/retrieval/verification.py +797 -0
  74. alma/session/__init__.py +19 -19
  75. alma/session/manager.py +442 -399
  76. alma/session/types.py +288 -288
  77. alma/storage/__init__.py +101 -90
  78. alma/storage/archive.py +233 -0
  79. alma/storage/azure_cosmos.py +1259 -1259
  80. alma/storage/base.py +1083 -583
  81. alma/storage/chroma.py +1443 -1443
  82. alma/storage/constants.py +103 -103
  83. alma/storage/file_based.py +614 -614
  84. alma/storage/migrations/__init__.py +21 -21
  85. alma/storage/migrations/base.py +321 -321
  86. alma/storage/migrations/runner.py +323 -323
  87. alma/storage/migrations/version_stores.py +337 -337
  88. alma/storage/migrations/versions/__init__.py +11 -11
  89. alma/storage/migrations/versions/v1_0_0.py +373 -373
  90. alma/storage/migrations/versions/v1_1_0_workflow_context.py +551 -0
  91. alma/storage/pinecone.py +1080 -1080
  92. alma/storage/postgresql.py +1948 -1559
  93. alma/storage/qdrant.py +1306 -1306
  94. alma/storage/sqlite_local.py +3041 -1457
  95. alma/testing/__init__.py +46 -46
  96. alma/testing/factories.py +301 -301
  97. alma/testing/mocks.py +389 -389
  98. alma/types.py +292 -264
  99. alma/utils/__init__.py +19 -0
  100. alma/utils/tokenizer.py +521 -0
  101. alma/workflow/__init__.py +83 -0
  102. alma/workflow/artifacts.py +170 -0
  103. alma/workflow/checkpoint.py +311 -0
  104. alma/workflow/context.py +228 -0
  105. alma/workflow/outcomes.py +189 -0
  106. alma/workflow/reducers.py +393 -0
  107. {alma_memory-0.5.1.dist-info → alma_memory-0.7.0.dist-info}/METADATA +210 -72
  108. alma_memory-0.7.0.dist-info/RECORD +112 -0
  109. alma_memory-0.5.1.dist-info/RECORD +0 -93
  110. {alma_memory-0.5.1.dist-info → alma_memory-0.7.0.dist-info}/WHEEL +0 -0
  111. {alma_memory-0.5.1.dist-info → alma_memory-0.7.0.dist-info}/top_level.txt +0 -0
@@ -1,1259 +1,1259 @@
1
- """
2
- ALMA Azure Cosmos DB Storage Backend.
3
-
4
- Production storage using Azure Cosmos DB with vector search capabilities.
5
- Uses Azure Key Vault for secrets management.
6
-
7
- Requirements:
8
- pip install azure-cosmos azure-identity azure-keyvault-secrets
9
-
10
- Configuration (config.yaml):
11
- alma:
12
- storage: azure
13
- azure:
14
- endpoint: ${AZURE_COSMOS_ENDPOINT}
15
- key: ${KEYVAULT:cosmos-db-key}
16
- database: alma-memory
17
- embedding_dim: 384
18
- """
19
-
20
- import logging
21
- from datetime import datetime, timezone
22
- from typing import Any, Dict, List, Optional
23
-
24
- from alma.storage.base import StorageBackend
25
- from alma.storage.constants import AZURE_COSMOS_CONTAINER_NAMES, MemoryType
26
- from alma.types import (
27
- AntiPattern,
28
- DomainKnowledge,
29
- Heuristic,
30
- Outcome,
31
- UserPreference,
32
- )
33
-
34
- logger = logging.getLogger(__name__)
35
-
36
# Attempt to load the Azure Cosmos SDK; degrade gracefully when it is absent
# so the module can still be imported (the backend raises at construction).
try:
    from azure.cosmos import CosmosClient, PartitionKey, exceptions
    from azure.cosmos.container import ContainerProxy
    from azure.cosmos.database import DatabaseProxy

    AZURE_COSMOS_AVAILABLE = True
except ImportError:
    AZURE_COSMOS_AVAILABLE = False
    # Placeholders so type hints still resolve when the SDK is missing.
    CosmosClient = None  # type: ignore
    PartitionKey = None  # type: ignore
    exceptions = None  # type: ignore
    ContainerProxy = Any  # type: ignore
    DatabaseProxy = Any  # type: ignore
    logger.warning(
        "azure-cosmos package not installed. Install with: pip install azure-cosmos"
    )
54
-
55
-
56
- class AzureCosmosStorage(StorageBackend):
57
- """
58
- Azure Cosmos DB storage backend with vector search.
59
-
60
- Uses:
61
- - NoSQL API for document storage
62
- - DiskANN vector indexing for similarity search
63
- - Partition key: project_id for efficient queries
64
-
65
- Container structure (uses canonical memory type names with alma_ prefix):
66
- - alma_heuristics: Heuristics with vector embeddings
67
- - alma_outcomes: Task outcomes with vector embeddings
68
- - alma_preferences: User preferences (no vectors)
69
- - alma_domain_knowledge: Domain knowledge with vector embeddings
70
- - alma_anti_patterns: Anti-patterns with vector embeddings
71
-
72
- Container names are derived from alma.storage.constants.AZURE_COSMOS_CONTAINER_NAMES
73
- for consistency across all storage backends.
74
- """
75
-
76
- # Use canonical container names from constants
77
- CONTAINER_NAMES = AZURE_COSMOS_CONTAINER_NAMES
78
-
79
- def __init__(
80
- self,
81
- endpoint: str,
82
- key: str,
83
- database_name: str = "alma-memory",
84
- embedding_dim: int = 384,
85
- create_if_not_exists: bool = True,
86
- ):
87
- """
88
- Initialize Azure Cosmos DB storage.
89
-
90
- Args:
91
- endpoint: Cosmos DB account endpoint
92
- key: Cosmos DB account key
93
- database_name: Name of the database
94
- embedding_dim: Dimension of embedding vectors
95
- create_if_not_exists: Create database/containers if missing
96
- """
97
- if not AZURE_COSMOS_AVAILABLE:
98
- raise ImportError(
99
- "azure-cosmos package required. Install with: pip install azure-cosmos"
100
- )
101
-
102
- self.endpoint = endpoint
103
- self.database_name = database_name
104
- self.embedding_dim = embedding_dim
105
-
106
- # Initialize client
107
- self.client = CosmosClient(endpoint, credential=key)
108
-
109
- # Get or create database
110
- if create_if_not_exists:
111
- self.database = self.client.create_database_if_not_exists(id=database_name)
112
- self._init_containers()
113
- else:
114
- self.database = self.client.get_database_client(database_name)
115
-
116
- # Cache container clients
117
- self._containers: Dict[str, ContainerProxy] = {}
118
- for key_name, container_name in self.CONTAINER_NAMES.items():
119
- self._containers[key_name] = self.database.get_container_client(
120
- container_name
121
- )
122
-
123
- # Cache for partition key mappings: {container_key: {doc_id: partition_key}}
124
- # This reduces RU consumption by avoiding cross-partition queries
125
- self._partition_key_cache: Dict[str, Dict[str, str]] = {
126
- mt: {} for mt in MemoryType.ALL
127
- }
128
- # Maximum cache size per container to prevent memory issues
129
- self._cache_max_size = 1000
130
-
131
- logger.info(f"Connected to Azure Cosmos DB: {database_name}")
132
-
133
- @classmethod
134
- def from_config(cls, config: Dict[str, Any]) -> "AzureCosmosStorage":
135
- """Create instance from configuration."""
136
- azure_config = config.get("azure", {})
137
-
138
- endpoint = azure_config.get("endpoint")
139
- key = azure_config.get("key")
140
-
141
- if not endpoint or not key:
142
- raise ValueError(
143
- "Azure Cosmos DB requires 'azure.endpoint' and 'azure.key' in config"
144
- )
145
-
146
- return cls(
147
- endpoint=endpoint,
148
- key=key,
149
- database_name=azure_config.get("database", "alma-memory"),
150
- embedding_dim=azure_config.get("embedding_dim", 384),
151
- create_if_not_exists=azure_config.get("create_if_not_exists", True),
152
- )
153
-
154
- def _init_containers(self):
155
- """Initialize containers with vector search indexing."""
156
- # Container configs with indexing policies (using canonical memory types)
157
- container_configs = {
158
- MemoryType.HEURISTICS: {
159
- "partition_key": "/project_id",
160
- "vector_path": "/embedding",
161
- "vector_indexes": True,
162
- },
163
- MemoryType.OUTCOMES: {
164
- "partition_key": "/project_id",
165
- "vector_path": "/embedding",
166
- "vector_indexes": True,
167
- },
168
- MemoryType.PREFERENCES: {
169
- "partition_key": "/user_id",
170
- "vector_path": None,
171
- "vector_indexes": False,
172
- },
173
- MemoryType.DOMAIN_KNOWLEDGE: {
174
- "partition_key": "/project_id",
175
- "vector_path": "/embedding",
176
- "vector_indexes": True,
177
- },
178
- MemoryType.ANTI_PATTERNS: {
179
- "partition_key": "/project_id",
180
- "vector_path": "/embedding",
181
- "vector_indexes": True,
182
- },
183
- }
184
-
185
- for key_name, cfg in container_configs.items():
186
- container_name = self.CONTAINER_NAMES[key_name]
187
-
188
- # Build indexing policy
189
- indexing_policy = {
190
- "indexingMode": "consistent",
191
- "automatic": True,
192
- "includedPaths": [{"path": "/*"}],
193
- "excludedPaths": [{"path": '/"_etag"/?'}],
194
- }
195
-
196
- # Add vector embedding policy if needed
197
- vector_embedding_policy = None
198
- if cfg["vector_indexes"] and cfg["vector_path"]:
199
- # Exclude vector path from regular indexing
200
- indexing_policy["excludedPaths"].append(
201
- {"path": f"{cfg['vector_path']}/*"}
202
- )
203
-
204
- # Vector embedding policy for DiskANN
205
- vector_embedding_policy = {
206
- "vectorEmbeddings": [
207
- {
208
- "path": cfg["vector_path"],
209
- "dataType": "float32",
210
- "dimensions": self.embedding_dim,
211
- "distanceFunction": "cosine",
212
- }
213
- ]
214
- }
215
-
216
- try:
217
- container_properties = {
218
- "id": container_name,
219
- "partition_key": PartitionKey(path=cfg["partition_key"]),
220
- "indexing_policy": indexing_policy,
221
- }
222
-
223
- if vector_embedding_policy:
224
- container_properties["vector_embedding_policy"] = (
225
- vector_embedding_policy
226
- )
227
-
228
- self.database.create_container_if_not_exists(**container_properties)
229
- logger.debug(f"Container ready: {container_name}")
230
-
231
- except exceptions.CosmosHttpResponseError as e:
232
- if e.status_code == 409:
233
- logger.debug(f"Container already exists: {container_name}")
234
- else:
235
- raise
236
-
237
- def _get_container(self, container_key: str) -> ContainerProxy:
238
- """Get container client by key."""
239
- return self._containers[container_key]
240
-
241
- def _cache_partition_key(
242
- self, container_key: str, doc_id: str, partition_key: str
243
- ) -> None:
244
- """
245
- Cache the partition key mapping for a document.
246
-
247
- This enables point reads for future operations, reducing RU consumption
248
- by avoiding expensive cross-partition queries.
249
- """
250
- cache = self._partition_key_cache[container_key]
251
-
252
- # Evict oldest entries if cache is full (simple FIFO eviction)
253
- if len(cache) >= self._cache_max_size:
254
- # Remove first 10% of entries
255
- keys_to_remove = list(cache.keys())[: self._cache_max_size // 10]
256
- for key in keys_to_remove:
257
- del cache[key]
258
-
259
- cache[doc_id] = partition_key
260
-
261
- def _get_cached_partition_key(
262
- self, container_key: str, doc_id: str
263
- ) -> Optional[str]:
264
- """
265
- Get cached partition key for a document if available.
266
-
267
- Returns None if the partition key is not cached.
268
- """
269
- return self._partition_key_cache.get(container_key, {}).get(doc_id)
270
-
271
- def _invalidate_partition_key_cache(self, container_key: str, doc_id: str) -> None:
272
- """Remove a document from the partition key cache."""
273
- cache = self._partition_key_cache.get(container_key, {})
274
- cache.pop(doc_id, None)
275
-
276
- def _point_read_document(
277
- self,
278
- container_key: str,
279
- doc_id: str,
280
- partition_key: Optional[str] = None,
281
- ) -> Optional[Dict[str, Any]]:
282
- """
283
- Attempt to read a document using a point read (1 RU) instead of a query.
284
-
285
- If partition_key is provided, performs a direct point read.
286
- If partition_key is not provided but is cached, uses the cached value.
287
- If neither is available, falls back to a cross-partition query.
288
-
289
- Args:
290
- container_key: The container key (e.g., 'heuristics', 'knowledge')
291
- doc_id: The document ID
292
- partition_key: Optional partition key for direct point read
293
-
294
- Returns:
295
- The document if found, None otherwise
296
- """
297
- container = self._get_container(container_key)
298
-
299
- # Try to get partition key from cache if not provided
300
- if partition_key is None:
301
- partition_key = self._get_cached_partition_key(container_key, doc_id)
302
-
303
- # If we have a partition key, use point read (1 RU)
304
- if partition_key is not None:
305
- try:
306
- doc = container.read_item(item=doc_id, partition_key=partition_key)
307
- # Refresh cache on successful read
308
- self._cache_partition_key(container_key, doc_id, partition_key)
309
- return doc
310
- except exceptions.CosmosResourceNotFoundError:
311
- # Document not found or partition key was wrong
312
- self._invalidate_partition_key_cache(container_key, doc_id)
313
- # Fall through to cross-partition query
314
- except Exception as e:
315
- logger.warning(f"Point read failed for {doc_id}: {e}")
316
- # Fall through to cross-partition query
317
-
318
- # Fallback: Cross-partition query (expensive but necessary without partition key)
319
- logger.debug(
320
- f"Using cross-partition query for {doc_id} in {container_key} "
321
- "(consider providing project_id for better performance)"
322
- )
323
- query = "SELECT * FROM c WHERE c.id = @id"
324
- items = list(
325
- container.query_items(
326
- query=query,
327
- parameters=[{"name": "@id", "value": doc_id}],
328
- enable_cross_partition_query=True,
329
- )
330
- )
331
-
332
- if items:
333
- doc = items[0]
334
- # Cache the partition key for future operations
335
- pk_field = self._get_partition_key_field(container_key)
336
- if pk_field and pk_field in doc:
337
- self._cache_partition_key(container_key, doc_id, doc[pk_field])
338
- return doc
339
-
340
- return None
341
-
342
- def _get_partition_key_field(self, container_key: str) -> Optional[str]:
343
- """Get the partition key field name for a container."""
344
- partition_key_fields = {
345
- MemoryType.HEURISTICS: "project_id",
346
- MemoryType.OUTCOMES: "project_id",
347
- MemoryType.PREFERENCES: "user_id",
348
- MemoryType.DOMAIN_KNOWLEDGE: "project_id",
349
- MemoryType.ANTI_PATTERNS: "project_id",
350
- }
351
- return partition_key_fields.get(container_key)
352
-
353
- # ==================== WRITE OPERATIONS ====================
354
-
355
- def save_heuristic(self, heuristic: Heuristic) -> str:
356
- """Save a heuristic."""
357
- container = self._get_container(MemoryType.HEURISTICS)
358
-
359
- doc = {
360
- "id": heuristic.id,
361
- "agent": heuristic.agent,
362
- "project_id": heuristic.project_id,
363
- "condition": heuristic.condition,
364
- "strategy": heuristic.strategy,
365
- "confidence": heuristic.confidence,
366
- "occurrence_count": heuristic.occurrence_count,
367
- "success_count": heuristic.success_count,
368
- "last_validated": (
369
- heuristic.last_validated.isoformat()
370
- if heuristic.last_validated
371
- else None
372
- ),
373
- "created_at": (
374
- heuristic.created_at.isoformat() if heuristic.created_at else None
375
- ),
376
- "metadata": heuristic.metadata or {},
377
- "embedding": heuristic.embedding,
378
- "type": "heuristic",
379
- }
380
-
381
- container.upsert_item(doc)
382
- # Cache partition key for efficient future updates
383
- self._cache_partition_key(
384
- MemoryType.HEURISTICS, heuristic.id, heuristic.project_id
385
- )
386
- logger.debug(f"Saved heuristic: {heuristic.id}")
387
- return heuristic.id
388
-
389
- def save_outcome(self, outcome: Outcome) -> str:
390
- """Save an outcome."""
391
- container = self._get_container(MemoryType.OUTCOMES)
392
-
393
- doc = {
394
- "id": outcome.id,
395
- "agent": outcome.agent,
396
- "project_id": outcome.project_id,
397
- "task_type": outcome.task_type,
398
- "task_description": outcome.task_description,
399
- "success": outcome.success,
400
- "strategy_used": outcome.strategy_used,
401
- "duration_ms": outcome.duration_ms,
402
- "error_message": outcome.error_message,
403
- "user_feedback": outcome.user_feedback,
404
- "timestamp": outcome.timestamp.isoformat() if outcome.timestamp else None,
405
- "metadata": outcome.metadata or {},
406
- "embedding": outcome.embedding,
407
- "type": "outcome",
408
- }
409
-
410
- container.upsert_item(doc)
411
- # Cache partition key for efficient future updates
412
- self._cache_partition_key(MemoryType.OUTCOMES, outcome.id, outcome.project_id)
413
- logger.debug(f"Saved outcome: {outcome.id}")
414
- return outcome.id
415
-
416
- def save_user_preference(self, preference: UserPreference) -> str:
417
- """Save a user preference."""
418
- container = self._get_container(MemoryType.PREFERENCES)
419
-
420
- doc = {
421
- "id": preference.id,
422
- "user_id": preference.user_id,
423
- "category": preference.category,
424
- "preference": preference.preference,
425
- "source": preference.source,
426
- "confidence": preference.confidence,
427
- "timestamp": (
428
- preference.timestamp.isoformat() if preference.timestamp else None
429
- ),
430
- "metadata": preference.metadata or {},
431
- "type": "preference",
432
- }
433
-
434
- container.upsert_item(doc)
435
- # Cache partition key for efficient future updates
436
- self._cache_partition_key(
437
- MemoryType.PREFERENCES, preference.id, preference.user_id
438
- )
439
- logger.debug(f"Saved preference: {preference.id}")
440
- return preference.id
441
-
442
- def save_domain_knowledge(self, knowledge: DomainKnowledge) -> str:
443
- """Save domain knowledge."""
444
- container = self._get_container(MemoryType.DOMAIN_KNOWLEDGE)
445
-
446
- doc = {
447
- "id": knowledge.id,
448
- "agent": knowledge.agent,
449
- "project_id": knowledge.project_id,
450
- "domain": knowledge.domain,
451
- "fact": knowledge.fact,
452
- "source": knowledge.source,
453
- "confidence": knowledge.confidence,
454
- "last_verified": (
455
- knowledge.last_verified.isoformat() if knowledge.last_verified else None
456
- ),
457
- "metadata": knowledge.metadata or {},
458
- "embedding": knowledge.embedding,
459
- "type": "domain_knowledge",
460
- }
461
-
462
- container.upsert_item(doc)
463
- # Cache partition key for efficient future updates
464
- self._cache_partition_key(
465
- MemoryType.DOMAIN_KNOWLEDGE, knowledge.id, knowledge.project_id
466
- )
467
- logger.debug(f"Saved domain knowledge: {knowledge.id}")
468
- return knowledge.id
469
-
470
- def save_anti_pattern(self, anti_pattern: AntiPattern) -> str:
471
- """Save an anti-pattern."""
472
- container = self._get_container(MemoryType.ANTI_PATTERNS)
473
-
474
- doc = {
475
- "id": anti_pattern.id,
476
- "agent": anti_pattern.agent,
477
- "project_id": anti_pattern.project_id,
478
- "pattern": anti_pattern.pattern,
479
- "why_bad": anti_pattern.why_bad,
480
- "better_alternative": anti_pattern.better_alternative,
481
- "occurrence_count": anti_pattern.occurrence_count,
482
- "last_seen": (
483
- anti_pattern.last_seen.isoformat() if anti_pattern.last_seen else None
484
- ),
485
- "created_at": (
486
- anti_pattern.created_at.isoformat() if anti_pattern.created_at else None
487
- ),
488
- "metadata": anti_pattern.metadata or {},
489
- "embedding": anti_pattern.embedding,
490
- "type": "anti_pattern",
491
- }
492
-
493
- container.upsert_item(doc)
494
- # Cache partition key for efficient future updates
495
- self._cache_partition_key(
496
- MemoryType.ANTI_PATTERNS, anti_pattern.id, anti_pattern.project_id
497
- )
498
- logger.debug(f"Saved anti-pattern: {anti_pattern.id}")
499
- return anti_pattern.id
500
-
501
- # ==================== READ OPERATIONS ====================
502
-
503
- def get_heuristics(
504
- self,
505
- project_id: str,
506
- agent: Optional[str] = None,
507
- embedding: Optional[List[float]] = None,
508
- top_k: int = 5,
509
- min_confidence: float = 0.0,
510
- ) -> List[Heuristic]:
511
- """Get heuristics with optional vector search."""
512
- container = self._get_container(MemoryType.HEURISTICS)
513
-
514
- if embedding:
515
- # Vector search query
516
- query = """
517
- SELECT TOP @top_k *
518
- FROM c
519
- WHERE c.project_id = @project_id
520
- AND c.confidence >= @min_confidence
521
- """
522
- if agent:
523
- query += " AND c.agent = @agent"
524
- query += " ORDER BY VectorDistance(c.embedding, @embedding)"
525
-
526
- parameters = [
527
- {"name": "@top_k", "value": top_k},
528
- {"name": "@project_id", "value": project_id},
529
- {"name": "@min_confidence", "value": min_confidence},
530
- {"name": "@embedding", "value": embedding},
531
- ]
532
- if agent:
533
- parameters.append({"name": "@agent", "value": agent})
534
-
535
- else:
536
- # Regular query
537
- query = """
538
- SELECT TOP @top_k *
539
- FROM c
540
- WHERE c.project_id = @project_id
541
- AND c.confidence >= @min_confidence
542
- """
543
- if agent:
544
- query += " AND c.agent = @agent"
545
- query += " ORDER BY c.confidence DESC"
546
-
547
- parameters = [
548
- {"name": "@top_k", "value": top_k},
549
- {"name": "@project_id", "value": project_id},
550
- {"name": "@min_confidence", "value": min_confidence},
551
- ]
552
- if agent:
553
- parameters.append({"name": "@agent", "value": agent})
554
-
555
- items = list(
556
- container.query_items(
557
- query=query,
558
- parameters=parameters,
559
- enable_cross_partition_query=False,
560
- partition_key=project_id,
561
- )
562
- )
563
-
564
- # Cache partition keys for efficient future updates
565
- for doc in items:
566
- self._cache_partition_key(
567
- MemoryType.HEURISTICS, doc["id"], doc["project_id"]
568
- )
569
-
570
- return [self._doc_to_heuristic(doc) for doc in items]
571
-
572
- def get_outcomes(
573
- self,
574
- project_id: str,
575
- agent: Optional[str] = None,
576
- task_type: Optional[str] = None,
577
- embedding: Optional[List[float]] = None,
578
- top_k: int = 5,
579
- success_only: bool = False,
580
- ) -> List[Outcome]:
581
- """Get outcomes with optional vector search."""
582
- container = self._get_container(MemoryType.OUTCOMES)
583
-
584
- if embedding:
585
- # Vector search query
586
- query = """
587
- SELECT TOP @top_k *
588
- FROM c
589
- WHERE c.project_id = @project_id
590
- """
591
- parameters = [
592
- {"name": "@top_k", "value": top_k},
593
- {"name": "@project_id", "value": project_id},
594
- {"name": "@embedding", "value": embedding},
595
- ]
596
-
597
- if agent:
598
- query += " AND c.agent = @agent"
599
- parameters.append({"name": "@agent", "value": agent})
600
- if task_type:
601
- query += " AND c.task_type = @task_type"
602
- parameters.append({"name": "@task_type", "value": task_type})
603
- if success_only:
604
- query += " AND c.success = true"
605
-
606
- query += " ORDER BY VectorDistance(c.embedding, @embedding)"
607
-
608
- else:
609
- # Regular query
610
- query = """
611
- SELECT TOP @top_k *
612
- FROM c
613
- WHERE c.project_id = @project_id
614
- """
615
- parameters = [
616
- {"name": "@top_k", "value": top_k},
617
- {"name": "@project_id", "value": project_id},
618
- ]
619
-
620
- if agent:
621
- query += " AND c.agent = @agent"
622
- parameters.append({"name": "@agent", "value": agent})
623
- if task_type:
624
- query += " AND c.task_type = @task_type"
625
- parameters.append({"name": "@task_type", "value": task_type})
626
- if success_only:
627
- query += " AND c.success = true"
628
-
629
- query += " ORDER BY c.timestamp DESC"
630
-
631
- items = list(
632
- container.query_items(
633
- query=query,
634
- parameters=parameters,
635
- enable_cross_partition_query=False,
636
- partition_key=project_id,
637
- )
638
- )
639
-
640
- # Cache partition keys for efficient future updates
641
- for doc in items:
642
- self._cache_partition_key(MemoryType.OUTCOMES, doc["id"], doc["project_id"])
643
-
644
- return [self._doc_to_outcome(doc) for doc in items]
645
-
646
- def get_user_preferences(
647
- self,
648
- user_id: str,
649
- category: Optional[str] = None,
650
- ) -> List[UserPreference]:
651
- """Get user preferences."""
652
- container = self._get_container(MemoryType.PREFERENCES)
653
-
654
- query = "SELECT * FROM c WHERE c.user_id = @user_id"
655
- parameters = [{"name": "@user_id", "value": user_id}]
656
-
657
- if category:
658
- query += " AND c.category = @category"
659
- parameters.append({"name": "@category", "value": category})
660
-
661
- items = list(
662
- container.query_items(
663
- query=query,
664
- parameters=parameters,
665
- enable_cross_partition_query=False,
666
- partition_key=user_id,
667
- )
668
- )
669
-
670
- # Cache partition keys for efficient future updates
671
- for doc in items:
672
- self._cache_partition_key(MemoryType.PREFERENCES, doc["id"], doc["user_id"])
673
-
674
- return [self._doc_to_preference(doc) for doc in items]
675
-
676
- def get_domain_knowledge(
677
- self,
678
- project_id: str,
679
- agent: Optional[str] = None,
680
- domain: Optional[str] = None,
681
- embedding: Optional[List[float]] = None,
682
- top_k: int = 5,
683
- ) -> List[DomainKnowledge]:
684
- """Get domain knowledge with optional vector search."""
685
- container = self._get_container(MemoryType.DOMAIN_KNOWLEDGE)
686
-
687
- if embedding:
688
- query = """
689
- SELECT TOP @top_k *
690
- FROM c
691
- WHERE c.project_id = @project_id
692
- """
693
- parameters = [
694
- {"name": "@top_k", "value": top_k},
695
- {"name": "@project_id", "value": project_id},
696
- {"name": "@embedding", "value": embedding},
697
- ]
698
-
699
- if agent:
700
- query += " AND c.agent = @agent"
701
- parameters.append({"name": "@agent", "value": agent})
702
- if domain:
703
- query += " AND c.domain = @domain"
704
- parameters.append({"name": "@domain", "value": domain})
705
-
706
- query += " ORDER BY VectorDistance(c.embedding, @embedding)"
707
-
708
- else:
709
- query = """
710
- SELECT TOP @top_k *
711
- FROM c
712
- WHERE c.project_id = @project_id
713
- """
714
- parameters = [
715
- {"name": "@top_k", "value": top_k},
716
- {"name": "@project_id", "value": project_id},
717
- ]
718
-
719
- if agent:
720
- query += " AND c.agent = @agent"
721
- parameters.append({"name": "@agent", "value": agent})
722
- if domain:
723
- query += " AND c.domain = @domain"
724
- parameters.append({"name": "@domain", "value": domain})
725
-
726
- query += " ORDER BY c.confidence DESC"
727
-
728
- items = list(
729
- container.query_items(
730
- query=query,
731
- parameters=parameters,
732
- enable_cross_partition_query=False,
733
- partition_key=project_id,
734
- )
735
- )
736
-
737
- # Cache partition keys for efficient future updates
738
- for doc in items:
739
- self._cache_partition_key(
740
- MemoryType.DOMAIN_KNOWLEDGE, doc["id"], doc["project_id"]
741
- )
742
-
743
- return [self._doc_to_domain_knowledge(doc) for doc in items]
744
-
745
- def get_anti_patterns(
746
- self,
747
- project_id: str,
748
- agent: Optional[str] = None,
749
- embedding: Optional[List[float]] = None,
750
- top_k: int = 5,
751
- ) -> List[AntiPattern]:
752
- """Get anti-patterns with optional vector search."""
753
- container = self._get_container(MemoryType.ANTI_PATTERNS)
754
-
755
- if embedding:
756
- query = """
757
- SELECT TOP @top_k *
758
- FROM c
759
- WHERE c.project_id = @project_id
760
- """
761
- parameters = [
762
- {"name": "@top_k", "value": top_k},
763
- {"name": "@project_id", "value": project_id},
764
- {"name": "@embedding", "value": embedding},
765
- ]
766
-
767
- if agent:
768
- query += " AND c.agent = @agent"
769
- parameters.append({"name": "@agent", "value": agent})
770
-
771
- query += " ORDER BY VectorDistance(c.embedding, @embedding)"
772
-
773
- else:
774
- query = """
775
- SELECT TOP @top_k *
776
- FROM c
777
- WHERE c.project_id = @project_id
778
- """
779
- parameters = [
780
- {"name": "@top_k", "value": top_k},
781
- {"name": "@project_id", "value": project_id},
782
- ]
783
-
784
- if agent:
785
- query += " AND c.agent = @agent"
786
- parameters.append({"name": "@agent", "value": agent})
787
-
788
- query += " ORDER BY c.occurrence_count DESC"
789
-
790
- items = list(
791
- container.query_items(
792
- query=query,
793
- parameters=parameters,
794
- enable_cross_partition_query=False,
795
- partition_key=project_id,
796
- )
797
- )
798
-
799
- # Cache partition keys for efficient future updates
800
- for doc in items:
801
- self._cache_partition_key(
802
- MemoryType.ANTI_PATTERNS, doc["id"], doc["project_id"]
803
- )
804
-
805
- return [self._doc_to_anti_pattern(doc) for doc in items]
806
-
807
- # ==================== UPDATE OPERATIONS ====================
808
-
809
- def update_heuristic(
810
- self,
811
- heuristic_id: str,
812
- updates: Dict[str, Any],
813
- project_id: Optional[str] = None,
814
- ) -> bool:
815
- """
816
- Update a heuristic's fields.
817
-
818
- Args:
819
- heuristic_id: The heuristic document ID
820
- updates: Dictionary of fields to update
821
- project_id: Optional partition key for efficient point read (1 RU).
822
- If not provided, will attempt cache lookup, then
823
- fall back to cross-partition query (more expensive).
824
-
825
- Returns:
826
- True if update succeeded, False if document not found
827
- """
828
- container = self._get_container(MemoryType.HEURISTICS)
829
-
830
- # Use optimized point read with cache fallback
831
- doc = self._point_read_document(MemoryType.HEURISTICS, heuristic_id, project_id)
832
-
833
- if not doc:
834
- return False
835
-
836
- # Apply updates
837
- for key, value in updates.items():
838
- if isinstance(value, datetime):
839
- doc[key] = value.isoformat()
840
- else:
841
- doc[key] = value
842
-
843
- container.replace_item(item=heuristic_id, body=doc)
844
- return True
845
-
846
- def increment_heuristic_occurrence(
847
- self,
848
- heuristic_id: str,
849
- success: bool,
850
- project_id: Optional[str] = None,
851
- ) -> bool:
852
- """
853
- Increment heuristic occurrence count.
854
-
855
- Args:
856
- heuristic_id: The heuristic document ID
857
- success: Whether this occurrence was successful
858
- project_id: Optional partition key for efficient point read (1 RU).
859
- If not provided, will attempt cache lookup, then
860
- fall back to cross-partition query (more expensive).
861
-
862
- Returns:
863
- True if update succeeded, False if document not found
864
- """
865
- container = self._get_container(MemoryType.HEURISTICS)
866
-
867
- # Use optimized point read with cache fallback
868
- doc = self._point_read_document(MemoryType.HEURISTICS, heuristic_id, project_id)
869
-
870
- if not doc:
871
- return False
872
-
873
- doc["occurrence_count"] = doc.get("occurrence_count", 0) + 1
874
- if success:
875
- doc["success_count"] = doc.get("success_count", 0) + 1
876
- doc["last_validated"] = datetime.now(timezone.utc).isoformat()
877
-
878
- container.replace_item(item=heuristic_id, body=doc)
879
- return True
880
-
881
- def update_heuristic_confidence(
882
- self,
883
- heuristic_id: str,
884
- new_confidence: float,
885
- project_id: Optional[str] = None,
886
- ) -> bool:
887
- """
888
- Update confidence score for a heuristic.
889
-
890
- Args:
891
- heuristic_id: The heuristic document ID
892
- new_confidence: The new confidence value
893
- project_id: Optional partition key for efficient point read (1 RU).
894
- If not provided, will attempt cache lookup, then
895
- fall back to cross-partition query (more expensive).
896
-
897
- Returns:
898
- True if update succeeded, False if document not found
899
-
900
- Performance Note:
901
- - With project_id: 1 RU for point read + write cost
902
- - With cached partition key: 1 RU for point read + write cost
903
- - Without either: Cross-partition query (variable, higher RUs)
904
- """
905
- container = self._get_container(MemoryType.HEURISTICS)
906
-
907
- # Use optimized point read with cache fallback
908
- doc = self._point_read_document(MemoryType.HEURISTICS, heuristic_id, project_id)
909
-
910
- if not doc:
911
- return False
912
-
913
- doc["confidence"] = new_confidence
914
-
915
- container.replace_item(item=heuristic_id, body=doc)
916
- logger.debug(
917
- f"Updated heuristic confidence: {heuristic_id} -> {new_confidence}"
918
- )
919
- return True
920
-
921
- def update_knowledge_confidence(
922
- self,
923
- knowledge_id: str,
924
- new_confidence: float,
925
- project_id: Optional[str] = None,
926
- ) -> bool:
927
- """
928
- Update confidence score for domain knowledge.
929
-
930
- Args:
931
- knowledge_id: The knowledge document ID
932
- new_confidence: The new confidence value
933
- project_id: Optional partition key for efficient point read (1 RU).
934
- If not provided, will attempt cache lookup, then
935
- fall back to cross-partition query (more expensive).
936
-
937
- Returns:
938
- True if update succeeded, False if document not found
939
-
940
- Performance Note:
941
- - With project_id: 1 RU for point read + write cost
942
- - With cached partition key: 1 RU for point read + write cost
943
- - Without either: Cross-partition query (variable, higher RUs)
944
- """
945
- container = self._get_container(MemoryType.DOMAIN_KNOWLEDGE)
946
-
947
- # Use optimized point read with cache fallback
948
- doc = self._point_read_document(
949
- MemoryType.DOMAIN_KNOWLEDGE, knowledge_id, project_id
950
- )
951
-
952
- if not doc:
953
- return False
954
-
955
- doc["confidence"] = new_confidence
956
-
957
- container.replace_item(item=knowledge_id, body=doc)
958
- logger.debug(
959
- f"Updated knowledge confidence: {knowledge_id} -> {new_confidence}"
960
- )
961
- return True
962
-
963
- # ==================== DELETE OPERATIONS ====================
964
-
965
- def delete_outcomes_older_than(
966
- self,
967
- project_id: str,
968
- older_than: datetime,
969
- agent: Optional[str] = None,
970
- ) -> int:
971
- """Delete old outcomes."""
972
- container = self._get_container(MemoryType.OUTCOMES)
973
-
974
- query = """
975
- SELECT c.id FROM c
976
- WHERE c.project_id = @project_id
977
- AND c.timestamp < @older_than
978
- """
979
- parameters = [
980
- {"name": "@project_id", "value": project_id},
981
- {"name": "@older_than", "value": older_than.isoformat()},
982
- ]
983
-
984
- if agent:
985
- query += " AND c.agent = @agent"
986
- parameters.append({"name": "@agent", "value": agent})
987
-
988
- items = list(
989
- container.query_items(
990
- query=query,
991
- parameters=parameters,
992
- enable_cross_partition_query=False,
993
- partition_key=project_id,
994
- )
995
- )
996
-
997
- deleted = 0
998
- for item in items:
999
- try:
1000
- container.delete_item(item=item["id"], partition_key=project_id)
1001
- deleted += 1
1002
- except exceptions.CosmosResourceNotFoundError:
1003
- pass
1004
-
1005
- logger.info(f"Deleted {deleted} old outcomes")
1006
- return deleted
1007
-
1008
- def delete_low_confidence_heuristics(
1009
- self,
1010
- project_id: str,
1011
- below_confidence: float,
1012
- agent: Optional[str] = None,
1013
- ) -> int:
1014
- """Delete low-confidence heuristics."""
1015
- container = self._get_container(MemoryType.HEURISTICS)
1016
-
1017
- query = """
1018
- SELECT c.id FROM c
1019
- WHERE c.project_id = @project_id
1020
- AND c.confidence < @below_confidence
1021
- """
1022
- parameters = [
1023
- {"name": "@project_id", "value": project_id},
1024
- {"name": "@below_confidence", "value": below_confidence},
1025
- ]
1026
-
1027
- if agent:
1028
- query += " AND c.agent = @agent"
1029
- parameters.append({"name": "@agent", "value": agent})
1030
-
1031
- items = list(
1032
- container.query_items(
1033
- query=query,
1034
- parameters=parameters,
1035
- enable_cross_partition_query=False,
1036
- partition_key=project_id,
1037
- )
1038
- )
1039
-
1040
- deleted = 0
1041
- for item in items:
1042
- try:
1043
- container.delete_item(item=item["id"], partition_key=project_id)
1044
- deleted += 1
1045
- except exceptions.CosmosResourceNotFoundError:
1046
- pass
1047
-
1048
- logger.info(f"Deleted {deleted} low-confidence heuristics")
1049
- return deleted
1050
-
1051
- def delete_heuristic(
1052
- self, heuristic_id: str, project_id: Optional[str] = None
1053
- ) -> bool:
1054
- """
1055
- Delete a specific heuristic by ID.
1056
-
1057
- Args:
1058
- heuristic_id: The heuristic document ID
1059
- project_id: Optional partition key for efficient point read (1 RU).
1060
- If not provided, will attempt cache lookup, then
1061
- fall back to cross-partition query (more expensive).
1062
-
1063
- Returns:
1064
- True if deletion succeeded, False if document not found
1065
- """
1066
- container = self._get_container(MemoryType.HEURISTICS)
1067
-
1068
- # Try to get partition key from cache if not provided
1069
- if project_id is None:
1070
- project_id = self._get_cached_partition_key(
1071
- MemoryType.HEURISTICS, heuristic_id
1072
- )
1073
-
1074
- # If we have a partition key, try direct delete
1075
- if project_id is not None:
1076
- try:
1077
- container.delete_item(item=heuristic_id, partition_key=project_id)
1078
- self._invalidate_partition_key_cache(
1079
- MemoryType.HEURISTICS, heuristic_id
1080
- )
1081
- return True
1082
- except exceptions.CosmosResourceNotFoundError:
1083
- # Document not found or partition key was wrong
1084
- self._invalidate_partition_key_cache(
1085
- MemoryType.HEURISTICS, heuristic_id
1086
- )
1087
- # Fall through to cross-partition lookup
1088
-
1089
- # Fallback: Cross-partition query to find the document
1090
- logger.debug(
1091
- f"Using cross-partition query for delete {heuristic_id} "
1092
- "(consider providing project_id for better performance)"
1093
- )
1094
- doc = self._point_read_document(MemoryType.HEURISTICS, heuristic_id, None)
1095
-
1096
- if not doc:
1097
- return False
1098
-
1099
- project_id = doc["project_id"]
1100
-
1101
- try:
1102
- container.delete_item(item=heuristic_id, partition_key=project_id)
1103
- self._invalidate_partition_key_cache(MemoryType.HEURISTICS, heuristic_id)
1104
- return True
1105
- except exceptions.CosmosResourceNotFoundError:
1106
- return False
1107
-
1108
- # ==================== STATS ====================
1109
-
1110
- def get_stats(
1111
- self,
1112
- project_id: str,
1113
- agent: Optional[str] = None,
1114
- ) -> Dict[str, Any]:
1115
- """Get memory statistics."""
1116
- stats = {
1117
- "project_id": project_id,
1118
- "agent": agent,
1119
- "storage_type": "azure_cosmos",
1120
- "database": self.database_name,
1121
- }
1122
-
1123
- # Count items in each container using canonical memory types
1124
- for memory_type in MemoryType.ALL:
1125
- container = self._get_container(memory_type)
1126
-
1127
- if memory_type == MemoryType.PREFERENCES:
1128
- # Preferences use user_id, not project_id
1129
- result = list(
1130
- container.query_items(
1131
- query="SELECT VALUE COUNT(1) FROM c",
1132
- enable_cross_partition_query=True,
1133
- )
1134
- )
1135
- else:
1136
- query = "SELECT VALUE COUNT(1) FROM c WHERE c.project_id = @project_id"
1137
- parameters = [{"name": "@project_id", "value": project_id}]
1138
-
1139
- if agent:
1140
- query = """
1141
- SELECT VALUE COUNT(1) FROM c
1142
- WHERE c.project_id = @project_id AND c.agent = @agent
1143
- """
1144
- parameters.append({"name": "@agent", "value": agent})
1145
-
1146
- result = list(
1147
- container.query_items(
1148
- query=query,
1149
- parameters=parameters,
1150
- enable_cross_partition_query=False,
1151
- partition_key=project_id,
1152
- )
1153
- )
1154
- stats[f"{memory_type}_count"] = result[0] if result else 0
1155
-
1156
- stats["total_count"] = sum(
1157
- stats.get(k, 0) for k in stats if k.endswith("_count")
1158
- )
1159
-
1160
- return stats
1161
-
1162
- # ==================== HELPERS ====================
1163
-
1164
- def _parse_datetime(self, value: Any) -> Optional[datetime]:
1165
- """Parse datetime from string."""
1166
- if value is None:
1167
- return None
1168
- if isinstance(value, datetime):
1169
- return value
1170
- try:
1171
- return datetime.fromisoformat(value.replace("Z", "+00:00"))
1172
- except (ValueError, AttributeError):
1173
- return None
1174
-
1175
- def _doc_to_heuristic(self, doc: Dict[str, Any]) -> Heuristic:
1176
- """Convert Cosmos DB document to Heuristic."""
1177
- return Heuristic(
1178
- id=doc["id"],
1179
- agent=doc["agent"],
1180
- project_id=doc["project_id"],
1181
- condition=doc["condition"],
1182
- strategy=doc["strategy"],
1183
- confidence=doc.get("confidence", 0.0),
1184
- occurrence_count=doc.get("occurrence_count", 0),
1185
- success_count=doc.get("success_count", 0),
1186
- last_validated=self._parse_datetime(doc.get("last_validated"))
1187
- or datetime.now(timezone.utc),
1188
- created_at=self._parse_datetime(doc.get("created_at"))
1189
- or datetime.now(timezone.utc),
1190
- embedding=doc.get("embedding"),
1191
- metadata=doc.get("metadata", {}),
1192
- )
1193
-
1194
- def _doc_to_outcome(self, doc: Dict[str, Any]) -> Outcome:
1195
- """Convert Cosmos DB document to Outcome."""
1196
- return Outcome(
1197
- id=doc["id"],
1198
- agent=doc["agent"],
1199
- project_id=doc["project_id"],
1200
- task_type=doc.get("task_type", "general"),
1201
- task_description=doc["task_description"],
1202
- success=doc.get("success", False),
1203
- strategy_used=doc.get("strategy_used", ""),
1204
- duration_ms=doc.get("duration_ms"),
1205
- error_message=doc.get("error_message"),
1206
- user_feedback=doc.get("user_feedback"),
1207
- timestamp=self._parse_datetime(doc.get("timestamp"))
1208
- or datetime.now(timezone.utc),
1209
- embedding=doc.get("embedding"),
1210
- metadata=doc.get("metadata", {}),
1211
- )
1212
-
1213
- def _doc_to_preference(self, doc: Dict[str, Any]) -> UserPreference:
1214
- """Convert Cosmos DB document to UserPreference."""
1215
- return UserPreference(
1216
- id=doc["id"],
1217
- user_id=doc["user_id"],
1218
- category=doc.get("category", "general"),
1219
- preference=doc["preference"],
1220
- source=doc.get("source", "unknown"),
1221
- confidence=doc.get("confidence", 1.0),
1222
- timestamp=self._parse_datetime(doc.get("timestamp"))
1223
- or datetime.now(timezone.utc),
1224
- metadata=doc.get("metadata", {}),
1225
- )
1226
-
1227
- def _doc_to_domain_knowledge(self, doc: Dict[str, Any]) -> DomainKnowledge:
1228
- """Convert Cosmos DB document to DomainKnowledge."""
1229
- return DomainKnowledge(
1230
- id=doc["id"],
1231
- agent=doc["agent"],
1232
- project_id=doc["project_id"],
1233
- domain=doc.get("domain", "general"),
1234
- fact=doc["fact"],
1235
- source=doc.get("source", "unknown"),
1236
- confidence=doc.get("confidence", 1.0),
1237
- last_verified=self._parse_datetime(doc.get("last_verified"))
1238
- or datetime.now(timezone.utc),
1239
- embedding=doc.get("embedding"),
1240
- metadata=doc.get("metadata", {}),
1241
- )
1242
-
1243
- def _doc_to_anti_pattern(self, doc: Dict[str, Any]) -> AntiPattern:
1244
- """Convert Cosmos DB document to AntiPattern."""
1245
- return AntiPattern(
1246
- id=doc["id"],
1247
- agent=doc["agent"],
1248
- project_id=doc["project_id"],
1249
- pattern=doc["pattern"],
1250
- why_bad=doc.get("why_bad", ""),
1251
- better_alternative=doc.get("better_alternative", ""),
1252
- occurrence_count=doc.get("occurrence_count", 1),
1253
- last_seen=self._parse_datetime(doc.get("last_seen"))
1254
- or datetime.now(timezone.utc),
1255
- created_at=self._parse_datetime(doc.get("created_at"))
1256
- or datetime.now(timezone.utc),
1257
- embedding=doc.get("embedding"),
1258
- metadata=doc.get("metadata", {}),
1259
- )
1
+ """
2
+ ALMA Azure Cosmos DB Storage Backend.
3
+
4
+ Production storage using Azure Cosmos DB with vector search capabilities.
5
+ Uses Azure Key Vault for secrets management.
6
+
7
+ Requirements:
8
+ pip install azure-cosmos azure-identity azure-keyvault-secrets
9
+
10
+ Configuration (config.yaml):
11
+ alma:
12
+ storage: azure
13
+ azure:
14
+ endpoint: ${AZURE_COSMOS_ENDPOINT}
15
+ key: ${KEYVAULT:cosmos-db-key}
16
+ database: alma-memory
17
+ embedding_dim: 384
18
+ """
19
+
20
+ import logging
21
+ from datetime import datetime, timezone
22
+ from typing import Any, Dict, List, Optional
23
+
24
+ from alma.storage.base import StorageBackend
25
+ from alma.storage.constants import AZURE_COSMOS_CONTAINER_NAMES, MemoryType
26
+ from alma.types import (
27
+ AntiPattern,
28
+ DomainKnowledge,
29
+ Heuristic,
30
+ Outcome,
31
+ UserPreference,
32
+ )
33
+
34
+ logger = logging.getLogger(__name__)
35
+
36
+ # Try to import Azure SDK
37
+ try:
38
+ from azure.cosmos import CosmosClient, PartitionKey, exceptions
39
+ from azure.cosmos.container import ContainerProxy
40
+ from azure.cosmos.database import DatabaseProxy
41
+
42
+ AZURE_COSMOS_AVAILABLE = True
43
+ except ImportError:
44
+ AZURE_COSMOS_AVAILABLE = False
45
+ # Define placeholders for type hints when SDK not available
46
+ CosmosClient = None # type: ignore
47
+ PartitionKey = None # type: ignore
48
+ exceptions = None # type: ignore
49
+ ContainerProxy = Any # type: ignore
50
+ DatabaseProxy = Any # type: ignore
51
+ logger.warning(
52
+ "azure-cosmos package not installed. Install with: pip install azure-cosmos"
53
+ )
54
+
55
+
56
+ class AzureCosmosStorage(StorageBackend):
57
+ """
58
+ Azure Cosmos DB storage backend with vector search.
59
+
60
+ Uses:
61
+ - NoSQL API for document storage
62
+ - DiskANN vector indexing for similarity search
63
+ - Partition key: project_id for efficient queries
64
+
65
+ Container structure (uses canonical memory type names with alma_ prefix):
66
+ - alma_heuristics: Heuristics with vector embeddings
67
+ - alma_outcomes: Task outcomes with vector embeddings
68
+ - alma_preferences: User preferences (no vectors)
69
+ - alma_domain_knowledge: Domain knowledge with vector embeddings
70
+ - alma_anti_patterns: Anti-patterns with vector embeddings
71
+
72
+ Container names are derived from alma.storage.constants.AZURE_COSMOS_CONTAINER_NAMES
73
+ for consistency across all storage backends.
74
+ """
75
+
76
+ # Use canonical container names from constants
77
+ CONTAINER_NAMES = AZURE_COSMOS_CONTAINER_NAMES
78
+
79
+ def __init__(
80
+ self,
81
+ endpoint: str,
82
+ key: str,
83
+ database_name: str = "alma-memory",
84
+ embedding_dim: int = 384,
85
+ create_if_not_exists: bool = True,
86
+ ):
87
+ """
88
+ Initialize Azure Cosmos DB storage.
89
+
90
+ Args:
91
+ endpoint: Cosmos DB account endpoint
92
+ key: Cosmos DB account key
93
+ database_name: Name of the database
94
+ embedding_dim: Dimension of embedding vectors
95
+ create_if_not_exists: Create database/containers if missing
96
+ """
97
+ if not AZURE_COSMOS_AVAILABLE:
98
+ raise ImportError(
99
+ "azure-cosmos package required. Install with: pip install azure-cosmos"
100
+ )
101
+
102
+ self.endpoint = endpoint
103
+ self.database_name = database_name
104
+ self.embedding_dim = embedding_dim
105
+
106
+ # Initialize client
107
+ self.client = CosmosClient(endpoint, credential=key)
108
+
109
+ # Get or create database
110
+ if create_if_not_exists:
111
+ self.database = self.client.create_database_if_not_exists(id=database_name)
112
+ self._init_containers()
113
+ else:
114
+ self.database = self.client.get_database_client(database_name)
115
+
116
+ # Cache container clients
117
+ self._containers: Dict[str, ContainerProxy] = {}
118
+ for key_name, container_name in self.CONTAINER_NAMES.items():
119
+ self._containers[key_name] = self.database.get_container_client(
120
+ container_name
121
+ )
122
+
123
+ # Cache for partition key mappings: {container_key: {doc_id: partition_key}}
124
+ # This reduces RU consumption by avoiding cross-partition queries
125
+ self._partition_key_cache: Dict[str, Dict[str, str]] = {
126
+ mt: {} for mt in MemoryType.ALL
127
+ }
128
+ # Maximum cache size per container to prevent memory issues
129
+ self._cache_max_size = 1000
130
+
131
+ logger.info(f"Connected to Azure Cosmos DB: {database_name}")
132
+
133
+ @classmethod
134
+ def from_config(cls, config: Dict[str, Any]) -> "AzureCosmosStorage":
135
+ """Create instance from configuration."""
136
+ azure_config = config.get("azure", {})
137
+
138
+ endpoint = azure_config.get("endpoint")
139
+ key = azure_config.get("key")
140
+
141
+ if not endpoint or not key:
142
+ raise ValueError(
143
+ "Azure Cosmos DB requires 'azure.endpoint' and 'azure.key' in config"
144
+ )
145
+
146
+ return cls(
147
+ endpoint=endpoint,
148
+ key=key,
149
+ database_name=azure_config.get("database", "alma-memory"),
150
+ embedding_dim=azure_config.get("embedding_dim", 384),
151
+ create_if_not_exists=azure_config.get("create_if_not_exists", True),
152
+ )
153
+
154
+ def _init_containers(self):
155
+ """Initialize containers with vector search indexing."""
156
+ # Container configs with indexing policies (using canonical memory types)
157
+ container_configs = {
158
+ MemoryType.HEURISTICS: {
159
+ "partition_key": "/project_id",
160
+ "vector_path": "/embedding",
161
+ "vector_indexes": True,
162
+ },
163
+ MemoryType.OUTCOMES: {
164
+ "partition_key": "/project_id",
165
+ "vector_path": "/embedding",
166
+ "vector_indexes": True,
167
+ },
168
+ MemoryType.PREFERENCES: {
169
+ "partition_key": "/user_id",
170
+ "vector_path": None,
171
+ "vector_indexes": False,
172
+ },
173
+ MemoryType.DOMAIN_KNOWLEDGE: {
174
+ "partition_key": "/project_id",
175
+ "vector_path": "/embedding",
176
+ "vector_indexes": True,
177
+ },
178
+ MemoryType.ANTI_PATTERNS: {
179
+ "partition_key": "/project_id",
180
+ "vector_path": "/embedding",
181
+ "vector_indexes": True,
182
+ },
183
+ }
184
+
185
+ for key_name, cfg in container_configs.items():
186
+ container_name = self.CONTAINER_NAMES[key_name]
187
+
188
+ # Build indexing policy
189
+ indexing_policy = {
190
+ "indexingMode": "consistent",
191
+ "automatic": True,
192
+ "includedPaths": [{"path": "/*"}],
193
+ "excludedPaths": [{"path": '/"_etag"/?'}],
194
+ }
195
+
196
+ # Add vector embedding policy if needed
197
+ vector_embedding_policy = None
198
+ if cfg["vector_indexes"] and cfg["vector_path"]:
199
+ # Exclude vector path from regular indexing
200
+ indexing_policy["excludedPaths"].append(
201
+ {"path": f"{cfg['vector_path']}/*"}
202
+ )
203
+
204
+ # Vector embedding policy for DiskANN
205
+ vector_embedding_policy = {
206
+ "vectorEmbeddings": [
207
+ {
208
+ "path": cfg["vector_path"],
209
+ "dataType": "float32",
210
+ "dimensions": self.embedding_dim,
211
+ "distanceFunction": "cosine",
212
+ }
213
+ ]
214
+ }
215
+
216
+ try:
217
+ container_properties = {
218
+ "id": container_name,
219
+ "partition_key": PartitionKey(path=cfg["partition_key"]),
220
+ "indexing_policy": indexing_policy,
221
+ }
222
+
223
+ if vector_embedding_policy:
224
+ container_properties["vector_embedding_policy"] = (
225
+ vector_embedding_policy
226
+ )
227
+
228
+ self.database.create_container_if_not_exists(**container_properties)
229
+ logger.debug(f"Container ready: {container_name}")
230
+
231
+ except exceptions.CosmosHttpResponseError as e:
232
+ if e.status_code == 409:
233
+ logger.debug(f"Container already exists: {container_name}")
234
+ else:
235
+ raise
236
+
237
+ def _get_container(self, container_key: str) -> ContainerProxy:
238
+ """Get container client by key."""
239
+ return self._containers[container_key]
240
+
241
+ def _cache_partition_key(
242
+ self, container_key: str, doc_id: str, partition_key: str
243
+ ) -> None:
244
+ """
245
+ Cache the partition key mapping for a document.
246
+
247
+ This enables point reads for future operations, reducing RU consumption
248
+ by avoiding expensive cross-partition queries.
249
+ """
250
+ cache = self._partition_key_cache[container_key]
251
+
252
+ # Evict oldest entries if cache is full (simple FIFO eviction)
253
+ if len(cache) >= self._cache_max_size:
254
+ # Remove first 10% of entries
255
+ keys_to_remove = list(cache.keys())[: self._cache_max_size // 10]
256
+ for key in keys_to_remove:
257
+ del cache[key]
258
+
259
+ cache[doc_id] = partition_key
260
+
261
+ def _get_cached_partition_key(
262
+ self, container_key: str, doc_id: str
263
+ ) -> Optional[str]:
264
+ """
265
+ Get cached partition key for a document if available.
266
+
267
+ Returns None if the partition key is not cached.
268
+ """
269
+ return self._partition_key_cache.get(container_key, {}).get(doc_id)
270
+
271
+ def _invalidate_partition_key_cache(self, container_key: str, doc_id: str) -> None:
272
+ """Remove a document from the partition key cache."""
273
+ cache = self._partition_key_cache.get(container_key, {})
274
+ cache.pop(doc_id, None)
275
+
276
+ def _point_read_document(
277
+ self,
278
+ container_key: str,
279
+ doc_id: str,
280
+ partition_key: Optional[str] = None,
281
+ ) -> Optional[Dict[str, Any]]:
282
+ """
283
+ Attempt to read a document using a point read (1 RU) instead of a query.
284
+
285
+ If partition_key is provided, performs a direct point read.
286
+ If partition_key is not provided but is cached, uses the cached value.
287
+ If neither is available, falls back to a cross-partition query.
288
+
289
+ Args:
290
+ container_key: The container key (e.g., 'heuristics', 'knowledge')
291
+ doc_id: The document ID
292
+ partition_key: Optional partition key for direct point read
293
+
294
+ Returns:
295
+ The document if found, None otherwise
296
+ """
297
+ container = self._get_container(container_key)
298
+
299
+ # Try to get partition key from cache if not provided
300
+ if partition_key is None:
301
+ partition_key = self._get_cached_partition_key(container_key, doc_id)
302
+
303
+ # If we have a partition key, use point read (1 RU)
304
+ if partition_key is not None:
305
+ try:
306
+ doc = container.read_item(item=doc_id, partition_key=partition_key)
307
+ # Refresh cache on successful read
308
+ self._cache_partition_key(container_key, doc_id, partition_key)
309
+ return doc
310
+ except exceptions.CosmosResourceNotFoundError:
311
+ # Document not found or partition key was wrong
312
+ self._invalidate_partition_key_cache(container_key, doc_id)
313
+ # Fall through to cross-partition query
314
+ except Exception as e:
315
+ logger.warning(f"Point read failed for {doc_id}: {e}")
316
+ # Fall through to cross-partition query
317
+
318
+ # Fallback: Cross-partition query (expensive but necessary without partition key)
319
+ logger.debug(
320
+ f"Using cross-partition query for {doc_id} in {container_key} "
321
+ "(consider providing project_id for better performance)"
322
+ )
323
+ query = "SELECT * FROM c WHERE c.id = @id"
324
+ items = list(
325
+ container.query_items(
326
+ query=query,
327
+ parameters=[{"name": "@id", "value": doc_id}],
328
+ enable_cross_partition_query=True,
329
+ )
330
+ )
331
+
332
+ if items:
333
+ doc = items[0]
334
+ # Cache the partition key for future operations
335
+ pk_field = self._get_partition_key_field(container_key)
336
+ if pk_field and pk_field in doc:
337
+ self._cache_partition_key(container_key, doc_id, doc[pk_field])
338
+ return doc
339
+
340
+ return None
341
+
342
+ def _get_partition_key_field(self, container_key: str) -> Optional[str]:
343
+ """Get the partition key field name for a container."""
344
+ partition_key_fields = {
345
+ MemoryType.HEURISTICS: "project_id",
346
+ MemoryType.OUTCOMES: "project_id",
347
+ MemoryType.PREFERENCES: "user_id",
348
+ MemoryType.DOMAIN_KNOWLEDGE: "project_id",
349
+ MemoryType.ANTI_PATTERNS: "project_id",
350
+ }
351
+ return partition_key_fields.get(container_key)
352
+
353
+ # ==================== WRITE OPERATIONS ====================
354
+
355
+ def save_heuristic(self, heuristic: Heuristic) -> str:
356
+ """Save a heuristic."""
357
+ container = self._get_container(MemoryType.HEURISTICS)
358
+
359
+ doc = {
360
+ "id": heuristic.id,
361
+ "agent": heuristic.agent,
362
+ "project_id": heuristic.project_id,
363
+ "condition": heuristic.condition,
364
+ "strategy": heuristic.strategy,
365
+ "confidence": heuristic.confidence,
366
+ "occurrence_count": heuristic.occurrence_count,
367
+ "success_count": heuristic.success_count,
368
+ "last_validated": (
369
+ heuristic.last_validated.isoformat()
370
+ if heuristic.last_validated
371
+ else None
372
+ ),
373
+ "created_at": (
374
+ heuristic.created_at.isoformat() if heuristic.created_at else None
375
+ ),
376
+ "metadata": heuristic.metadata or {},
377
+ "embedding": heuristic.embedding,
378
+ "type": "heuristic",
379
+ }
380
+
381
+ container.upsert_item(doc)
382
+ # Cache partition key for efficient future updates
383
+ self._cache_partition_key(
384
+ MemoryType.HEURISTICS, heuristic.id, heuristic.project_id
385
+ )
386
+ logger.debug(f"Saved heuristic: {heuristic.id}")
387
+ return heuristic.id
388
+
389
+ def save_outcome(self, outcome: Outcome) -> str:
390
+ """Save an outcome."""
391
+ container = self._get_container(MemoryType.OUTCOMES)
392
+
393
+ doc = {
394
+ "id": outcome.id,
395
+ "agent": outcome.agent,
396
+ "project_id": outcome.project_id,
397
+ "task_type": outcome.task_type,
398
+ "task_description": outcome.task_description,
399
+ "success": outcome.success,
400
+ "strategy_used": outcome.strategy_used,
401
+ "duration_ms": outcome.duration_ms,
402
+ "error_message": outcome.error_message,
403
+ "user_feedback": outcome.user_feedback,
404
+ "timestamp": outcome.timestamp.isoformat() if outcome.timestamp else None,
405
+ "metadata": outcome.metadata or {},
406
+ "embedding": outcome.embedding,
407
+ "type": "outcome",
408
+ }
409
+
410
+ container.upsert_item(doc)
411
+ # Cache partition key for efficient future updates
412
+ self._cache_partition_key(MemoryType.OUTCOMES, outcome.id, outcome.project_id)
413
+ logger.debug(f"Saved outcome: {outcome.id}")
414
+ return outcome.id
415
+
416
+ def save_user_preference(self, preference: UserPreference) -> str:
417
+ """Save a user preference."""
418
+ container = self._get_container(MemoryType.PREFERENCES)
419
+
420
+ doc = {
421
+ "id": preference.id,
422
+ "user_id": preference.user_id,
423
+ "category": preference.category,
424
+ "preference": preference.preference,
425
+ "source": preference.source,
426
+ "confidence": preference.confidence,
427
+ "timestamp": (
428
+ preference.timestamp.isoformat() if preference.timestamp else None
429
+ ),
430
+ "metadata": preference.metadata or {},
431
+ "type": "preference",
432
+ }
433
+
434
+ container.upsert_item(doc)
435
+ # Cache partition key for efficient future updates
436
+ self._cache_partition_key(
437
+ MemoryType.PREFERENCES, preference.id, preference.user_id
438
+ )
439
+ logger.debug(f"Saved preference: {preference.id}")
440
+ return preference.id
441
+
442
+ def save_domain_knowledge(self, knowledge: DomainKnowledge) -> str:
443
+ """Save domain knowledge."""
444
+ container = self._get_container(MemoryType.DOMAIN_KNOWLEDGE)
445
+
446
+ doc = {
447
+ "id": knowledge.id,
448
+ "agent": knowledge.agent,
449
+ "project_id": knowledge.project_id,
450
+ "domain": knowledge.domain,
451
+ "fact": knowledge.fact,
452
+ "source": knowledge.source,
453
+ "confidence": knowledge.confidence,
454
+ "last_verified": (
455
+ knowledge.last_verified.isoformat() if knowledge.last_verified else None
456
+ ),
457
+ "metadata": knowledge.metadata or {},
458
+ "embedding": knowledge.embedding,
459
+ "type": "domain_knowledge",
460
+ }
461
+
462
+ container.upsert_item(doc)
463
+ # Cache partition key for efficient future updates
464
+ self._cache_partition_key(
465
+ MemoryType.DOMAIN_KNOWLEDGE, knowledge.id, knowledge.project_id
466
+ )
467
+ logger.debug(f"Saved domain knowledge: {knowledge.id}")
468
+ return knowledge.id
469
+
470
+ def save_anti_pattern(self, anti_pattern: AntiPattern) -> str:
471
+ """Save an anti-pattern."""
472
+ container = self._get_container(MemoryType.ANTI_PATTERNS)
473
+
474
+ doc = {
475
+ "id": anti_pattern.id,
476
+ "agent": anti_pattern.agent,
477
+ "project_id": anti_pattern.project_id,
478
+ "pattern": anti_pattern.pattern,
479
+ "why_bad": anti_pattern.why_bad,
480
+ "better_alternative": anti_pattern.better_alternative,
481
+ "occurrence_count": anti_pattern.occurrence_count,
482
+ "last_seen": (
483
+ anti_pattern.last_seen.isoformat() if anti_pattern.last_seen else None
484
+ ),
485
+ "created_at": (
486
+ anti_pattern.created_at.isoformat() if anti_pattern.created_at else None
487
+ ),
488
+ "metadata": anti_pattern.metadata or {},
489
+ "embedding": anti_pattern.embedding,
490
+ "type": "anti_pattern",
491
+ }
492
+
493
+ container.upsert_item(doc)
494
+ # Cache partition key for efficient future updates
495
+ self._cache_partition_key(
496
+ MemoryType.ANTI_PATTERNS, anti_pattern.id, anti_pattern.project_id
497
+ )
498
+ logger.debug(f"Saved anti-pattern: {anti_pattern.id}")
499
+ return anti_pattern.id
500
+
501
+ # ==================== READ OPERATIONS ====================
502
+
503
+ def get_heuristics(
504
+ self,
505
+ project_id: str,
506
+ agent: Optional[str] = None,
507
+ embedding: Optional[List[float]] = None,
508
+ top_k: int = 5,
509
+ min_confidence: float = 0.0,
510
+ ) -> List[Heuristic]:
511
+ """Get heuristics with optional vector search."""
512
+ container = self._get_container(MemoryType.HEURISTICS)
513
+
514
+ if embedding:
515
+ # Vector search query
516
+ query = """
517
+ SELECT TOP @top_k *
518
+ FROM c
519
+ WHERE c.project_id = @project_id
520
+ AND c.confidence >= @min_confidence
521
+ """
522
+ if agent:
523
+ query += " AND c.agent = @agent"
524
+ query += " ORDER BY VectorDistance(c.embedding, @embedding)"
525
+
526
+ parameters = [
527
+ {"name": "@top_k", "value": top_k},
528
+ {"name": "@project_id", "value": project_id},
529
+ {"name": "@min_confidence", "value": min_confidence},
530
+ {"name": "@embedding", "value": embedding},
531
+ ]
532
+ if agent:
533
+ parameters.append({"name": "@agent", "value": agent})
534
+
535
+ else:
536
+ # Regular query
537
+ query = """
538
+ SELECT TOP @top_k *
539
+ FROM c
540
+ WHERE c.project_id = @project_id
541
+ AND c.confidence >= @min_confidence
542
+ """
543
+ if agent:
544
+ query += " AND c.agent = @agent"
545
+ query += " ORDER BY c.confidence DESC"
546
+
547
+ parameters = [
548
+ {"name": "@top_k", "value": top_k},
549
+ {"name": "@project_id", "value": project_id},
550
+ {"name": "@min_confidence", "value": min_confidence},
551
+ ]
552
+ if agent:
553
+ parameters.append({"name": "@agent", "value": agent})
554
+
555
+ items = list(
556
+ container.query_items(
557
+ query=query,
558
+ parameters=parameters,
559
+ enable_cross_partition_query=False,
560
+ partition_key=project_id,
561
+ )
562
+ )
563
+
564
+ # Cache partition keys for efficient future updates
565
+ for doc in items:
566
+ self._cache_partition_key(
567
+ MemoryType.HEURISTICS, doc["id"], doc["project_id"]
568
+ )
569
+
570
+ return [self._doc_to_heuristic(doc) for doc in items]
571
+
572
+ def get_outcomes(
573
+ self,
574
+ project_id: str,
575
+ agent: Optional[str] = None,
576
+ task_type: Optional[str] = None,
577
+ embedding: Optional[List[float]] = None,
578
+ top_k: int = 5,
579
+ success_only: bool = False,
580
+ ) -> List[Outcome]:
581
+ """Get outcomes with optional vector search."""
582
+ container = self._get_container(MemoryType.OUTCOMES)
583
+
584
+ if embedding:
585
+ # Vector search query
586
+ query = """
587
+ SELECT TOP @top_k *
588
+ FROM c
589
+ WHERE c.project_id = @project_id
590
+ """
591
+ parameters = [
592
+ {"name": "@top_k", "value": top_k},
593
+ {"name": "@project_id", "value": project_id},
594
+ {"name": "@embedding", "value": embedding},
595
+ ]
596
+
597
+ if agent:
598
+ query += " AND c.agent = @agent"
599
+ parameters.append({"name": "@agent", "value": agent})
600
+ if task_type:
601
+ query += " AND c.task_type = @task_type"
602
+ parameters.append({"name": "@task_type", "value": task_type})
603
+ if success_only:
604
+ query += " AND c.success = true"
605
+
606
+ query += " ORDER BY VectorDistance(c.embedding, @embedding)"
607
+
608
+ else:
609
+ # Regular query
610
+ query = """
611
+ SELECT TOP @top_k *
612
+ FROM c
613
+ WHERE c.project_id = @project_id
614
+ """
615
+ parameters = [
616
+ {"name": "@top_k", "value": top_k},
617
+ {"name": "@project_id", "value": project_id},
618
+ ]
619
+
620
+ if agent:
621
+ query += " AND c.agent = @agent"
622
+ parameters.append({"name": "@agent", "value": agent})
623
+ if task_type:
624
+ query += " AND c.task_type = @task_type"
625
+ parameters.append({"name": "@task_type", "value": task_type})
626
+ if success_only:
627
+ query += " AND c.success = true"
628
+
629
+ query += " ORDER BY c.timestamp DESC"
630
+
631
+ items = list(
632
+ container.query_items(
633
+ query=query,
634
+ parameters=parameters,
635
+ enable_cross_partition_query=False,
636
+ partition_key=project_id,
637
+ )
638
+ )
639
+
640
+ # Cache partition keys for efficient future updates
641
+ for doc in items:
642
+ self._cache_partition_key(MemoryType.OUTCOMES, doc["id"], doc["project_id"])
643
+
644
+ return [self._doc_to_outcome(doc) for doc in items]
645
+
646
+ def get_user_preferences(
647
+ self,
648
+ user_id: str,
649
+ category: Optional[str] = None,
650
+ ) -> List[UserPreference]:
651
+ """Get user preferences."""
652
+ container = self._get_container(MemoryType.PREFERENCES)
653
+
654
+ query = "SELECT * FROM c WHERE c.user_id = @user_id"
655
+ parameters = [{"name": "@user_id", "value": user_id}]
656
+
657
+ if category:
658
+ query += " AND c.category = @category"
659
+ parameters.append({"name": "@category", "value": category})
660
+
661
+ items = list(
662
+ container.query_items(
663
+ query=query,
664
+ parameters=parameters,
665
+ enable_cross_partition_query=False,
666
+ partition_key=user_id,
667
+ )
668
+ )
669
+
670
+ # Cache partition keys for efficient future updates
671
+ for doc in items:
672
+ self._cache_partition_key(MemoryType.PREFERENCES, doc["id"], doc["user_id"])
673
+
674
+ return [self._doc_to_preference(doc) for doc in items]
675
+
676
+ def get_domain_knowledge(
677
+ self,
678
+ project_id: str,
679
+ agent: Optional[str] = None,
680
+ domain: Optional[str] = None,
681
+ embedding: Optional[List[float]] = None,
682
+ top_k: int = 5,
683
+ ) -> List[DomainKnowledge]:
684
+ """Get domain knowledge with optional vector search."""
685
+ container = self._get_container(MemoryType.DOMAIN_KNOWLEDGE)
686
+
687
+ if embedding:
688
+ query = """
689
+ SELECT TOP @top_k *
690
+ FROM c
691
+ WHERE c.project_id = @project_id
692
+ """
693
+ parameters = [
694
+ {"name": "@top_k", "value": top_k},
695
+ {"name": "@project_id", "value": project_id},
696
+ {"name": "@embedding", "value": embedding},
697
+ ]
698
+
699
+ if agent:
700
+ query += " AND c.agent = @agent"
701
+ parameters.append({"name": "@agent", "value": agent})
702
+ if domain:
703
+ query += " AND c.domain = @domain"
704
+ parameters.append({"name": "@domain", "value": domain})
705
+
706
+ query += " ORDER BY VectorDistance(c.embedding, @embedding)"
707
+
708
+ else:
709
+ query = """
710
+ SELECT TOP @top_k *
711
+ FROM c
712
+ WHERE c.project_id = @project_id
713
+ """
714
+ parameters = [
715
+ {"name": "@top_k", "value": top_k},
716
+ {"name": "@project_id", "value": project_id},
717
+ ]
718
+
719
+ if agent:
720
+ query += " AND c.agent = @agent"
721
+ parameters.append({"name": "@agent", "value": agent})
722
+ if domain:
723
+ query += " AND c.domain = @domain"
724
+ parameters.append({"name": "@domain", "value": domain})
725
+
726
+ query += " ORDER BY c.confidence DESC"
727
+
728
+ items = list(
729
+ container.query_items(
730
+ query=query,
731
+ parameters=parameters,
732
+ enable_cross_partition_query=False,
733
+ partition_key=project_id,
734
+ )
735
+ )
736
+
737
+ # Cache partition keys for efficient future updates
738
+ for doc in items:
739
+ self._cache_partition_key(
740
+ MemoryType.DOMAIN_KNOWLEDGE, doc["id"], doc["project_id"]
741
+ )
742
+
743
+ return [self._doc_to_domain_knowledge(doc) for doc in items]
744
+
745
+ def get_anti_patterns(
746
+ self,
747
+ project_id: str,
748
+ agent: Optional[str] = None,
749
+ embedding: Optional[List[float]] = None,
750
+ top_k: int = 5,
751
+ ) -> List[AntiPattern]:
752
+ """Get anti-patterns with optional vector search."""
753
+ container = self._get_container(MemoryType.ANTI_PATTERNS)
754
+
755
+ if embedding:
756
+ query = """
757
+ SELECT TOP @top_k *
758
+ FROM c
759
+ WHERE c.project_id = @project_id
760
+ """
761
+ parameters = [
762
+ {"name": "@top_k", "value": top_k},
763
+ {"name": "@project_id", "value": project_id},
764
+ {"name": "@embedding", "value": embedding},
765
+ ]
766
+
767
+ if agent:
768
+ query += " AND c.agent = @agent"
769
+ parameters.append({"name": "@agent", "value": agent})
770
+
771
+ query += " ORDER BY VectorDistance(c.embedding, @embedding)"
772
+
773
+ else:
774
+ query = """
775
+ SELECT TOP @top_k *
776
+ FROM c
777
+ WHERE c.project_id = @project_id
778
+ """
779
+ parameters = [
780
+ {"name": "@top_k", "value": top_k},
781
+ {"name": "@project_id", "value": project_id},
782
+ ]
783
+
784
+ if agent:
785
+ query += " AND c.agent = @agent"
786
+ parameters.append({"name": "@agent", "value": agent})
787
+
788
+ query += " ORDER BY c.occurrence_count DESC"
789
+
790
+ items = list(
791
+ container.query_items(
792
+ query=query,
793
+ parameters=parameters,
794
+ enable_cross_partition_query=False,
795
+ partition_key=project_id,
796
+ )
797
+ )
798
+
799
+ # Cache partition keys for efficient future updates
800
+ for doc in items:
801
+ self._cache_partition_key(
802
+ MemoryType.ANTI_PATTERNS, doc["id"], doc["project_id"]
803
+ )
804
+
805
+ return [self._doc_to_anti_pattern(doc) for doc in items]
806
+
807
+ # ==================== UPDATE OPERATIONS ====================
808
+
809
+ def update_heuristic(
810
+ self,
811
+ heuristic_id: str,
812
+ updates: Dict[str, Any],
813
+ project_id: Optional[str] = None,
814
+ ) -> bool:
815
+ """
816
+ Update a heuristic's fields.
817
+
818
+ Args:
819
+ heuristic_id: The heuristic document ID
820
+ updates: Dictionary of fields to update
821
+ project_id: Optional partition key for efficient point read (1 RU).
822
+ If not provided, will attempt cache lookup, then
823
+ fall back to cross-partition query (more expensive).
824
+
825
+ Returns:
826
+ True if update succeeded, False if document not found
827
+ """
828
+ container = self._get_container(MemoryType.HEURISTICS)
829
+
830
+ # Use optimized point read with cache fallback
831
+ doc = self._point_read_document(MemoryType.HEURISTICS, heuristic_id, project_id)
832
+
833
+ if not doc:
834
+ return False
835
+
836
+ # Apply updates
837
+ for key, value in updates.items():
838
+ if isinstance(value, datetime):
839
+ doc[key] = value.isoformat()
840
+ else:
841
+ doc[key] = value
842
+
843
+ container.replace_item(item=heuristic_id, body=doc)
844
+ return True
845
+
846
+ def increment_heuristic_occurrence(
847
+ self,
848
+ heuristic_id: str,
849
+ success: bool,
850
+ project_id: Optional[str] = None,
851
+ ) -> bool:
852
+ """
853
+ Increment heuristic occurrence count.
854
+
855
+ Args:
856
+ heuristic_id: The heuristic document ID
857
+ success: Whether this occurrence was successful
858
+ project_id: Optional partition key for efficient point read (1 RU).
859
+ If not provided, will attempt cache lookup, then
860
+ fall back to cross-partition query (more expensive).
861
+
862
+ Returns:
863
+ True if update succeeded, False if document not found
864
+ """
865
+ container = self._get_container(MemoryType.HEURISTICS)
866
+
867
+ # Use optimized point read with cache fallback
868
+ doc = self._point_read_document(MemoryType.HEURISTICS, heuristic_id, project_id)
869
+
870
+ if not doc:
871
+ return False
872
+
873
+ doc["occurrence_count"] = doc.get("occurrence_count", 0) + 1
874
+ if success:
875
+ doc["success_count"] = doc.get("success_count", 0) + 1
876
+ doc["last_validated"] = datetime.now(timezone.utc).isoformat()
877
+
878
+ container.replace_item(item=heuristic_id, body=doc)
879
+ return True
880
+
881
+ def update_heuristic_confidence(
882
+ self,
883
+ heuristic_id: str,
884
+ new_confidence: float,
885
+ project_id: Optional[str] = None,
886
+ ) -> bool:
887
+ """
888
+ Update confidence score for a heuristic.
889
+
890
+ Args:
891
+ heuristic_id: The heuristic document ID
892
+ new_confidence: The new confidence value
893
+ project_id: Optional partition key for efficient point read (1 RU).
894
+ If not provided, will attempt cache lookup, then
895
+ fall back to cross-partition query (more expensive).
896
+
897
+ Returns:
898
+ True if update succeeded, False if document not found
899
+
900
+ Performance Note:
901
+ - With project_id: 1 RU for point read + write cost
902
+ - With cached partition key: 1 RU for point read + write cost
903
+ - Without either: Cross-partition query (variable, higher RUs)
904
+ """
905
+ container = self._get_container(MemoryType.HEURISTICS)
906
+
907
+ # Use optimized point read with cache fallback
908
+ doc = self._point_read_document(MemoryType.HEURISTICS, heuristic_id, project_id)
909
+
910
+ if not doc:
911
+ return False
912
+
913
+ doc["confidence"] = new_confidence
914
+
915
+ container.replace_item(item=heuristic_id, body=doc)
916
+ logger.debug(
917
+ f"Updated heuristic confidence: {heuristic_id} -> {new_confidence}"
918
+ )
919
+ return True
920
+
921
+ def update_knowledge_confidence(
922
+ self,
923
+ knowledge_id: str,
924
+ new_confidence: float,
925
+ project_id: Optional[str] = None,
926
+ ) -> bool:
927
+ """
928
+ Update confidence score for domain knowledge.
929
+
930
+ Args:
931
+ knowledge_id: The knowledge document ID
932
+ new_confidence: The new confidence value
933
+ project_id: Optional partition key for efficient point read (1 RU).
934
+ If not provided, will attempt cache lookup, then
935
+ fall back to cross-partition query (more expensive).
936
+
937
+ Returns:
938
+ True if update succeeded, False if document not found
939
+
940
+ Performance Note:
941
+ - With project_id: 1 RU for point read + write cost
942
+ - With cached partition key: 1 RU for point read + write cost
943
+ - Without either: Cross-partition query (variable, higher RUs)
944
+ """
945
+ container = self._get_container(MemoryType.DOMAIN_KNOWLEDGE)
946
+
947
+ # Use optimized point read with cache fallback
948
+ doc = self._point_read_document(
949
+ MemoryType.DOMAIN_KNOWLEDGE, knowledge_id, project_id
950
+ )
951
+
952
+ if not doc:
953
+ return False
954
+
955
+ doc["confidence"] = new_confidence
956
+
957
+ container.replace_item(item=knowledge_id, body=doc)
958
+ logger.debug(
959
+ f"Updated knowledge confidence: {knowledge_id} -> {new_confidence}"
960
+ )
961
+ return True
962
+
963
+ # ==================== DELETE OPERATIONS ====================
964
+
965
+ def delete_outcomes_older_than(
966
+ self,
967
+ project_id: str,
968
+ older_than: datetime,
969
+ agent: Optional[str] = None,
970
+ ) -> int:
971
+ """Delete old outcomes."""
972
+ container = self._get_container(MemoryType.OUTCOMES)
973
+
974
+ query = """
975
+ SELECT c.id FROM c
976
+ WHERE c.project_id = @project_id
977
+ AND c.timestamp < @older_than
978
+ """
979
+ parameters = [
980
+ {"name": "@project_id", "value": project_id},
981
+ {"name": "@older_than", "value": older_than.isoformat()},
982
+ ]
983
+
984
+ if agent:
985
+ query += " AND c.agent = @agent"
986
+ parameters.append({"name": "@agent", "value": agent})
987
+
988
+ items = list(
989
+ container.query_items(
990
+ query=query,
991
+ parameters=parameters,
992
+ enable_cross_partition_query=False,
993
+ partition_key=project_id,
994
+ )
995
+ )
996
+
997
+ deleted = 0
998
+ for item in items:
999
+ try:
1000
+ container.delete_item(item=item["id"], partition_key=project_id)
1001
+ deleted += 1
1002
+ except exceptions.CosmosResourceNotFoundError:
1003
+ pass
1004
+
1005
+ logger.info(f"Deleted {deleted} old outcomes")
1006
+ return deleted
1007
+
1008
+ def delete_low_confidence_heuristics(
1009
+ self,
1010
+ project_id: str,
1011
+ below_confidence: float,
1012
+ agent: Optional[str] = None,
1013
+ ) -> int:
1014
+ """Delete low-confidence heuristics."""
1015
+ container = self._get_container(MemoryType.HEURISTICS)
1016
+
1017
+ query = """
1018
+ SELECT c.id FROM c
1019
+ WHERE c.project_id = @project_id
1020
+ AND c.confidence < @below_confidence
1021
+ """
1022
+ parameters = [
1023
+ {"name": "@project_id", "value": project_id},
1024
+ {"name": "@below_confidence", "value": below_confidence},
1025
+ ]
1026
+
1027
+ if agent:
1028
+ query += " AND c.agent = @agent"
1029
+ parameters.append({"name": "@agent", "value": agent})
1030
+
1031
+ items = list(
1032
+ container.query_items(
1033
+ query=query,
1034
+ parameters=parameters,
1035
+ enable_cross_partition_query=False,
1036
+ partition_key=project_id,
1037
+ )
1038
+ )
1039
+
1040
+ deleted = 0
1041
+ for item in items:
1042
+ try:
1043
+ container.delete_item(item=item["id"], partition_key=project_id)
1044
+ deleted += 1
1045
+ except exceptions.CosmosResourceNotFoundError:
1046
+ pass
1047
+
1048
+ logger.info(f"Deleted {deleted} low-confidence heuristics")
1049
+ return deleted
1050
+
1051
+ def delete_heuristic(
1052
+ self, heuristic_id: str, project_id: Optional[str] = None
1053
+ ) -> bool:
1054
+ """
1055
+ Delete a specific heuristic by ID.
1056
+
1057
+ Args:
1058
+ heuristic_id: The heuristic document ID
1059
+ project_id: Optional partition key for efficient point read (1 RU).
1060
+ If not provided, will attempt cache lookup, then
1061
+ fall back to cross-partition query (more expensive).
1062
+
1063
+ Returns:
1064
+ True if deletion succeeded, False if document not found
1065
+ """
1066
+ container = self._get_container(MemoryType.HEURISTICS)
1067
+
1068
+ # Try to get partition key from cache if not provided
1069
+ if project_id is None:
1070
+ project_id = self._get_cached_partition_key(
1071
+ MemoryType.HEURISTICS, heuristic_id
1072
+ )
1073
+
1074
+ # If we have a partition key, try direct delete
1075
+ if project_id is not None:
1076
+ try:
1077
+ container.delete_item(item=heuristic_id, partition_key=project_id)
1078
+ self._invalidate_partition_key_cache(
1079
+ MemoryType.HEURISTICS, heuristic_id
1080
+ )
1081
+ return True
1082
+ except exceptions.CosmosResourceNotFoundError:
1083
+ # Document not found or partition key was wrong
1084
+ self._invalidate_partition_key_cache(
1085
+ MemoryType.HEURISTICS, heuristic_id
1086
+ )
1087
+ # Fall through to cross-partition lookup
1088
+
1089
+ # Fallback: Cross-partition query to find the document
1090
+ logger.debug(
1091
+ f"Using cross-partition query for delete {heuristic_id} "
1092
+ "(consider providing project_id for better performance)"
1093
+ )
1094
+ doc = self._point_read_document(MemoryType.HEURISTICS, heuristic_id, None)
1095
+
1096
+ if not doc:
1097
+ return False
1098
+
1099
+ project_id = doc["project_id"]
1100
+
1101
+ try:
1102
+ container.delete_item(item=heuristic_id, partition_key=project_id)
1103
+ self._invalidate_partition_key_cache(MemoryType.HEURISTICS, heuristic_id)
1104
+ return True
1105
+ except exceptions.CosmosResourceNotFoundError:
1106
+ return False
1107
+
1108
+ # ==================== STATS ====================
1109
+
1110
+ def get_stats(
1111
+ self,
1112
+ project_id: str,
1113
+ agent: Optional[str] = None,
1114
+ ) -> Dict[str, Any]:
1115
+ """Get memory statistics."""
1116
+ stats = {
1117
+ "project_id": project_id,
1118
+ "agent": agent,
1119
+ "storage_type": "azure_cosmos",
1120
+ "database": self.database_name,
1121
+ }
1122
+
1123
+ # Count items in each container using canonical memory types
1124
+ for memory_type in MemoryType.ALL:
1125
+ container = self._get_container(memory_type)
1126
+
1127
+ if memory_type == MemoryType.PREFERENCES:
1128
+ # Preferences use user_id, not project_id
1129
+ result = list(
1130
+ container.query_items(
1131
+ query="SELECT VALUE COUNT(1) FROM c",
1132
+ enable_cross_partition_query=True,
1133
+ )
1134
+ )
1135
+ else:
1136
+ query = "SELECT VALUE COUNT(1) FROM c WHERE c.project_id = @project_id"
1137
+ parameters = [{"name": "@project_id", "value": project_id}]
1138
+
1139
+ if agent:
1140
+ query = """
1141
+ SELECT VALUE COUNT(1) FROM c
1142
+ WHERE c.project_id = @project_id AND c.agent = @agent
1143
+ """
1144
+ parameters.append({"name": "@agent", "value": agent})
1145
+
1146
+ result = list(
1147
+ container.query_items(
1148
+ query=query,
1149
+ parameters=parameters,
1150
+ enable_cross_partition_query=False,
1151
+ partition_key=project_id,
1152
+ )
1153
+ )
1154
+ stats[f"{memory_type}_count"] = result[0] if result else 0
1155
+
1156
+ stats["total_count"] = sum(
1157
+ stats.get(k, 0) for k in stats if k.endswith("_count")
1158
+ )
1159
+
1160
+ return stats
1161
+
1162
+ # ==================== HELPERS ====================
1163
+
1164
+ def _parse_datetime(self, value: Any) -> Optional[datetime]:
1165
+ """Parse datetime from string."""
1166
+ if value is None:
1167
+ return None
1168
+ if isinstance(value, datetime):
1169
+ return value
1170
+ try:
1171
+ return datetime.fromisoformat(value.replace("Z", "+00:00"))
1172
+ except (ValueError, AttributeError):
1173
+ return None
1174
+
1175
+ def _doc_to_heuristic(self, doc: Dict[str, Any]) -> Heuristic:
1176
+ """Convert Cosmos DB document to Heuristic."""
1177
+ return Heuristic(
1178
+ id=doc["id"],
1179
+ agent=doc["agent"],
1180
+ project_id=doc["project_id"],
1181
+ condition=doc["condition"],
1182
+ strategy=doc["strategy"],
1183
+ confidence=doc.get("confidence", 0.0),
1184
+ occurrence_count=doc.get("occurrence_count", 0),
1185
+ success_count=doc.get("success_count", 0),
1186
+ last_validated=self._parse_datetime(doc.get("last_validated"))
1187
+ or datetime.now(timezone.utc),
1188
+ created_at=self._parse_datetime(doc.get("created_at"))
1189
+ or datetime.now(timezone.utc),
1190
+ embedding=doc.get("embedding"),
1191
+ metadata=doc.get("metadata", {}),
1192
+ )
1193
+
1194
+ def _doc_to_outcome(self, doc: Dict[str, Any]) -> Outcome:
1195
+ """Convert Cosmos DB document to Outcome."""
1196
+ return Outcome(
1197
+ id=doc["id"],
1198
+ agent=doc["agent"],
1199
+ project_id=doc["project_id"],
1200
+ task_type=doc.get("task_type", "general"),
1201
+ task_description=doc["task_description"],
1202
+ success=doc.get("success", False),
1203
+ strategy_used=doc.get("strategy_used", ""),
1204
+ duration_ms=doc.get("duration_ms"),
1205
+ error_message=doc.get("error_message"),
1206
+ user_feedback=doc.get("user_feedback"),
1207
+ timestamp=self._parse_datetime(doc.get("timestamp"))
1208
+ or datetime.now(timezone.utc),
1209
+ embedding=doc.get("embedding"),
1210
+ metadata=doc.get("metadata", {}),
1211
+ )
1212
+
1213
+ def _doc_to_preference(self, doc: Dict[str, Any]) -> UserPreference:
1214
+ """Convert Cosmos DB document to UserPreference."""
1215
+ return UserPreference(
1216
+ id=doc["id"],
1217
+ user_id=doc["user_id"],
1218
+ category=doc.get("category", "general"),
1219
+ preference=doc["preference"],
1220
+ source=doc.get("source", "unknown"),
1221
+ confidence=doc.get("confidence", 1.0),
1222
+ timestamp=self._parse_datetime(doc.get("timestamp"))
1223
+ or datetime.now(timezone.utc),
1224
+ metadata=doc.get("metadata", {}),
1225
+ )
1226
+
1227
+ def _doc_to_domain_knowledge(self, doc: Dict[str, Any]) -> DomainKnowledge:
1228
+ """Convert Cosmos DB document to DomainKnowledge."""
1229
+ return DomainKnowledge(
1230
+ id=doc["id"],
1231
+ agent=doc["agent"],
1232
+ project_id=doc["project_id"],
1233
+ domain=doc.get("domain", "general"),
1234
+ fact=doc["fact"],
1235
+ source=doc.get("source", "unknown"),
1236
+ confidence=doc.get("confidence", 1.0),
1237
+ last_verified=self._parse_datetime(doc.get("last_verified"))
1238
+ or datetime.now(timezone.utc),
1239
+ embedding=doc.get("embedding"),
1240
+ metadata=doc.get("metadata", {}),
1241
+ )
1242
+
1243
+ def _doc_to_anti_pattern(self, doc: Dict[str, Any]) -> AntiPattern:
1244
+ """Convert Cosmos DB document to AntiPattern."""
1245
+ return AntiPattern(
1246
+ id=doc["id"],
1247
+ agent=doc["agent"],
1248
+ project_id=doc["project_id"],
1249
+ pattern=doc["pattern"],
1250
+ why_bad=doc.get("why_bad", ""),
1251
+ better_alternative=doc.get("better_alternative", ""),
1252
+ occurrence_count=doc.get("occurrence_count", 1),
1253
+ last_seen=self._parse_datetime(doc.get("last_seen"))
1254
+ or datetime.now(timezone.utc),
1255
+ created_at=self._parse_datetime(doc.get("created_at"))
1256
+ or datetime.now(timezone.utc),
1257
+ embedding=doc.get("embedding"),
1258
+ metadata=doc.get("metadata", {}),
1259
+ )