PyPI - alma-memory - Versions diffs - 0.5.1__py3-none-any.whl → 0.7.0__py3-none-any.whl - Mend

alma-memory 0.5.1__py3-none-any.whl → 0.7.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (111)

alma/__init__.py +296 -226
alma/compression/__init__.py +33 -0
alma/compression/pipeline.py +980 -0
alma/confidence/__init__.py +47 -47
alma/confidence/engine.py +540 -540
alma/confidence/types.py +351 -351
alma/config/loader.py +157 -157
alma/consolidation/__init__.py +23 -23
alma/consolidation/engine.py +678 -678
alma/consolidation/prompts.py +84 -84
alma/core.py +1189 -430
alma/domains/__init__.py +30 -30
alma/domains/factory.py +359 -359
alma/domains/schemas.py +448 -448
alma/domains/types.py +272 -272
alma/events/__init__.py +75 -75
alma/events/emitter.py +285 -284
alma/events/storage_mixin.py +246 -246
alma/events/types.py +126 -126
alma/events/webhook.py +425 -425
alma/exceptions.py +49 -49
alma/extraction/__init__.py +31 -31
alma/extraction/auto_learner.py +265 -265
alma/extraction/extractor.py +420 -420
alma/graph/__init__.py +106 -106
alma/graph/backends/__init__.py +32 -32
alma/graph/backends/kuzu.py +624 -624
alma/graph/backends/memgraph.py +432 -432
alma/graph/backends/memory.py +236 -236
alma/graph/backends/neo4j.py +417 -417
alma/graph/base.py +159 -159
alma/graph/extraction.py +198 -198
alma/graph/store.py +860 -860
alma/harness/__init__.py +35 -35
alma/harness/base.py +386 -386
alma/harness/domains.py +705 -705
alma/initializer/__init__.py +37 -37
alma/initializer/initializer.py +418 -418
alma/initializer/types.py +250 -250
alma/integration/__init__.py +62 -62
alma/integration/claude_agents.py +444 -444
alma/integration/helena.py +423 -423
alma/integration/victor.py +471 -471
alma/learning/__init__.py +101 -86
alma/learning/decay.py +878 -0
alma/learning/forgetting.py +1446 -1446
alma/learning/heuristic_extractor.py +390 -390
alma/learning/protocols.py +374 -374
alma/learning/validation.py +346 -346
alma/mcp/__init__.py +123 -45
alma/mcp/__main__.py +156 -156
alma/mcp/resources.py +122 -122
alma/mcp/server.py +955 -591
alma/mcp/tools.py +3254 -509
alma/observability/__init__.py +91 -84
alma/observability/config.py +302 -302
alma/observability/guidelines.py +170 -0
alma/observability/logging.py +424 -424
alma/observability/metrics.py +583 -583
alma/observability/tracing.py +440 -440
alma/progress/__init__.py +21 -21
alma/progress/tracker.py +607 -607
alma/progress/types.py +250 -250
alma/retrieval/__init__.py +134 -53
alma/retrieval/budget.py +525 -0
alma/retrieval/cache.py +1304 -1061
alma/retrieval/embeddings.py +202 -202
alma/retrieval/engine.py +850 -427
alma/retrieval/modes.py +365 -0
alma/retrieval/progressive.py +560 -0
alma/retrieval/scoring.py +344 -344
alma/retrieval/trust_scoring.py +637 -0
alma/retrieval/verification.py +797 -0
alma/session/__init__.py +19 -19
alma/session/manager.py +442 -399
alma/session/types.py +288 -288
alma/storage/__init__.py +101 -90
alma/storage/archive.py +233 -0
alma/storage/azure_cosmos.py +1259 -1259
alma/storage/base.py +1083 -583
alma/storage/chroma.py +1443 -1443
alma/storage/constants.py +103 -103
alma/storage/file_based.py +614 -614
alma/storage/migrations/__init__.py +21 -21
alma/storage/migrations/base.py +321 -321
alma/storage/migrations/runner.py +323 -323
alma/storage/migrations/version_stores.py +337 -337
alma/storage/migrations/versions/__init__.py +11 -11
alma/storage/migrations/versions/v1_0_0.py +373 -373
alma/storage/migrations/versions/v1_1_0_workflow_context.py +551 -0
alma/storage/pinecone.py +1080 -1080
alma/storage/postgresql.py +1948 -1559
alma/storage/qdrant.py +1306 -1306
alma/storage/sqlite_local.py +3041 -1457
alma/testing/__init__.py +46 -46
alma/testing/factories.py +301 -301
alma/testing/mocks.py +389 -389
alma/types.py +292 -264
alma/utils/__init__.py +19 -0
alma/utils/tokenizer.py +521 -0
alma/workflow/__init__.py +83 -0
alma/workflow/artifacts.py +170 -0
alma/workflow/checkpoint.py +311 -0
alma/workflow/context.py +228 -0
alma/workflow/outcomes.py +189 -0
alma/workflow/reducers.py +393 -0
{alma_memory-0.5.1.dist-info → alma_memory-0.7.0.dist-info}/METADATA +210 -72
alma_memory-0.7.0.dist-info/RECORD +112 -0
alma_memory-0.5.1.dist-info/RECORD +0 -93
{alma_memory-0.5.1.dist-info → alma_memory-0.7.0.dist-info}/WHEEL +0 -0
{alma_memory-0.5.1.dist-info → alma_memory-0.7.0.dist-info}/top_level.txt +0 -0

alma/learning/protocols.py CHANGED

@@ -1,374 +1,374 @@
-"""
-ALMA Learning Protocols.
-Defines how agents learn from outcomes while respecting scope constraints.
-"""
-import logging
-import uuid
-from datetime import datetime, timedelta, timezone
-from typing import TYPE_CHECKING, Dict, Optional
-from alma.storage.base import StorageBackend
-from alma.types import (
-    AntiPattern,
-    DomainKnowledge,
-    Heuristic,
-    MemoryScope,
-    Outcome,
-    UserPreference,
-)
-if TYPE_CHECKING:
-    from alma.retrieval.embeddings import EmbeddingProvider
-logger = logging.getLogger(__name__)
-class LearningProtocol:
-    """
-    Manages how agents learn from task outcomes.
-    Key principles:
-    - Validate scope before any learning
-    - Require minimum occurrences before creating heuristics
-    - Support forgetting to prevent memory bloat
-    """
-    def __init__(
-        self,
-        storage: StorageBackend,
-        scopes: Dict[str, MemoryScope],
-        embedder: Optional["EmbeddingProvider"] = None,
-        similarity_threshold: float = 0.75,
-    ):
-        """
-        Initialize learning protocol.
-        Args:
-            storage: Storage backend for persistence
-            scopes: Dict of agent_name -> MemoryScope
-            embedder: Optional embedding provider for semantic similarity
-            similarity_threshold: Cosine similarity threshold for strategy matching (default 0.75)
-        """
-        self.storage = storage
-        self.scopes = scopes
-        self.embedder = embedder
-        self.similarity_threshold = similarity_threshold
-    def learn(
-        self,
-        agent: str,
-        project_id: str,
-        task: str,
-        outcome: bool,
-        strategy_used: str,
-        task_type: Optional[str] = None,
-        duration_ms: Optional[int] = None,
-        error_message: Optional[str] = None,
-        feedback: Optional[str] = None,
-    ) -> Outcome:
-        """
-        Learn from a task outcome.
-        Creates an Outcome record and potentially updates/creates heuristics.
-        Args:
-            agent: Agent that executed the task
-            project_id: Project context
-            task: Task description
-            outcome: True if successful, False if failed
-            strategy_used: The approach taken
-            task_type: Category for grouping
-            duration_ms: Execution time
-            error_message: Error details if failed
-            feedback: User feedback
-        Returns:
-            The created Outcome record
-        """
-        # Validate agent has a scope (warn but don't block)
-        scope = self.scopes.get(agent)
-        if scope is None:
-            logger.warning(f"Agent '{agent}' has no defined scope")
-        # Create outcome record
-        outcome_record = Outcome(
-            id=f"out_{uuid.uuid4().hex[:12]}",
-            agent=agent,
-            project_id=project_id,
-            task_type=task_type or self._infer_task_type(task),
-            task_description=task,
-            success=outcome,
-            strategy_used=strategy_used,
-            duration_ms=duration_ms,
-            error_message=error_message,
-            user_feedback=feedback,
-            timestamp=datetime.now(timezone.utc),
-        )
-        # Save outcome
-        self.storage.save_outcome(outcome_record)
-        logger.info(
-            f"Recorded outcome for {agent}: {'success' if outcome else 'failure'}"
-        )
-        # Check if we should create/update a heuristic
-        self._maybe_create_heuristic(
-            agent=agent,
-            project_id=project_id,
-            task_type=outcome_record.task_type,
-            strategy=strategy_used,
-            success=outcome,
-            scope=scope,
-        )
-        # If failure with clear pattern, consider anti-pattern
-        if not outcome and error_message:
-            self._maybe_create_anti_pattern(
-                agent=agent,
-                project_id=project_id,
-                task=task,
-                strategy=strategy_used,
-                error=error_message,
-            )
-        return outcome_record
-    def _maybe_create_heuristic(
-        self,
-        agent: str,
-        project_id: str,
-        task_type: str,
-        strategy: str,
-        success: bool,
-        scope: Optional[MemoryScope],
-    ):
-        """
-        Create or update a heuristic if we have enough occurrences.
-        Only creates heuristic after min_occurrences similar outcomes.
-        """
-        min_occurrences = 3
-        if scope:
-            min_occurrences = scope.min_occurrences_for_heuristic
-        # Get similar outcomes to check occurrence count
-        similar_outcomes = self.storage.get_outcomes(
-            project_id=project_id,
-            agent=agent,
-            task_type=task_type,
-            top_k=min_occurrences + 1,
-            success_only=False,
-        )
-        # Filter to same strategy
-        same_strategy = [
-            o
-            for o in similar_outcomes
-            if self._strategies_similar(o.strategy_used, strategy)
-        ]
-        if len(same_strategy) >= min_occurrences:
-            success_count = sum(1 for o in same_strategy if o.success)
-            confidence = success_count / len(same_strategy)
-            # Only create heuristic if confidence is meaningful
-            if confidence > 0.5:
-                heuristic = Heuristic(
-                    id=f"heur_{uuid.uuid4().hex[:12]}",
-                    agent=agent,
-                    project_id=project_id,
-                    condition=f"task type: {task_type}",
-                    strategy=strategy,
-                    confidence=confidence,
-                    occurrence_count=len(same_strategy),
-                    success_count=success_count,
-                    last_validated=datetime.now(timezone.utc),
-                    created_at=datetime.now(timezone.utc),
-                )
-                self.storage.save_heuristic(heuristic)
-                logger.info(
-                    f"Created heuristic for {agent}: {strategy[:50]}... "
-                    f"(confidence: {confidence:.0%})"
-                )
-    def _maybe_create_anti_pattern(
-        self,
-        agent: str,
-        project_id: str,
-        task: str,
-        strategy: str,
-        error: str,
-    ):
-        """Create anti-pattern if we see repeated failures with same pattern."""
-        # Check for similar failures
-        similar_failures = self.storage.get_outcomes(
-            project_id=project_id,
-            agent=agent,
-            success_only=False,
-            top_k=10,
-        )
-        # Filter to failures with similar error
-        similar = [
-            o
-            for o in similar_failures
-            if not o.success
-            and o.error_message
-            and self._errors_similar(o.error_message, error)
-        ]
-        if len(similar) >= 2:  # At least 2 similar failures
-            anti_pattern = AntiPattern(
-                id=f"anti_{uuid.uuid4().hex[:12]}",
-                agent=agent,
-                project_id=project_id,
-                pattern=strategy,
-                why_bad=error,
-                better_alternative="[To be determined from successful outcomes]",
-                occurrence_count=len(similar),
-                last_seen=datetime.now(timezone.utc),
-            )
-            self.storage.save_anti_pattern(anti_pattern)
-            logger.info(f"Created anti-pattern for {agent}: {strategy[:50]}...")
-    def add_preference(
-        self,
-        user_id: str,
-        category: str,
-        preference: str,
-        source: str,
-    ) -> UserPreference:
-        """Add a user preference."""
-        pref = UserPreference(
-            id=f"pref_{uuid.uuid4().hex[:12]}",
-            user_id=user_id,
-            category=category,
-            preference=preference,
-            source=source,
-            confidence=1.0 if source == "explicit_instruction" else 0.7,
-            timestamp=datetime.now(timezone.utc),
-        )
-        self.storage.save_user_preference(pref)
-        return pref
-    def add_domain_knowledge(
-        self,
-        agent: str,
-        project_id: str,
-        domain: str,
-        fact: str,
-        source: str,
-    ) -> DomainKnowledge:
-        """Add domain knowledge."""
-        knowledge = DomainKnowledge(
-            id=f"dk_{uuid.uuid4().hex[:12]}",
-            agent=agent,
-            project_id=project_id,
-            domain=domain,
-            fact=fact,
-            source=source,
-            confidence=1.0 if source == "user_stated" else 0.8,
-            last_verified=datetime.now(timezone.utc),
-        )
-        self.storage.save_domain_knowledge(knowledge)
-        return knowledge
-    def forget(
-        self,
-        project_id: str,
-        agent: Optional[str] = None,
-        older_than_days: int = 90,
-        below_confidence: float = 0.3,
-    ) -> int:
-        """
-        Prune stale and low-confidence memories.
-        Returns:
-            Total number of items pruned
-        """
-        cutoff = datetime.now(timezone.utc) - timedelta(days=older_than_days)
-        # Delete old outcomes
-        outcomes_deleted = self.storage.delete_outcomes_older_than(
-            project_id=project_id,
-            older_than=cutoff,
-            agent=agent,
-        )
-        # Delete low-confidence heuristics
-        heuristics_deleted = self.storage.delete_low_confidence_heuristics(
-            project_id=project_id,
-            below_confidence=below_confidence,
-            agent=agent,
-        )
-        total = outcomes_deleted + heuristics_deleted
-        logger.info(
-            f"Forgot {total} items: {outcomes_deleted} outcomes, "
-            f"{heuristics_deleted} heuristics"
-        )
-        return total
-    def _infer_task_type(self, task: str) -> str:
-        """Infer task type from description."""
-        task_lower = task.lower()
-        if "test" in task_lower or "validate" in task_lower:
-            return "testing"
-        elif "api" in task_lower or "endpoint" in task_lower:
-            return "api_testing"
-        elif "form" in task_lower or "input" in task_lower:
-            return "form_testing"
-        elif "database" in task_lower or "query" in task_lower:
-            return "database_validation"
-        return "general"
-    def _strategies_similar(self, s1: str, s2: str) -> bool:
-        """
-        Check if two strategies are similar enough to count together.
-        Uses embedding-based cosine similarity when an embedder is available,
-        otherwise falls back to simple word overlap.
-        """
-        if self.embedder is not None:
-            return self._strategies_similar_embedding(s1, s2)
-        return self._strategies_similar_word_overlap(s1, s2)
-    def _strategies_similar_embedding(self, s1: str, s2: str) -> bool:
-        """Check strategy similarity using embedding cosine similarity."""
-        try:
-            emb1 = self.embedder.encode(s1)
-            emb2 = self.embedder.encode(s2)
-            similarity = self._cosine_similarity(emb1, emb2)
-            return similarity >= self.similarity_threshold
-        except Exception as e:
-            logger.warning(
-                f"Embedding similarity failed, falling back to word overlap: {e}"
-            )
-            return self._strategies_similar_word_overlap(s1, s2)
-    def _strategies_similar_word_overlap(self, s1: str, s2: str) -> bool:
-        """Check strategy similarity using simple word overlap."""
-        words1 = set(s1.lower().split())
-        words2 = set(s2.lower().split())
-        overlap = len(words1 & words2)
-        return overlap >= min(3, len(words1) // 2)
-    def _cosine_similarity(self, v1: list, v2: list) -> float:
-        """Compute cosine similarity between two vectors."""
-        import math
-        dot_product = sum(a * b for a, b in zip(v1, v2, strict=False))
-        norm1 = math.sqrt(sum(a * a for a in v1))
-        norm2 = math.sqrt(sum(b * b for b in v2))
-        if norm1 == 0 or norm2 == 0:
-            return 0.0
-        return dot_product / (norm1 * norm2)
-    def _errors_similar(self, e1: str, e2: str) -> bool:
-        """Check if two errors are similar."""
-        # Simple substring check
-        e1_lower = e1.lower()
-        e2_lower = e2.lower()
-        return e1_lower in e2_lower or e2_lower in e1_lower
+"""
+ALMA Learning Protocols.
+Defines how agents learn from outcomes while respecting scope constraints.
+"""
+import logging
+import uuid
+from datetime import datetime, timedelta, timezone
+from typing import TYPE_CHECKING, Dict, Optional
+from alma.storage.base import StorageBackend
+from alma.types import (
+    AntiPattern,
+    DomainKnowledge,
+    Heuristic,
+    MemoryScope,
+    Outcome,
+    UserPreference,
+)
+if TYPE_CHECKING:
+    from alma.retrieval.embeddings import EmbeddingProvider
+logger = logging.getLogger(__name__)
+class LearningProtocol:
+    """
+    Manages how agents learn from task outcomes.
+    Key principles:
+    - Validate scope before any learning
+    - Require minimum occurrences before creating heuristics
+    - Support forgetting to prevent memory bloat
+    """
+    def __init__(
+        self,
+        storage: StorageBackend,
+        scopes: Dict[str, MemoryScope],
+        embedder: Optional["EmbeddingProvider"] = None,
+        similarity_threshold: float = 0.75,
+    ):
+        """
+        Initialize learning protocol.
+        Args:
+            storage: Storage backend for persistence
+            scopes: Dict of agent_name -> MemoryScope
+            embedder: Optional embedding provider for semantic similarity
+            similarity_threshold: Cosine similarity threshold for strategy matching (default 0.75)
+        """
+        self.storage = storage
+        self.scopes = scopes
+        self.embedder = embedder
+        self.similarity_threshold = similarity_threshold
+    def learn(
+        self,
+        agent: str,
+        project_id: str,
+        task: str,
+        outcome: bool,
+        strategy_used: str,
+        task_type: Optional[str] = None,
+        duration_ms: Optional[int] = None,
+        error_message: Optional[str] = None,
+        feedback: Optional[str] = None,
+    ) -> Outcome:
+        """
+        Learn from a task outcome.
+        Creates an Outcome record and potentially updates/creates heuristics.
+        Args:
+            agent: Agent that executed the task
+            project_id: Project context
+            task: Task description
+            outcome: True if successful, False if failed
+            strategy_used: The approach taken
+            task_type: Category for grouping
+            duration_ms: Execution time
+            error_message: Error details if failed
+            feedback: User feedback
+        Returns:
+            The created Outcome record
+        """
+        # Validate agent has a scope (warn but don't block)
+        scope = self.scopes.get(agent)
+        if scope is None:
+            logger.warning(f"Agent '{agent}' has no defined scope")
+        # Create outcome record
+        outcome_record = Outcome(
+            id=f"out_{uuid.uuid4().hex[:12]}",
+            agent=agent,
+            project_id=project_id,
+            task_type=task_type or self._infer_task_type(task),
+            task_description=task,
+            success=outcome,
+            strategy_used=strategy_used,
+            duration_ms=duration_ms,
+            error_message=error_message,
+            user_feedback=feedback,
+            timestamp=datetime.now(timezone.utc),
+        )
+        # Save outcome
+        self.storage.save_outcome(outcome_record)
+        logger.info(
+            f"Recorded outcome for {agent}: {'success' if outcome else 'failure'}"
+        )
+        # Check if we should create/update a heuristic
+        self._maybe_create_heuristic(
+            agent=agent,
+            project_id=project_id,
+            task_type=outcome_record.task_type,
+            strategy=strategy_used,
+            success=outcome,
+            scope=scope,
+        )
+        # If failure with clear pattern, consider anti-pattern
+        if not outcome and error_message:
+            self._maybe_create_anti_pattern(
+                agent=agent,
+                project_id=project_id,
+                task=task,
+                strategy=strategy_used,
+                error=error_message,
+            )
+        return outcome_record
+    def _maybe_create_heuristic(
+        self,
+        agent: str,
+        project_id: str,
+        task_type: str,
+        strategy: str,
+        success: bool,
+        scope: Optional[MemoryScope],
+    ):
+        """
+        Create or update a heuristic if we have enough occurrences.
+        Only creates heuristic after min_occurrences similar outcomes.
+        """
+        min_occurrences = 3
+        if scope:
+            min_occurrences = scope.min_occurrences_for_heuristic
+        # Get similar outcomes to check occurrence count
+        similar_outcomes = self.storage.get_outcomes(
+            project_id=project_id,
+            agent=agent,
+            task_type=task_type,
+            top_k=min_occurrences + 1,
+            success_only=False,
+        )
+        # Filter to same strategy
+        same_strategy = [
+            o
+            for o in similar_outcomes
+            if self._strategies_similar(o.strategy_used, strategy)
+        ]
+        if len(same_strategy) >= min_occurrences:
+            success_count = sum(1 for o in same_strategy if o.success)
+            confidence = success_count / len(same_strategy)
+            # Only create heuristic if confidence is meaningful
+            if confidence > 0.5:
+                heuristic = Heuristic(
+                    id=f"heur_{uuid.uuid4().hex[:12]}",
+                    agent=agent,
+                    project_id=project_id,
+                    condition=f"task type: {task_type}",
+                    strategy=strategy,
+                    confidence=confidence,
+                    occurrence_count=len(same_strategy),
+                    success_count=success_count,
+                    last_validated=datetime.now(timezone.utc),
+                    created_at=datetime.now(timezone.utc),
+                )
+                self.storage.save_heuristic(heuristic)
+                logger.info(
+                    f"Created heuristic for {agent}: {strategy[:50]}... "
+                    f"(confidence: {confidence:.0%})"
+                )
+    def _maybe_create_anti_pattern(
+        self,
+        agent: str,
+        project_id: str,
+        task: str,
+        strategy: str,
+        error: str,
+    ):
+        """Create anti-pattern if we see repeated failures with same pattern."""
+        # Check for similar failures
+        similar_failures = self.storage.get_outcomes(
+            project_id=project_id,
+            agent=agent,
+            success_only=False,
+            top_k=10,
+        )
+        # Filter to failures with similar error
+        similar = [
+            o
+            for o in similar_failures
+            if not o.success
+            and o.error_message
+            and self._errors_similar(o.error_message, error)
+        ]
+        if len(similar) >= 2:  # At least 2 similar failures
+            anti_pattern = AntiPattern(
+                id=f"anti_{uuid.uuid4().hex[:12]}",
+                agent=agent,
+                project_id=project_id,
+                pattern=strategy,
+                why_bad=error,
+                better_alternative="[To be determined from successful outcomes]",
+                occurrence_count=len(similar),
+                last_seen=datetime.now(timezone.utc),
+            )
+            self.storage.save_anti_pattern(anti_pattern)
+            logger.info(f"Created anti-pattern for {agent}: {strategy[:50]}...")
+    def add_preference(
+        self,
+        user_id: str,
+        category: str,
+        preference: str,
+        source: str,
+    ) -> UserPreference:
+        """Add a user preference."""
+        pref = UserPreference(
+            id=f"pref_{uuid.uuid4().hex[:12]}",
+            user_id=user_id,
+            category=category,
+            preference=preference,
+            source=source,
+            confidence=1.0 if source == "explicit_instruction" else 0.7,
+            timestamp=datetime.now(timezone.utc),
+        )
+        self.storage.save_user_preference(pref)
+        return pref
+    def add_domain_knowledge(
+        self,
+        agent: str,
+        project_id: str,
+        domain: str,
+        fact: str,
+        source: str,
+    ) -> DomainKnowledge:
+        """Add domain knowledge."""
+        knowledge = DomainKnowledge(
+            id=f"dk_{uuid.uuid4().hex[:12]}",
+            agent=agent,
+            project_id=project_id,
+            domain=domain,
+            fact=fact,
+            source=source,
+            confidence=1.0 if source == "user_stated" else 0.8,
+            last_verified=datetime.now(timezone.utc),
+        )
+        self.storage.save_domain_knowledge(knowledge)
+        return knowledge
+    def forget(
+        self,
+        project_id: str,
+        agent: Optional[str] = None,
+        older_than_days: int = 90,
+        below_confidence: float = 0.3,
+    ) -> int:
+        """
+        Prune stale and low-confidence memories.
+        Returns:
+            Total number of items pruned
+        """
+        cutoff = datetime.now(timezone.utc) - timedelta(days=older_than_days)
+        # Delete old outcomes
+        outcomes_deleted = self.storage.delete_outcomes_older_than(
+            project_id=project_id,
+            older_than=cutoff,
+            agent=agent,
+        )
+        # Delete low-confidence heuristics
+        heuristics_deleted = self.storage.delete_low_confidence_heuristics(
+            project_id=project_id,
+            below_confidence=below_confidence,
+            agent=agent,
+        )
+        total = outcomes_deleted + heuristics_deleted
+        logger.info(
+            f"Forgot {total} items: {outcomes_deleted} outcomes, "
+            f"{heuristics_deleted} heuristics"
+        )
+        return total
+    def _infer_task_type(self, task: str) -> str:
+        """Infer task type from description."""
+        task_lower = task.lower()
+        if "test" in task_lower or "validate" in task_lower:
+            return "testing"
+        elif "api" in task_lower or "endpoint" in task_lower:
+            return "api_testing"
+        elif "form" in task_lower or "input" in task_lower:
+            return "form_testing"
+        elif "database" in task_lower or "query" in task_lower:
+            return "database_validation"
+        return "general"
+    def _strategies_similar(self, s1: str, s2: str) -> bool:
+        """
+        Check if two strategies are similar enough to count together.
+        Uses embedding-based cosine similarity when an embedder is available,
+        otherwise falls back to simple word overlap.
+        """
+        if self.embedder is not None:
+            return self._strategies_similar_embedding(s1, s2)
+        return self._strategies_similar_word_overlap(s1, s2)
+    def _strategies_similar_embedding(self, s1: str, s2: str) -> bool:
+        """Check strategy similarity using embedding cosine similarity."""
+        try:
+            emb1 = self.embedder.encode(s1)
+            emb2 = self.embedder.encode(s2)
+            similarity = self._cosine_similarity(emb1, emb2)
+            return similarity >= self.similarity_threshold
+        except Exception as e:
+            logger.warning(
+                f"Embedding similarity failed, falling back to word overlap: {e}"
+            )
+            return self._strategies_similar_word_overlap(s1, s2)
+    def _strategies_similar_word_overlap(self, s1: str, s2: str) -> bool:
+        """Check strategy similarity using simple word overlap."""
+        words1 = set(s1.lower().split())
+        words2 = set(s2.lower().split())
+        overlap = len(words1 & words2)
+        return overlap >= min(3, len(words1) // 2)
+    def _cosine_similarity(self, v1: list, v2: list) -> float:
+        """Compute cosine similarity between two vectors."""
+        import math
+        dot_product = sum(a * b for a, b in zip(v1, v2, strict=False))
+        norm1 = math.sqrt(sum(a * a for a in v1))
+        norm2 = math.sqrt(sum(b * b for b in v2))
+        if norm1 == 0 or norm2 == 0:
+            return 0.0
+        return dot_product / (norm1 * norm2)
+    def _errors_similar(self, e1: str, e2: str) -> bool:
+        """Check if two errors are similar."""
+        # Simple substring check
+        e1_lower = e1.lower()
+        e2_lower = e2.lower()
+        return e1_lower in e2_lower or e2_lower in e1_lower

alma-memory 0.5.1__py3-none-any.whl → 0.7.0__py3-none-any.whl

alma-memory 0.5.1__py3-none-any.whl → 0.7.0__py3-none-any.whl