PyPI - alma-memory - Versions diffs - 0.5.1__py3-none-any.whl → 0.7.0__py3-none-any.whl - Mend

alma-memory 0.5.1__py3-none-any.whl → 0.7.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (111)

alma/__init__.py +296 -226
alma/compression/__init__.py +33 -0
alma/compression/pipeline.py +980 -0
alma/confidence/__init__.py +47 -47
alma/confidence/engine.py +540 -540
alma/confidence/types.py +351 -351
alma/config/loader.py +157 -157
alma/consolidation/__init__.py +23 -23
alma/consolidation/engine.py +678 -678
alma/consolidation/prompts.py +84 -84
alma/core.py +1189 -430
alma/domains/__init__.py +30 -30
alma/domains/factory.py +359 -359
alma/domains/schemas.py +448 -448
alma/domains/types.py +272 -272
alma/events/__init__.py +75 -75
alma/events/emitter.py +285 -284
alma/events/storage_mixin.py +246 -246
alma/events/types.py +126 -126
alma/events/webhook.py +425 -425
alma/exceptions.py +49 -49
alma/extraction/__init__.py +31 -31
alma/extraction/auto_learner.py +265 -265
alma/extraction/extractor.py +420 -420
alma/graph/__init__.py +106 -106
alma/graph/backends/__init__.py +32 -32
alma/graph/backends/kuzu.py +624 -624
alma/graph/backends/memgraph.py +432 -432
alma/graph/backends/memory.py +236 -236
alma/graph/backends/neo4j.py +417 -417
alma/graph/base.py +159 -159
alma/graph/extraction.py +198 -198
alma/graph/store.py +860 -860
alma/harness/__init__.py +35 -35
alma/harness/base.py +386 -386
alma/harness/domains.py +705 -705
alma/initializer/__init__.py +37 -37
alma/initializer/initializer.py +418 -418
alma/initializer/types.py +250 -250
alma/integration/__init__.py +62 -62
alma/integration/claude_agents.py +444 -444
alma/integration/helena.py +423 -423
alma/integration/victor.py +471 -471
alma/learning/__init__.py +101 -86
alma/learning/decay.py +878 -0
alma/learning/forgetting.py +1446 -1446
alma/learning/heuristic_extractor.py +390 -390
alma/learning/protocols.py +374 -374
alma/learning/validation.py +346 -346
alma/mcp/__init__.py +123 -45
alma/mcp/__main__.py +156 -156
alma/mcp/resources.py +122 -122
alma/mcp/server.py +955 -591
alma/mcp/tools.py +3254 -509
alma/observability/__init__.py +91 -84
alma/observability/config.py +302 -302
alma/observability/guidelines.py +170 -0
alma/observability/logging.py +424 -424
alma/observability/metrics.py +583 -583
alma/observability/tracing.py +440 -440
alma/progress/__init__.py +21 -21
alma/progress/tracker.py +607 -607
alma/progress/types.py +250 -250
alma/retrieval/__init__.py +134 -53
alma/retrieval/budget.py +525 -0
alma/retrieval/cache.py +1304 -1061
alma/retrieval/embeddings.py +202 -202
alma/retrieval/engine.py +850 -427
alma/retrieval/modes.py +365 -0
alma/retrieval/progressive.py +560 -0
alma/retrieval/scoring.py +344 -344
alma/retrieval/trust_scoring.py +637 -0
alma/retrieval/verification.py +797 -0
alma/session/__init__.py +19 -19
alma/session/manager.py +442 -399
alma/session/types.py +288 -288
alma/storage/__init__.py +101 -90
alma/storage/archive.py +233 -0
alma/storage/azure_cosmos.py +1259 -1259
alma/storage/base.py +1083 -583
alma/storage/chroma.py +1443 -1443
alma/storage/constants.py +103 -103
alma/storage/file_based.py +614 -614
alma/storage/migrations/__init__.py +21 -21
alma/storage/migrations/base.py +321 -321
alma/storage/migrations/runner.py +323 -323
alma/storage/migrations/version_stores.py +337 -337
alma/storage/migrations/versions/__init__.py +11 -11
alma/storage/migrations/versions/v1_0_0.py +373 -373
alma/storage/migrations/versions/v1_1_0_workflow_context.py +551 -0
alma/storage/pinecone.py +1080 -1080
alma/storage/postgresql.py +1948 -1559
alma/storage/qdrant.py +1306 -1306
alma/storage/sqlite_local.py +3041 -1457
alma/testing/__init__.py +46 -46
alma/testing/factories.py +301 -301
alma/testing/mocks.py +389 -389
alma/types.py +292 -264
alma/utils/__init__.py +19 -0
alma/utils/tokenizer.py +521 -0
alma/workflow/__init__.py +83 -0
alma/workflow/artifacts.py +170 -0
alma/workflow/checkpoint.py +311 -0
alma/workflow/context.py +228 -0
alma/workflow/outcomes.py +189 -0
alma/workflow/reducers.py +393 -0
{alma_memory-0.5.1.dist-info → alma_memory-0.7.0.dist-info}/METADATA +210 -72
alma_memory-0.7.0.dist-info/RECORD +112 -0
alma_memory-0.5.1.dist-info/RECORD +0 -93
{alma_memory-0.5.1.dist-info → alma_memory-0.7.0.dist-info}/WHEEL +0 -0
{alma_memory-0.5.1.dist-info → alma_memory-0.7.0.dist-info}/top_level.txt +0 -0

alma/types.py CHANGED

@@ -1,264 +1,292 @@
-"""
-ALMA Memory Types
-Defines the core data structures for all memory types.
-"""
-from dataclasses import dataclass, field
-from datetime import datetime, timezone
-from enum import Enum
-from typing import Any, Dict, List, Optional
-class MemoryType(Enum):
-    """Categories of memory that agents can store and retrieve."""
-    HEURISTIC = "heuristic"
-    OUTCOME = "outcome"
-    USER_PREFERENCE = "user_preference"
-    DOMAIN_KNOWLEDGE = "domain_knowledge"
-    ANTI_PATTERN = "anti_pattern"
-@dataclass
-class MemoryScope:
-    """
-    Defines what an agent is allowed to learn and share.
-    Prevents scope creep by explicitly listing allowed and forbidden domains.
-    Supports multi-agent memory sharing through share_with and inherit_from.
-    """
-    agent_name: str
-    can_learn: List[str]
-    cannot_learn: List[str]
-    share_with: List[str] = field(
-        default_factory=list
-    )  # Agents that can read this agent's memories
-    inherit_from: List[str] = field(
-        default_factory=list
-    )  # Agents whose memories this agent can read
-    min_occurrences_for_heuristic: int = 3
-    def is_allowed(self, domain: str) -> bool:
-        """Check if learning in this domain is permitted."""
-        if domain in self.cannot_learn:
-            return False
-        if not self.can_learn:  # Empty means all allowed (except cannot_learn)
-            return True
-        return domain in self.can_learn
-    def get_readable_agents(self) -> List[str]:
-        """
-        Get list of agents whose memories this agent can read.
-        Returns:
-            List containing this agent's name plus all inherited agents.
-        """
-        return [self.agent_name] + list(self.inherit_from)
-    def can_read_from(self, other_agent: str) -> bool:
-        """
-        Check if this agent can read memories from another agent.
-        Args:
-            other_agent: Name of the agent to check
-        Returns:
-            True if this agent can read from other_agent
-        """
-        return other_agent == self.agent_name or other_agent in self.inherit_from
-    def shares_with(self, other_agent: str) -> bool:
-        """
-        Check if this agent shares memories with another agent.
-        Args:
-            other_agent: Name of the agent to check
-        Returns:
-            True if this agent shares with other_agent
-        """
-        return other_agent in self.share_with
-@dataclass
-class Heuristic:
-    """
-    A learned rule: "When condition X, strategy Y works N% of the time."
-    Heuristics are only created after min_occurrences validations.
-    """
-    id: str
-    agent: str
-    project_id: str
-    condition: str  # "form with multiple required fields"
-    strategy: str  # "test happy path first, then individual validation"
-    confidence: float  # 0.0 to 1.0
-    occurrence_count: int
-    success_count: int
-    last_validated: datetime
-    created_at: datetime
-    embedding: Optional[List[float]] = None
-    metadata: Dict[str, Any] = field(default_factory=dict)
-    @property
-    def success_rate(self) -> float:
-        """Calculate success rate from occurrences."""
-        if self.occurrence_count == 0:
-            return 0.0
-        return self.success_count / self.occurrence_count
-@dataclass
-class Outcome:
-    """
-    Record of a task execution - success or failure with context.
-    Outcomes are raw data that can be consolidated into heuristics.
-    """
-    id: str
-    agent: str
-    project_id: str
-    task_type: str  # "api_validation", "form_testing", etc.
-    task_description: str
-    success: bool
-    strategy_used: str
-    duration_ms: Optional[int] = None
-    error_message: Optional[str] = None
-    user_feedback: Optional[str] = None
-    timestamp: datetime = field(default_factory=lambda: datetime.now(timezone.utc))
-    embedding: Optional[List[float]] = None
-    metadata: Dict[str, Any] = field(default_factory=dict)
-@dataclass
-class UserPreference:
-    """
-    A remembered user constraint or communication preference.
-    Persists across sessions so users don't repeat themselves.
-    """
-    id: str
-    user_id: str
-    category: str  # "communication", "code_style", "workflow"
-    preference: str  # "No emojis in documentation"
-    source: str  # "explicit_instruction", "inferred_from_correction"
-    confidence: float = 1.0  # Lower for inferred preferences
-    timestamp: datetime = field(default_factory=lambda: datetime.now(timezone.utc))
-    metadata: Dict[str, Any] = field(default_factory=dict)
-@dataclass
-class DomainKnowledge:
-    """
-    Accumulated domain-specific facts within agent's scope.
-    Different from heuristics - these are facts, not strategies.
-    """
-    id: str
-    agent: str
-    project_id: str
-    domain: str  # "authentication", "database_schema", etc.
-    fact: str  # "Login endpoint uses JWT with 24h expiry"
-    source: str  # "code_analysis", "documentation", "user_stated"
-    confidence: float = 1.0
-    last_verified: datetime = field(default_factory=lambda: datetime.now(timezone.utc))
-    embedding: Optional[List[float]] = None
-    metadata: Dict[str, Any] = field(default_factory=dict)
-@dataclass
-class AntiPattern:
-    """
-    What NOT to do - learned from validated failures.
-    Helps agents avoid repeating mistakes.
-    """
-    id: str
-    agent: str
-    project_id: str
-    pattern: str  # "Using fixed sleep() for async waits"
-    why_bad: str  # "Causes flaky tests, doesn't adapt to load"
-    better_alternative: str  # "Use explicit waits with conditions"
-    occurrence_count: int
-    last_seen: datetime
-    created_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc))
-    embedding: Optional[List[float]] = None
-    metadata: Dict[str, Any] = field(default_factory=dict)
-@dataclass
-class MemorySlice:
-    """
-    A compact, relevant subset of memories for injection into context.
-    This is what gets injected per-call - must stay under token budget.
-    """
-    heuristics: List[Heuristic] = field(default_factory=list)
-    outcomes: List[Outcome] = field(default_factory=list)
-    preferences: List[UserPreference] = field(default_factory=list)
-    domain_knowledge: List[DomainKnowledge] = field(default_factory=list)
-    anti_patterns: List[AntiPattern] = field(default_factory=list)
-    # Retrieval metadata
-    query: Optional[str] = None
-    agent: Optional[str] = None
-    retrieval_time_ms: Optional[int] = None
-    def to_prompt(self, max_tokens: int = 2000) -> str:
-        """
-        Format memories for injection into agent context.
-        Respects token budget by prioritizing high-confidence items.
-        """
-        sections = []
-        if self.heuristics:
-            h_text = "## Relevant Strategies\n"
-            for h in sorted(self.heuristics, key=lambda x: -x.confidence)[:5]:
-                h_text += f"- When: {h.condition}\n  Do: {h.strategy} (confidence: {h.confidence:.0%})\n"
-            sections.append(h_text)
-        if self.anti_patterns:
-            ap_text = "## Avoid These Patterns\n"
-            for ap in self.anti_patterns[:3]:
-                ap_text += f"- Don't: {ap.pattern}\n  Why: {ap.why_bad}\n  Instead: {ap.better_alternative}\n"
-            sections.append(ap_text)
-        if self.preferences:
-            p_text = "## User Preferences\n"
-            for p in self.preferences[:5]:
-                p_text += f"- {p.preference}\n"
-            sections.append(p_text)
-        if self.domain_knowledge:
-            dk_text = "## Domain Context\n"
-            for dk in self.domain_knowledge[:5]:
-                dk_text += f"- {dk.fact}\n"
-            sections.append(dk_text)
-        result = "\n".join(sections)
-        # Basic token estimation (rough: 1 token ~ 4 chars)
-        if len(result) > max_tokens * 4:
-            result = result[: max_tokens * 4] + "\n[truncated]"
-        return result
-    @property
-    def total_items(self) -> int:
-        """Total number of memory items in this slice."""
-        return (
-            len(self.heuristics)
-            + len(self.outcomes)
-            + len(self.preferences)
-            + len(self.domain_knowledge)
-            + len(self.anti_patterns)
-        )
+"""
+ALMA Memory Types
+Defines the core data structures for all memory types.
+"""
+from dataclasses import dataclass, field
+from datetime import datetime, timezone
+from enum import Enum
+from typing import TYPE_CHECKING, Any, Dict, List, Optional
+if TYPE_CHECKING:
+    from alma.workflow.outcomes import WorkflowOutcome
+class MemoryType(Enum):
+    """Categories of memory that agents can store and retrieve."""
+    HEURISTIC = "heuristic"
+    OUTCOME = "outcome"
+    USER_PREFERENCE = "user_preference"
+    DOMAIN_KNOWLEDGE = "domain_knowledge"
+    ANTI_PATTERN = "anti_pattern"
+@dataclass
+class MemoryScope:
+    """
+    Defines what an agent is allowed to learn and share.
+    Prevents scope creep by explicitly listing allowed and forbidden domains.
+    Supports multi-agent memory sharing through share_with and inherit_from.
+    """
+    agent_name: str
+    can_learn: List[str]
+    cannot_learn: List[str]
+    share_with: List[str] = field(
+        default_factory=list
+    )  # Agents that can read this agent's memories
+    inherit_from: List[str] = field(
+        default_factory=list
+    )  # Agents whose memories this agent can read
+    min_occurrences_for_heuristic: int = 3
+    def is_allowed(self, domain: str) -> bool:
+        """Check if learning in this domain is permitted."""
+        if domain in self.cannot_learn:
+            return False
+        if not self.can_learn:  # Empty means all allowed (except cannot_learn)
+            return True
+        return domain in self.can_learn
+    def get_readable_agents(self) -> List[str]:
+        """
+        Get list of agents whose memories this agent can read.
+        Returns:
+            List containing this agent's name plus all inherited agents.
+        """
+        return [self.agent_name] + list(self.inherit_from)
+    def can_read_from(self, other_agent: str) -> bool:
+        """
+        Check if this agent can read memories from another agent.
+        Args:
+            other_agent: Name of the agent to check
+        Returns:
+            True if this agent can read from other_agent
+        """
+        return other_agent == self.agent_name or other_agent in self.inherit_from
+    def shares_with(self, other_agent: str) -> bool:
+        """
+        Check if this agent shares memories with another agent.
+        Args:
+            other_agent: Name of the agent to check
+        Returns:
+            True if this agent shares with other_agent
+        """
+        return other_agent in self.share_with
+@dataclass
+class Heuristic:
+    """
+    A learned rule: "When condition X, strategy Y works N% of the time."
+    Heuristics are only created after min_occurrences validations.
+    """
+    id: str
+    agent: str
+    project_id: str
+    condition: str  # "form with multiple required fields"
+    strategy: str  # "test happy path first, then individual validation"
+    confidence: float  # 0.0 to 1.0
+    occurrence_count: int
+    success_count: int
+    last_validated: datetime
+    created_at: datetime
+    embedding: Optional[List[float]] = None
+    metadata: Dict[str, Any] = field(default_factory=dict)
+    @property
+    def success_rate(self) -> float:
+        """Calculate success rate from occurrences."""
+        if self.occurrence_count == 0:
+            return 0.0
+        return self.success_count / self.occurrence_count
+@dataclass
+class Outcome:
+    """
+    Record of a task execution - success or failure with context.
+    Outcomes are raw data that can be consolidated into heuristics.
+    """
+    id: str
+    agent: str
+    project_id: str
+    task_type: str  # "api_validation", "form_testing", etc.
+    task_description: str
+    success: bool
+    strategy_used: str
+    duration_ms: Optional[int] = None
+    error_message: Optional[str] = None
+    user_feedback: Optional[str] = None
+    timestamp: datetime = field(default_factory=lambda: datetime.now(timezone.utc))
+    embedding: Optional[List[float]] = None
+    metadata: Dict[str, Any] = field(default_factory=dict)
+@dataclass
+class UserPreference:
+    """
+    A remembered user constraint or communication preference.
+    Persists across sessions so users don't repeat themselves.
+    """
+    id: str
+    user_id: str
+    category: str  # "communication", "code_style", "workflow"
+    preference: str  # "No emojis in documentation"
+    source: str  # "explicit_instruction", "inferred_from_correction"
+    confidence: float = 1.0  # Lower for inferred preferences
+    timestamp: datetime = field(default_factory=lambda: datetime.now(timezone.utc))
+    metadata: Dict[str, Any] = field(default_factory=dict)
+@dataclass
+class DomainKnowledge:
+    """
+    Accumulated domain-specific facts within agent's scope.
+    Different from heuristics - these are facts, not strategies.
+    """
+    id: str
+    agent: str
+    project_id: str
+    domain: str  # "authentication", "database_schema", etc.
+    fact: str  # "Login endpoint uses JWT with 24h expiry"
+    source: str  # "code_analysis", "documentation", "user_stated"
+    confidence: float = 1.0
+    last_verified: datetime = field(default_factory=lambda: datetime.now(timezone.utc))
+    embedding: Optional[List[float]] = None
+    metadata: Dict[str, Any] = field(default_factory=dict)
+@dataclass
+class AntiPattern:
+    """
+    What NOT to do - learned from validated failures.
+    Helps agents avoid repeating mistakes.
+    """
+    id: str
+    agent: str
+    project_id: str
+    pattern: str  # "Using fixed sleep() for async waits"
+    why_bad: str  # "Causes flaky tests, doesn't adapt to load"
+    better_alternative: str  # "Use explicit waits with conditions"
+    occurrence_count: int
+    last_seen: datetime
+    created_at: datetime = field(default_factory=lambda: datetime.now(timezone.utc))
+    embedding: Optional[List[float]] = None
+    metadata: Dict[str, Any] = field(default_factory=dict)
+@dataclass
+class MemorySlice:
+    """
+    A compact, relevant subset of memories for injection into context.
+    This is what gets injected per-call - must stay under token budget.
+    """
+    heuristics: List[Heuristic] = field(default_factory=list)
+    outcomes: List[Outcome] = field(default_factory=list)
+    preferences: List[UserPreference] = field(default_factory=list)
+    domain_knowledge: List[DomainKnowledge] = field(default_factory=list)
+    anti_patterns: List[AntiPattern] = field(default_factory=list)
+    # Workflow outcomes (v0.6.0+)
+    workflow_outcomes: List["WorkflowOutcome"] = field(default_factory=list)
+    # Retrieval metadata
+    query: Optional[str] = None
+    agent: Optional[str] = None
+    retrieval_time_ms: Optional[int] = None
+    def to_prompt(
+        self,
+        max_tokens: int = 2000,
+        model: Optional[str] = None,
+    ) -> str:
+        """
+        Format memories for injection into agent context.
+        Respects token budget by prioritizing high-confidence items.
+        Uses accurate token counting via tiktoken when available.
+        Args:
+            max_tokens: Maximum tokens allowed for the output
+            model: Optional model name for accurate tokenization
+                   (e.g., "gpt-4", "claude-3-sonnet"). If not provided,
+                   uses a general-purpose estimation.
+        Returns:
+            Formatted prompt string, truncated if necessary
+        """
+        from alma.utils.tokenizer import TokenEstimator
+        # Initialize token estimator
+        estimator = TokenEstimator(model=model) if model else TokenEstimator()
+        sections = []
+        if self.heuristics:
+            h_text = "## Relevant Strategies\n"
+            for h in sorted(self.heuristics, key=lambda x: -x.confidence)[:5]:
+                h_text += f"- When: {h.condition}\n  Do: {h.strategy} (confidence: {h.confidence:.0%})\n"
+            sections.append(h_text)
+        if self.anti_patterns:
+            ap_text = "## Avoid These Patterns\n"
+            for ap in self.anti_patterns[:3]:
+                ap_text += f"- Don't: {ap.pattern}\n  Why: {ap.why_bad}\n  Instead: {ap.better_alternative}\n"
+            sections.append(ap_text)
+        if self.preferences:
+            p_text = "## User Preferences\n"
+            for p in self.preferences[:5]:
+                p_text += f"- {p.preference}\n"
+            sections.append(p_text)
+        if self.domain_knowledge:
+            dk_text = "## Domain Context\n"
+            for dk in self.domain_knowledge[:5]:
+                dk_text += f"- {dk.fact}\n"
+            sections.append(dk_text)
+        result = "\n".join(sections)
+        # Use accurate token estimation and truncation
+        result = estimator.truncate_to_token_limit(
+            text=result,
+            max_tokens=max_tokens,
+            suffix="\n[truncated]",
+        )
+        return result
+    @property
+    def total_items(self) -> int:
+        """Total number of memory items in this slice."""
+        return (
+            len(self.heuristics)
+            + len(self.outcomes)
+            + len(self.preferences)
+            + len(self.domain_knowledge)
+            + len(self.anti_patterns)
+        )

alma/utils/__init__.py ADDED

@@ -0,0 +1,19 @@
+"""
+ALMA Utility modules.
+Provides shared utilities for token estimation and other common functionality.
+"""
+from alma.utils.tokenizer import (
+    ModelTokenBudget,
+    TokenEstimator,
+    get_default_token_budget,
+    get_token_estimator,
+)
+__all__ = [
+    "TokenEstimator",
+    "ModelTokenBudget",
+    "get_token_estimator",
+    "get_default_token_budget",
+]

alma-memory 0.5.1__py3-none-any.whl → 0.7.0__py3-none-any.whl

alma-memory 0.5.1__py3-none-any.whl → 0.7.0__py3-none-any.whl