PyPI - hot-memory-mcp - Versions diffs - 0.4.0__tar.gz - Mend

hot-memory-mcp 0.4.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (45) hide show

hot_memory_mcp-0.4.0/.dockerignore +43 -0
hot_memory_mcp-0.4.0/.github/workflows/ci.yml +74 -0
hot_memory_mcp-0.4.0/.github/workflows/publish.yml +22 -0
hot_memory_mcp-0.4.0/.gitignore +52 -0
hot_memory_mcp-0.4.0/.pre-commit-config.yaml +30 -0
hot_memory_mcp-0.4.0/ARCHITECTURE.md +337 -0
hot_memory_mcp-0.4.0/CHANGELOG.md +159 -0
hot_memory_mcp-0.4.0/CLAUDE.md +131 -0
hot_memory_mcp-0.4.0/CONTRIBUTING.md +188 -0
hot_memory_mcp-0.4.0/Dockerfile +26 -0
hot_memory_mcp-0.4.0/LICENSE +21 -0
hot_memory_mcp-0.4.0/PKG-INFO +654 -0
hot_memory_mcp-0.4.0/README.md +623 -0
hot_memory_mcp-0.4.0/docs/API.md +813 -0
hot_memory_mcp-0.4.0/docs/examples/cross-session-continuity.md +123 -0
hot_memory_mcp-0.4.0/docs/examples/pattern-mining.md +144 -0
hot_memory_mcp-0.4.0/docs/examples/project-onboarding.md +94 -0
hot_memory_mcp-0.4.0/hooks/memory-log-response.sh +70 -0
hot_memory_mcp-0.4.0/pyproject.toml +67 -0
hot_memory_mcp-0.4.0/src/memory_mcp/__init__.py +3 -0
hot_memory_mcp-0.4.0/src/memory_mcp/cli.py +613 -0
hot_memory_mcp-0.4.0/src/memory_mcp/config.py +364 -0
hot_memory_mcp-0.4.0/src/memory_mcp/embeddings.py +570 -0
hot_memory_mcp-0.4.0/src/memory_mcp/helpers.py +613 -0
hot_memory_mcp-0.4.0/src/memory_mcp/logging.py +236 -0
hot_memory_mcp-0.4.0/src/memory_mcp/metrics.py +30 -0
hot_memory_mcp-0.4.0/src/memory_mcp/migrations.py +447 -0
hot_memory_mcp-0.4.0/src/memory_mcp/mining.py +278 -0
hot_memory_mcp-0.4.0/src/memory_mcp/models.py +358 -0
hot_memory_mcp-0.4.0/src/memory_mcp/project.py +200 -0
hot_memory_mcp-0.4.0/src/memory_mcp/responses.py +377 -0
hot_memory_mcp-0.4.0/src/memory_mcp/server.py +2215 -0
hot_memory_mcp-0.4.0/src/memory_mcp/storage.py +4427 -0
hot_memory_mcp-0.4.0/src/memory_mcp/text_parsing.py +39 -0
hot_memory_mcp-0.4.0/tests/__init__.py +0 -0
hot_memory_mcp-0.4.0/tests/conftest.py +76 -0
hot_memory_mcp-0.4.0/tests/test_bug_regressions.py +1104 -0
hot_memory_mcp-0.4.0/tests/test_cli.py +234 -0
hot_memory_mcp-0.4.0/tests/test_clustering.py +294 -0
hot_memory_mcp-0.4.0/tests/test_embeddings.py +496 -0
hot_memory_mcp-0.4.0/tests/test_mining.py +461 -0
hot_memory_mcp-0.4.0/tests/test_project.py +376 -0
hot_memory_mcp-0.4.0/tests/test_server.py +855 -0
hot_memory_mcp-0.4.0/tests/test_storage.py +2733 -0
hot_memory_mcp-0.4.0/uv.lock +3327 -0

hot_memory_mcp-0.4.0/.dockerignore ADDED Viewed

@@ -0,0 +1,43 @@
+# Git
+.git/
+.gitignore
+# Python
+__pycache__/
+*.py[cod]
+*$py.class
+*.so
+.Python
+*.egg-info/
+*.egg
+dist/
+build/
+# Virtual environments
+.venv/
+venv/
+ENV/
+# IDE
+.idea/
+.vscode/
+*.swp
+*.swo
+# Testing
+.pytest_cache/
+.coverage
+htmlcov/
+.tox/
+.nox/
+tests/
+# Project-specific
+.beads/
+.claude/
+*.db
+*.pdf
+# Cache
+.mypy_cache/
+.ruff_cache/

hot_memory_mcp-0.4.0/.github/workflows/ci.yml ADDED Viewed

@@ -0,0 +1,74 @@
+name: CI
+on:
+  push:
+    branches: [main]
+  pull_request:
+    branches: [main]
+jobs:
+  lint:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+      - name: Install uv
+        uses: astral-sh/setup-uv@v5
+        with:
+          version: "latest"
+      - name: Set up Python
+        run: uv python install 3.11
+      - name: Install dependencies
+        run: uv sync --group dev
+      - name: Run ruff linter
+        run: uv run ruff check src/ tests/
+      - name: Run ruff formatter check
+        run: uv run ruff format --check src/ tests/
+  test:
+    runs-on: ubuntu-latest
+    strategy:
+      matrix:
+        python-version: ["3.10", "3.11", "3.12"]
+    steps:
+      - uses: actions/checkout@v4
+      - name: Install uv
+        uses: astral-sh/setup-uv@v5
+        with:
+          version: "latest"
+      - name: Set up Python
+        env:
+          PYTHON_VERSION: ${{ matrix.python-version }}
+        run: uv python install "$PYTHON_VERSION"
+      - name: Install dependencies
+        run: uv sync --group dev
+      - name: Run tests
+        run: uv run pytest -v --tb=short
+  pre-commit:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+      - name: Install uv
+        uses: astral-sh/setup-uv@v5
+        with:
+          version: "latest"
+      - name: Set up Python
+        run: uv python install 3.11
+      - name: Install pre-commit
+        run: uv tool install pre-commit
+      - name: Run pre-commit
+        run: uvx pre-commit run --all-files

hot_memory_mcp-0.4.0/.github/workflows/publish.yml ADDED Viewed

@@ -0,0 +1,22 @@
+name: Publish to PyPI
+on:
+  release:
+    types: [published]
+jobs:
+  publish:
+    runs-on: ubuntu-latest
+    permissions:
+      id-token: write  # Required for trusted publishing
+    steps:
+      - uses: actions/checkout@v4
+      - name: Install uv
+        uses: astral-sh/setup-uv@v4
+      - name: Build package
+        run: uv build
+      - name: Publish to PyPI
+        uses: pypa/gh-action-pypi-publish@release/v1

hot_memory_mcp-0.4.0/.gitignore ADDED Viewed

@@ -0,0 +1,52 @@
+# Python
+__pycache__/
+*.py[cod]
+*$py.class
+*.so
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+# Virtual environments
+.venv/
+venv/
+ENV/
+# IDE
+.idea/
+.vscode/
+*.swp
+*.swo
+# Testing
+.pytest_cache/
+.coverage
+htmlcov/
+.tox/
+.nox/
+# Database
+*.db
+# OS
+.DS_Store
+Thumbs.db
+# Project-specific
+.beads/
+# Claude local settings
+.claude/settings.local.json

hot_memory_mcp-0.4.0/.pre-commit-config.yaml ADDED Viewed

@@ -0,0 +1,30 @@
+repos:
+  - repo: https://github.com/pre-commit/pre-commit-hooks
+    rev: v5.0.0
+    hooks:
+      - id: trailing-whitespace
+      - id: end-of-file-fixer
+      - id: check-yaml
+      - id: check-added-large-files
+        args: ['--maxkb=500']
+      - id: check-merge-conflict
+      - id: debug-statements
+  - repo: https://github.com/astral-sh/ruff-pre-commit
+    rev: v0.8.6
+    hooks:
+      # Linter
+      - id: ruff
+        args: [--fix, --exit-non-zero-on-fix]
+      # Formatter (replaces black)
+      - id: ruff-format
+  - repo: https://github.com/pre-commit/mirrors-mypy
+    rev: v1.14.1
+    hooks:
+      - id: mypy
+        additional_dependencies:
+          - pydantic>=2.0
+          - pydantic-settings>=2.0
+        args: [--ignore-missing-imports, --no-strict-optional]
+        files: ^src/

hot_memory_mcp-0.4.0/ARCHITECTURE.md ADDED Viewed

@@ -0,0 +1,337 @@
+# Memory MCP Architecture
+This document describes the design decisions, architecture patterns, and rationale behind Memory MCP.
+## Core Design Principle
+**The Engram Insight**: Frequently-used patterns should be instantly available, not searched for every time.
+This principle drives every architectural decision. We optimize for the common case where a small set of project knowledge is accessed repeatedly.
+## Two-Tier Memory Architecture
+```
+┌─────────────────────────────────────────────────────────────┐
+│                      Claude / LLM                            │
+└─────────────────────────────────────────────────────────────┘
+        │                                    │
+        ▼ (auto-injected)                    ▼ (tool call)
+┌───────────────────┐              ┌────────────────────────┐
+│    Hot Cache      │              │    Cold Storage        │
+│  MCP Resource     │              │    Vector Database     │
+│                   │              │                        │
+│  - 20 items max   │◄────────────►│  - Unlimited capacity  │
+│  - Instant recall │  promotion   │  - Semantic search     │
+│  - Pinnable       │  / demotion  │  - ~50ms lookup        │
+└───────────────────┘              └────────────────────────┘
+        ▲                                    ▲
+        │                                    │
+        └──────────── Mining Pipeline ───────┘
+```
+### Why Two Tiers?
+| Problem | Solution |
+|---------|----------|
+| Tool calls add latency | Hot cache injected via MCP resource (0ms) |
+| Large context wastes tokens | Only 20 high-value items in hot cache |
+| Manual memory management is tedious | Automatic promotion/demotion based on access |
+### Hot Cache
+- **Implementation**: MCP resource at `memory://hot-cache`
+- **Capacity**: 20 items (configurable via `HOT_CACHE_MAX_ITEMS`)
+- **Eviction**: When the cache is full, the lowest-scored unpinned item is evicted; the score combines access count and recency (see the scoring formula below)
+- **Pinning**: Items can be pinned to prevent eviction
+**Scoring Formula**:
+```
+hot_score = (access_weight × access_count) + (recency_weight × recency_boost)
+recency_boost = 0.5^(days_since_access / halflife_days)
+```
+### Cold Storage
+- **Implementation**: SQLite with sqlite-vec extension
+- **Vector Dimension**: 384 (all-MiniLM-L6-v2 default)
+- **Search**: Cosine similarity with composite ranking
+**Ranking Formula**:
+```
+composite_score = (similarity_weight × similarity) +
+                  (recency_weight × recency_score) +
+                  (access_weight × normalized_access)
+```
+## Data Flow
+```mermaid
+graph TB
+    subgraph Input["Input Layer"]
+        direction LR
+        R[remember tool]
+        L[log_output tool]
+    end
+    subgraph Process["Processing"]
+        direction TB
+        subgraph Store["Store Path"]
+            S[Store Memory] --> E[Embed]
+        end
+        subgraph Mine["Mining Path"]
+            O[Output Log] --> MP[Extract Patterns]
+            MP --> P{Confidence?}
+        end
+    end
+    subgraph Persist["Persistence Layer"]
+        direction LR
+        V[(Vectors)]
+        M[(Metadata)]
+    end
+    subgraph Retrieve["Retrieval"]
+        direction TB
+        Q[recall tool] --> VS[Vector Search]
+        VS --> RK[Composite Rank]
+    end
+    subgraph Cache["Hot Cache Lifecycle"]
+        direction LR
+        PR[Promote] --> H[Hot Cache]
+        H --> DE[Demote]
+    end
+    R --> S
+    L --> O
+    E --> V & M
+    P -->|≥0.8| S
+    P -->|<0.8| A[approve_candidate]
+    A --> S
+    RK --> V & M
+    RK -->|access 3+| PR
+    DE -->|14 days stale| V
+```
+## Module Structure
+```
+src/memory_mcp/
+├── server.py       # MCP tools and resources - the API layer
+├── storage.py      # SQLite operations, vector search, caching logic
+├── helpers.py      # Shared helpers used by server.py (built on models and responses)
+├── responses.py    # Pydantic response models for MCP tools
+├── models.py       # Enums and dataclasses (domain models)
+├── migrations.py   # Database schema and version migrations
+├── mining.py       # Pattern extraction from outputs
+├── config.py       # Settings with environment variable loading
+├── cli.py          # CLI commands for hooks and administration
+├── embeddings.py   # Embedding providers (sentence-transformers, MLX)
+├── text_parsing.py # Content chunking for seeding
+├── logging.py      # Structured logging configuration
+└── metrics.py      # Metrics collection and observability
+```
+### Module Dependencies
+```mermaid
+graph TB
+    subgraph API["API Layer"]
+        direction LR
+        server[server.py]
+        cli[cli.py]
+    end
+    subgraph Core["Core Layer"]
+        direction LR
+        storage[storage.py]
+        mining[mining.py]
+    end
+    subgraph Support["Support Layer"]
+        direction LR
+        helpers[helpers.py]
+        responses[responses.py]
+        embeddings[embeddings.py]
+    end
+    subgraph Foundation["Foundation Layer"]
+        direction LR
+        models[models.py]
+        config[config.py]
+        migrations[migrations.py]
+        logging[logging.py]
+        metrics[metrics.py]
+    end
+    server --> storage & helpers & responses & logging
+    cli --> storage & config
+    storage --> models & migrations & embeddings & config
+    mining --> storage
+    helpers --> models & responses
+    responses --> models
+    metrics --> logging
+```
+### Layer Responsibilities
+| Module | Responsibility |
+|--------|----------------|
+| `server.py` | MCP tools/resources, request validation, response construction |
+| `storage.py` | Data persistence, vector operations, business logic |
+| `responses.py` | Pydantic models for tool return types |
+| `models.py` | Domain enums (MemoryType, TrustReason) and dataclasses (Memory, Session) |
+| `migrations.py` | Database schema definition and version migrations |
+| `mining.py` | Pattern extraction algorithms |
+| `embeddings.py` | Embedding abstraction (MLX on Apple Silicon, otherwise sentence-transformers) |
+| `logging.py` | Loguru configuration, stderr output for MCP compatibility |
+| `metrics.py` | Counters, gauges, and metric recording helpers |
+### Why This Structure?
+1. **Separated concerns**: Models, responses, and migrations extracted for clarity
+2. **Thin server layer**: Adapts storage operations to MCP protocol
+3. **Swappable embeddings**: Backend detection allows hardware optimization
+4. **Backwards-compatible imports**: Re-exports preserve existing import paths
+## Key Design Decisions
+### 1. SQLite + sqlite-vec Over Vector Databases
+**Chose**: SQLite with sqlite-vec extension
+**Alternatives considered**: Pinecone, Weaviate, Milvus, Chroma
+**Rationale**:
+- **Local-first**: No network dependency, instant startup
+- **Simplicity**: Single file database, easy backup/restore
+- **Scale**: Handles thousands of memories efficiently
+- **Portability**: Works everywhere Python works
+**Trade-off**: Limited to single-user, single-machine scenarios
+### 2. Sentence Transformers for Embeddings
+**Chose**: all-MiniLM-L6-v2 (384 dimensions)
+**Alternatives considered**: OpenAI embeddings, larger BERT models
+**Rationale**:
+- **Local**: No API calls, no costs, offline capable
+- **Fast**: ~50ms per embedding on CPU
+- **Small**: 90MB model, 384 dimensions
+- **Quality**: Good semantic similarity for short text
+**Trade-off**: Less powerful than larger models, but sufficient for memory retrieval
+### 3. Automatic Promotion/Demotion
+**Chose**: Frequency-based with configurable thresholds
+**Design**:
+- Promote after 3 accesses (configurable)
+- Demote after 14 days without access (configurable)
+- Evict lowest-scored when cache full
+**Rationale**: Reduces manual intervention while ensuring hot cache reflects actual usage
+### 4. Pattern Mining Pipeline
+**Chose**: Regex-based extraction with occurrence counting
+**Extracted patterns**:
+- Python imports
+- Shell commands (npm, git, docker, etc.)
+- Project facts ("This project uses X")
+- Code blocks from markdown
+**Auto-approval**: Patterns with confidence ≥ 0.8 and occurrences ≥ 3 are automatically approved and stored as memories; other candidates wait for manual review via `approve_candidate`
+**Rationale**: Low overhead, high precision for common patterns
+### 5. Trust Score System
+**Chose**: Decay-based trust with explicit validation/invalidation
+**Design**:
+- Manual memories start at 1.0 trust
+- Mined memories start at 0.7 trust
+- Trust decays over time (type-specific half-lives)
+- Explicit validation/invalidation adjusts trust
+**Rationale**: Older information naturally becomes less reliable; explicit feedback accelerates correction
+### 6. Knowledge Graph
+**Chose**: Simple typed relationships stored in SQLite
+**Relation types**:
+- `relates_to`: General association
+- `depends_on`: Prerequisite
+- `supersedes`: Replaces older info
+- `refines`: More specific version
+- `contradicts`: Conflicting information
+- `elaborates`: More detail
+**Rationale**: Enables context expansion during recall without complex graph database
+### 7. Predictive Hot Cache
+**Chose**: Markov chain of access sequences
+**Design**:
+- Record (memory_A, memory_B) when accessed together
+- Build transition probabilities
+- Pre-warm cache with predicted next memories after each recall
+**Rationale**: Learns actual usage patterns without explicit configuration
+## Configuration Philosophy
+**Principle**: Maximum value with minimal configuration
+Default settings are optimized for immediate value:
+- Predictive cache: Enabled by default
+- Auto-approve mining: Enabled with conservative thresholds
+- Auto-promote/demote: Enabled
+Power users can tune via environment variables, but sensible defaults mean most users never need to.
+## Error Handling Strategy
+1. **Graceful degradation**: If embedding fails, the memory is still stored, just without a vector
+2. **Idempotent operations**: Storing a duplicate merges its tags into the existing memory and increments the access count
+3. **Audit logging**: Destructive operations logged for recovery
+4. **No silent failures**: Errors returned in response, not swallowed
+## Performance Characteristics
+| Operation | Typical Latency | Notes |
+|-----------|-----------------|-------|
+| Hot cache read | 0ms | Auto-injected by MCP |
+| remember() | 50-100ms | Embedding dominates |
+| recall() | 50-150ms | Vector search + ranking |
+| Mining (24h) | 1-5s | Depends on log volume |
+| Bootstrap | 2-10s | Depends on file count |
+## Future Considerations
+### Considered but Deferred
+1. **Multi-user support**: Would require auth, permissions, conflict resolution
+2. **Distributed storage**: Current single-file model sufficient for local use
+3. **Custom embedding models**: Current model adequate; adding complexity not justified
+4. **LLM-based extraction**: Regex patterns sufficient; LLM adds latency and cost
+### Potential Enhancements
+1. **Semantic deduplication**: Merge near-duplicate memories automatically
+2. **Memory aging**: Archive very old, unused memories
+3. **Cross-project sharing**: Share patterns across projects
+4. **Embedding model migration**: Tools to rebuild vectors when changing models
+## References
+- [Engram](https://github.com/AnswerDotAI/engram) - Inspiration for hot cache concept
+- [sqlite-vec](https://github.com/asg017/sqlite-vec) - Vector search extension
+- [FastMCP](https://github.com/jlowin/fastmcp) - MCP server framework
+- [sentence-transformers](https://www.sbert.net/) - Embedding models