PyPI - memstash - Versions diffs - 0.15.0__tar.gz - Mend

memstash 0.15.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (59) hide show

memstash-0.15.0/.github/workflows/ci.yml +26 -0
memstash-0.15.0/.github/workflows/publish.yml +47 -0
memstash-0.15.0/.gitignore +25 -0
memstash-0.15.0/CHANGELOG.md +293 -0
memstash-0.15.0/LICENSE +21 -0
memstash-0.15.0/PKG-INFO +471 -0
memstash-0.15.0/README.md +418 -0
memstash-0.15.0/ROADMAP.md +118 -0
memstash-0.15.0/examples/basic.py +22 -0
memstash-0.15.0/memstash/__init__.py +18 -0
memstash-0.15.0/memstash/adapters/__init__.py +165 -0
memstash-0.15.0/memstash/adapters/anthropic_adapter.py +75 -0
memstash-0.15.0/memstash/adapters/base.py +61 -0
memstash-0.15.0/memstash/adapters/gemini_adapter.py +77 -0
memstash-0.15.0/memstash/adapters/openai_adapter.py +90 -0
memstash-0.15.0/memstash/bench.py +150 -0
memstash-0.15.0/memstash/cli.py +998 -0
memstash-0.15.0/memstash/config.py +80 -0
memstash-0.15.0/memstash/core.py +594 -0
memstash-0.15.0/memstash/dashboard/__init__.py +1 -0
memstash-0.15.0/memstash/dashboard/server.py +143 -0
memstash-0.15.0/memstash/evals.py +98 -0
memstash-0.15.0/memstash/extract.py +53 -0
memstash-0.15.0/memstash/extract_llm.py +90 -0
memstash-0.15.0/memstash/graph_extract.py +77 -0
memstash-0.15.0/memstash/ingest.py +57 -0
memstash-0.15.0/memstash/instrument.py +121 -0
memstash-0.15.0/memstash/mcp_server.py +108 -0
memstash-0.15.0/memstash/memory.py +388 -0
memstash-0.15.0/memstash/otel_export.py +92 -0
memstash-0.15.0/memstash/pricing.py +140 -0
memstash-0.15.0/memstash/prompts.py +39 -0
memstash-0.15.0/memstash/reconcile.py +109 -0
memstash-0.15.0/memstash/store.py +738 -0
memstash-0.15.0/pyproject.toml +70 -0
memstash-0.15.0/tests/test_bench.py +52 -0
memstash-0.15.0/tests/test_bitemporal.py +66 -0
memstash-0.15.0/tests/test_core.py +103 -0
memstash-0.15.0/tests/test_embeddings.py +87 -0
memstash-0.15.0/tests/test_eval_suites.py +92 -0
memstash-0.15.0/tests/test_evals.py +84 -0
memstash-0.15.0/tests/test_features.py +118 -0
memstash-0.15.0/tests/test_graph.py +66 -0
memstash-0.15.0/tests/test_graph_retrieval.py +57 -0
memstash-0.15.0/tests/test_ingest.py +87 -0
memstash-0.15.0/tests/test_instrument.py +88 -0
memstash-0.15.0/tests/test_lifecycle.py +113 -0
memstash-0.15.0/tests/test_memory_ops.py +112 -0
memstash-0.15.0/tests/test_multiturn.py +64 -0
memstash-0.15.0/tests/test_otel.py +32 -0
memstash-0.15.0/tests/test_plugins.py +44 -0
memstash-0.15.0/tests/test_pricing_map.py +47 -0
memstash-0.15.0/tests/test_prompts.py +50 -0
memstash-0.15.0/tests/test_provenance.py +54 -0
memstash-0.15.0/tests/test_reconcile.py +105 -0
memstash-0.15.0/tests/test_retrieval_budget.py +127 -0
memstash-0.15.0/tests/test_robustness.py +83 -0
memstash-0.15.0/tests/test_trace_tree.py +76 -0
memstash-0.15.0/tests/test_v3.py +114 -0

memstash-0.15.0/.github/workflows/ci.yml ADDED Viewed

@@ -0,0 +1,26 @@
+name: CI
+on:
+  push:
+    branches: [main]
+  pull_request:
+jobs:
+  test:
+    runs-on: ubuntu-latest
+    strategy:
+      matrix:
+        python-version: ["3.9", "3.11", "3.12"]
+    steps:
+      - uses: actions/checkout@v4
+      - uses: actions/setup-python@v5
+        with:
+          python-version: ${{ matrix.python-version }}
+      - name: Install
+        run: |
+          python -m pip install --upgrade pip
+          pip install -e '.[dev]'
+      - name: Lint
+        run: ruff check memstash
+      - name: Test
+        run: pytest -q

memstash-0.15.0/.github/workflows/publish.yml ADDED Viewed

@@ -0,0 +1,47 @@
+name: Publish to PyPI
+# Publishes memstash to PyPI when a version tag is pushed (e.g. v0.3.0).
+# Uses PyPI Trusted Publishing (OIDC) — no API token stored in the repo.
+#
+# One-time setup on PyPI:
+#   1. Create the project `memstash` (or let the first manual upload create it).
+#   2. PyPI → project → Publishing → add a trusted publisher:
+#        owner: zionLyl  repo: recall  workflow: publish.yml  environment: pypi
+#
+# Then releasing is just:  git tag v0.3.0 && git push origin v0.3.0
+on:
+  push:
+    tags:
+      - "v*"
+jobs:
+  build:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+      - uses: actions/setup-python@v5
+        with:
+          python-version: "3.11"
+      - name: Build sdist + wheel
+        run: |
+          python -m pip install --upgrade build
+          python -m build
+      - uses: actions/upload-artifact@v4
+        with:
+          name: dist
+          path: dist/
+  publish:
+    needs: build
+    runs-on: ubuntu-latest
+    environment: pypi
+    permissions:
+      id-token: write   # required for trusted publishing
+    steps:
+      - uses: actions/download-artifact@v4
+        with:
+          name: dist
+          path: dist/
+      - name: Publish to PyPI
+        uses: pypa/gh-action-pypi-publish@release/v1

memstash-0.15.0/.gitignore ADDED Viewed

@@ -0,0 +1,25 @@
+# Python
+__pycache__/
+*.py[cod]
+*.egg-info/
+.eggs/
+build/
+dist/
+.venv/
+venv/
+env/
+# recall local data
+.recall/
+*.db
+*.sqlite
+# tooling
+.pytest_cache/
+.ruff_cache/
+.mypy_cache/
+# OS / editor
+.DS_Store
+.vscode/
+.idea/

memstash-0.15.0/CHANGELOG.md ADDED Viewed

@@ -0,0 +1,293 @@
+# Changelog
+## [0.15.0]
+Renamed to **memstash** (the PyPI name `engram-ai` collided with the existing
+`engram` project). Brand, CLI command, and import are all `memstash` now.
+### Changed
+- PyPI package + CLI + import are now **`memstash`** (`pip install memstash`,
+  `memstash ...`, `import memstash`). The `Memstash` class is exported (the
+  `Recall` class name still works as an alias).
+- Env vars are `MEMSTASH_*`; the default store is `~/.memstash/memstash.db`;
+  the adapter entry-point group is `memstash.adapters`.
+- (The unreleased `engram-ai` 0.14.0 was never published; this supersedes it.)
+## [0.14.0]
+Rebrand to **Engram**.
+### Changed
+- Project renamed from `zion-recall-ai` to **`engram-ai`** (PyPI) with the
+  **`engram`** CLI command and `import engram`. The `Engram` class is exported
+  (the old `Recall` class name still works as an alias).
+- Env vars are now `ENGRAM_*` (was `RECALL_*`); the default store moved to
+  `~/.engram/engram.db`; the adapter entry-point group is `engram.adapters`.
+- README reworked with a sharper pitch, a comparison table, and CI/PyPI badges.
+## [0.13.0]
+New capability (3/3): capture other libraries' LLM calls.
+### Added
+- **`recall.instrument()`**: makes recall a *local* OpenInference/OpenTelemetry
+  span sink — LLM calls made by LangChain, LlamaIndex, the OpenAI SDK, etc.
+  (instrumented via OpenInference) get written to `~/.engram/recall.db` as
+  traces (model, tokens, cost, latency, `kind="instrumented"`), visible in
+  `engram recent` / `stats` / `trace`. No server, no cloud — the local
+  counterpart to Phoenix/Langfuse auto-instrumentation. Best-effort enables the
+  OpenAI/LangChain instrumentors if installed. New `recall/instrument.py`
+  (`span_to_trace`, `instrument`). Requires `[otel]`.
+## [0.12.0]
+New capability (2/3): document ingestion.
+### Added
+- **`engram ingest <file>`**: read a `.txt` / `.md` (or `.pdf` with the `[pdf]`
+  extra), split it into reasonably-sized chunks, and store each as a searchable
+  memory tagged with the filename — so `engram search` and chat memory-injection
+  cover your notes/docs. 100% local and deterministic (no LLM). Dedupes on
+  re-ingest. `recall/ingest.py` (`chunk_text`, `read_file`) + `Recall.ingest`.
+## [0.11.0]
+New capability (1/3): bi-temporal memory.
+### Added
+- **Point-in-time queries**: `engram list --at <when>` shows the memories that
+  were valid at a past time — `YYYY-MM-DD`, a relative `30d`/`12h`/`45m` ago, or
+  an epoch. Includes since-forgotten memories whose validity window covers that
+  moment. `Store.memories_as_of()` / `Recall.as_of()`.
+### Changed
+- **Conflict-resolution UPDATE now supersedes instead of overwriting**: the old
+  fact's validity window is closed (kept as history, deactivated) and the new
+  fact is added — so "what did I know on date X?" stays answerable.
+## [0.10.0]
+Credibility — reproducible quality numbers.
+### Added
+- **Benchmark harness** (`engram benchmark`): deterministic, key-free. Seeds a
+  fixed, hand-labeled memory set into a throwaway store and reports retrieval
+  quality — **recall@1, recall@k, precision@k, MRR** — plus a heuristic
+  extraction fact-recall / false-capture check. Honestly labels whether the run
+  used the semantic or keyword/BM25 backend, so numbers are comparable and not
+  overstated. New `recall/bench.py` (`run_retrieval_benchmark`,
+  `run_extraction_benchmark`, `run_all`). Baseline (keyword): recall@1 ≈ 0.50,
+  MRR ≈ 0.69, extraction fact-recall 1.00 with 0 false captures; semantic
+  embeddings score higher.
+## [0.9.0]
+Robustness & scale.
+### Added
+- **Vectorized retrieval**: semantic ranking now uses numpy (when present) to
+  cosine-score all memories in one matrix op, with a pure-Python fallback —
+  keeping recall fast as the store grows to thousands of memories. No new
+  required dependency.
+### Fixed
+- **Embedding dimension safety**: stored vectors whose dimension differs from
+  the query (e.g. after switching embedding models/backends) are now skipped
+  instead of producing silently-wrong cosine scores. `_cosine` returns 0 on
+  mismatch, protecting search, near-dup suppression, and dedupe.
+### Changed
+- SQLite now opens in **WAL** mode (`synchronous=NORMAL`) for safer concurrent
+  reads/writes (e.g. the dashboard reading while the CLI writes).
+## [0.8.0]
+### Added
+- **Pluggable embedding backend**: semantic search can now use any
+  OpenAI-compatible `/embeddings` endpoint instead of the local
+  sentence-transformers model — point at a local Ollama / LM Studio (no PyTorch
+  download) or a cloud provider. Config: `embedding_backend = api`,
+  `embedding_model`, `embedding_base_url`, `embedding_api_key_env`. Falls back to
+  keyword/BM25 search if the endpoint is unreachable. Default stays `local`.
+### Changed
+- Published to PyPI as **`engram-ai`** (`pip install engram-ai`); the
+  import package and `recall` CLI command are unchanged. README gains a PyPI
+  badge + prominent install line.
+## [0.7.0]
+Usability & onboarding polish — informed by a competitive scan of how peers
+(simonw/llm, Jan, Phoenix, mem0, …) handle ease-of-adoption.
+### Added
+- **Interactive chat REPL**: bare `engram chat` (no prompt) drops into a
+  multi-turn conversation loop — memory injected + auto-captured each turn,
+  cost traced, `/exit` or Ctrl-D to quit. Matches `llm chat`'s ergonomics.
+- **Multi-turn conversation history**: adapters and `Recall.chat/stream` accept
+  a `history` of prior turns, so chats are no longer single-shot. OpenAI,
+  Anthropic, and Gemini adapters all thread it natively.
+- **Zero-key local default**: `engram init` now detects a running Ollama
+  (localhost:11434) and offers it as the default provider — no API key needed.
+### Changed
+- **Onboarding**: README leads with `pipx install 'engram-ai[all]'` (and `uv tool
+  install`); the quickstart's first chat command now installs a working provider
+  extra instead of failing on the base install.
+- First semantic search prints a one-time "loading embedding model (~80MB)"
+  notice to stderr instead of hanging silently.
+## [0.6.0]
+The rest of the roadmap — extensibility, interop, auditing, and eval workflow.
+### Added
+- **Provenance**: auto-captured memories record the chat trace they came from
+  (`source_trace`); `engram show <id>` prints a memory's detail plus the source
+  call's model and prompt snippet for end-to-end auditing.
+- **Plugin hooks**: `recall.register_adapter(...)` for runtime custom providers,
+  and auto-discovery of adapters published under the `recall.adapters`
+  entry-point group. *(simonw/llm-style.)*
+- **OpenTelemetry export** (opt-in): `config otel_export true` mirrors calls as
+  OpenInference LLM spans to an OTLP backend (Phoenix/Langfuse) or the console —
+  no server dependency. `pip install 'engram-ai[otel]'`.
+- **Eval ergonomics**: saved eval suites (`engram eval-suite save/list/rm`,
+  `engram eval <id> --suite NAME`), an eval pass-rate/score summary in
+  `engram stats`, and opt-in **auto-eval after chat** (`config auto_eval_suite`).
+## [0.5.0]
+Retrieval, cost accuracy, and quality — the next batch from the roadmap.
+### Added
+- **Graph-aware retrieval**: with `graph_weight > 0`, recall finds entities
+  named in the query, expands to their neighbors via the graph-lite relations,
+  and pulls in memories about those neighbors as an extra RRF signal — surfacing
+  connected memories the query never mentions. *(mem0/Zep-style.)*
+- **Maintained pricing map**: provider-prefixed ids resolve
+  (`openrouter/openai/gpt-4o` → `gpt-4o`); override without editing the package
+  via `ENGRAM_PRICING_FILE` (JSON file) layered under `ENGRAM_PRICING` (inline);
+  more current models added; `engram pricing [model]` to inspect. *(LiteLLM-style.)*
+- **Quality evals**: attach checks to a traced reply — local rules
+  (`--contains` / `--not-contains` / `--regex` / `--max-tokens`, free &
+  deterministic) and an opt-in `--judge "criterion"` LLM score (1–5 → 0–1).
+  `engram eval <trace_id> ...` and `engram evals` list results; `engram recent`
+  now shows trace IDs and kind. *(Langfuse/Phoenix-style, local.)*
+## [0.4.0]
+Memory intelligence + deeper local observability — closing the biggest gaps vs
+mem0 / Letta / Zep / Langfuse, while staying single-file and server-free.
+### Added
+- **Memory lifecycle**: memories track `hit_count` / `last_used` and a
+  `valid_from` / `valid_to` / `active` window. Retrieval records hits and skips
+  inactive memories. Soft-forget via `engram forget --soft` and bulk
+  `engram prune --older-than DAYS --unused`. Opt-in recency/usage ranking
+  (`config recency_weight`) blends a lifecycle signal into retrieval via
+  weighted RRF. *(Zep/Letta-inspired.)*
+- **Conflict resolution (ADD/UPDATE/DELETE/NOOP)**: opt-in `memory_ops = "llm"`
+  reconciles each new fact against its most-related memories so contradictions
+  are updated/removed instead of piling up. New `reconcile.py`; cost traced;
+  degrades to a plain ADD on any failure. *(mem0's signature.)*
+- **Graph-lite**: a `relations` table stores `(subject, predicate, object)`
+  triples per scope — relational memory without a graph DB. Opt-in LLM mining
+  (`graph_extract`) from chats; `engram graph [entity]` to query, `--add` to add
+  manually. *(mem0/Zep/cognee-style, single-SQLite.)*
+- **Local trace tree**: traces gain `session_id` / `parent_id` / `kind`, so a
+  turn's chat + its extraction/reconcile/graph calls form a tree. `engram trace`
+  renders per-turn call trees with token/cost totals; the dashboard gains a
+  "Recent turns" section.
+- **Prompt templates / fragments**: `engram prompt save/list/show/use/rm` with
+  `{var}` substitution; `engram chat --template NAME --var k=v`. *(simonw/llm-style.)*
+## [0.3.0]
+Streaming, smarter memory, and the MCP bridge.
+### Added
+- **Streaming chat**: replies now type out token-by-token. `Recall.stream(...)`
+  yields chunks via an `on_token` callback and still returns the full
+  `ChatOutcome` (text, tokens, cost, auto-memory, budget). CLI: streams by
+  default; toggle with `engram chat --no-stream` or `config set stream false`.
+  Every adapter supports it — native OpenAI / Anthropic / Gemini adapters stream
+  for real, others transparently fall back to a single chunk.
+- **LLM-based memory extraction** (opt-in): set `extraction_mode = "llm"` to let
+  a model pull durable first-person facts from each message — higher recall than
+  the heuristic patterns. Configurable extraction model (`extraction_model`),
+  its cost is traced, and it falls back to the heuristic extractor on any error.
+- **MCP server** (`engram mcp`): exposes your memory to any MCP-aware agent
+  (Claude Desktop, Claude Code, Cursor, …) as tools — `remember`,
+  `recall_search`, `list_memories`, `forget`, `usage_stats`. Same local SQLite
+  store, nothing leaves your machine. Install with `pip install 'engram-ai[mcp]'`.
+- **Memory editing**: `engram edit <id> "new content" [--tags ...]` updates a
+  memory in place and re-embeds it. Library: `Recall.edit(...)`.
+- **Similarity merge / dedupe**: `engram dedupe [--threshold 0.9] [--all]
+  [--dry-run]` clusters near-duplicate memories by cosine similarity, keeps the
+  earliest, and unions their tags. Optional on-add suppression via
+  `config set dedupe_similarity 0.95` (both need embeddings; exact dedupe still
+  works without them).
+- **Hybrid retrieval**: memory search now fuses semantic (embeddings) with
+  BM25 keyword ranking (SQLite FTS5) via Reciprocal Rank Fusion — exact terms,
+  names, and IDs the embeddings blur now surface, while semantically-close
+  memories still rank. FTS5 stays in sync via triggers and falls back to LIKE
+  where unavailable. No new dependencies. *(mem0 / Zep do the same.)*
+- **Budget hard-stop**: `config set budget_enforce true` makes recall *refuse*
+  a call once today's spend hits `daily_budget_usd` (raises `BudgetExceeded`),
+  instead of only warning. *(LiteLLM-style.)*
+### Fixed
+- Install hints (`engram-ai[dashboard]`, `engram-ai[mcp]`) and model output are
+  no longer mangled by Rich markup parsing.
+### Packaging
+- PyPI Trusted Publishing workflow (`.github/workflows/publish.yml`): push a
+  `vX.Y.Z` tag to publish. CI workflow runs lint + tests on 3.9 / 3.11 / 3.12.
+## [0.2.0]
+Major feature round.
+### Added
+- **Auto-memory**: after each chat, recall heuristically captures durable
+  first-person facts/preferences (English + Chinese), tagged as `auto`.
+- **Memory scopes**: isolate memories per project/context
+  (`engram scope work`, `--scope`, `--all`). Active scope stored in config.
+- **Config system** (`~/.engram/config.json`): default provider/model, daily
+  budget, auto-memory toggle, inject limit, active scope.
+  CLI: `engram config show|set|path`.
+- **Daily budget + warnings**: set `daily_budget_usd`; chat and `stats` warn at
+  80% and 100% of the day's spend.
+- **Guided setup**: `engram init` (pick defaults, detect keys) and
+  `engram doctor` (which providers are ready).
+- **Export / import**: `engram export mem.json` / `engram import mem.json`
+  (JSON, dedupe-aware).
+- **Deduplication**: identical memories in the same scope are skipped.
+- **Flexible chat**: `engram chat "prompt"` uses configured defaults; the
+  three-arg form still works.
+- **Dashboard upgrades**: auto-refresh, daily-budget bar, scope chips.
+- Safe schema migrations for existing databases.
+### Changed
+- `Recall.chat()` now returns a richer `ChatOutcome` (cost, latency,
+  auto-remembered list, budget warning).
+## [0.1.0]
+First MVP.
+### Added
+- Local-first SQLite store (`~/.engram/recall.db`) for memories + call traces.
+- Memory engine with semantic search (sentence-transformers) and automatic
+  keyword fallback when embeddings are not installed.
+- **22 model providers** out of the box: OpenAI, Anthropic, Gemini, DeepSeek,
+  Qwen, Moonshot (Kimi), Zhipu (GLM), MiniMax, Baichuan, 01.AI (Yi), StepFun,
+  Mistral, xAI (Grok), Groq, Together, Fireworks, DeepInfra, Perplexity,
+  OpenRouter, Ollama, LM Studio, and any OpenAI-compatible endpoint.
+- Per-provider API key env var resolution with `ENGRAM_API_KEY` fallback.
+- Expanded pricing table covering the new providers.
+- Automatic per-call tracing: tokens, estimated cost, latency.
+- CLI: `add`, `search`, `list`, `forget`, `chat`, `stats`, `recent`, `models`,
+  `dashboard`, `version`.
+- Minimal local web dashboard (FastAPI, single page, no build step).
+- Library API via `from recall import Recall`.

memstash-0.15.0/LICENSE ADDED Viewed

@@ -0,0 +1,21 @@
+MIT License
+Copyright (c) 2026 zionLyl
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.