PyPI - ccrecall - Versions diffs - 0.10.0__tar.gz - Mend

ccrecall 0.10.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (75) hide show

ccrecall-0.10.0/LICENSE +21 -0
ccrecall-0.10.0/PKG-INFO +244 -0
ccrecall-0.10.0/README.md +210 -0
ccrecall-0.10.0/pyproject.toml +113 -0
ccrecall-0.10.0/setup.cfg +4 -0
ccrecall-0.10.0/src/ccrecall/__init__.py +18 -0
ccrecall-0.10.0/src/ccrecall/cli/__init__.py +98 -0
ccrecall-0.10.0/src/ccrecall/cli/commands.py +245 -0
ccrecall-0.10.0/src/ccrecall/cli/context.py +31 -0
ccrecall-0.10.0/src/ccrecall/content.py +152 -0
ccrecall-0.10.0/src/ccrecall/db.py +306 -0
ccrecall-0.10.0/src/ccrecall/embeddings.py +125 -0
ccrecall-0.10.0/src/ccrecall/formatting.py +144 -0
ccrecall-0.10.0/src/ccrecall/fusion.py +17 -0
ccrecall-0.10.0/src/ccrecall/hooks/__init__.py +0 -0
ccrecall-0.10.0/src/ccrecall/hooks/backfill_embeddings.py +374 -0
ccrecall-0.10.0/src/ccrecall/hooks/backfill_summaries.py +99 -0
ccrecall-0.10.0/src/ccrecall/hooks/clear_handoff.py +49 -0
ccrecall-0.10.0/src/ccrecall/hooks/import_conversations.py +271 -0
ccrecall-0.10.0/src/ccrecall/hooks/memory_context.py +539 -0
ccrecall-0.10.0/src/ccrecall/hooks/memory_setup.py +162 -0
ccrecall-0.10.0/src/ccrecall/hooks/memory_sync.py +57 -0
ccrecall-0.10.0/src/ccrecall/hooks/onboarding.py +83 -0
ccrecall-0.10.0/src/ccrecall/hooks/sync_current.py +154 -0
ccrecall-0.10.0/src/ccrecall/hooks/write_config.py +51 -0
ccrecall-0.10.0/src/ccrecall/models.py +121 -0
ccrecall-0.10.0/src/ccrecall/parsing.py +314 -0
ccrecall-0.10.0/src/ccrecall/project_ops.py +92 -0
ccrecall-0.10.0/src/ccrecall/recent_chats.py +204 -0
ccrecall-0.10.0/src/ccrecall/schema.py +192 -0
ccrecall-0.10.0/src/ccrecall/search_conversations.py +500 -0
ccrecall-0.10.0/src/ccrecall/serialization.py +41 -0
ccrecall-0.10.0/src/ccrecall/session_ops.py +563 -0
ccrecall-0.10.0/src/ccrecall/session_tail.py +384 -0
ccrecall-0.10.0/src/ccrecall/summarizer.py +427 -0
ccrecall-0.10.0/src/ccrecall/token_analytics.py +212 -0
ccrecall-0.10.0/src/ccrecall/token_dashboard.py +119 -0
ccrecall-0.10.0/src/ccrecall/token_insights.py +862 -0
ccrecall-0.10.0/src/ccrecall/token_output.py +867 -0
ccrecall-0.10.0/src/ccrecall/token_parser.py +661 -0
ccrecall-0.10.0/src/ccrecall/token_schema.py +206 -0
ccrecall-0.10.0/src/ccrecall.egg-info/PKG-INFO +244 -0
ccrecall-0.10.0/src/ccrecall.egg-info/SOURCES.txt +73 -0
ccrecall-0.10.0/src/ccrecall.egg-info/dependency_links.txt +1 -0
ccrecall-0.10.0/src/ccrecall.egg-info/entry_points.txt +7 -0
ccrecall-0.10.0/src/ccrecall.egg-info/requires.txt +11 -0
ccrecall-0.10.0/src/ccrecall.egg-info/top_level.txt +1 -0
ccrecall-0.10.0/tests/test_backfill_embeddings.py +719 -0
ccrecall-0.10.0/tests/test_boundary_validation.py +149 -0
ccrecall-0.10.0/tests/test_clear_handoff_contract.py +233 -0
ccrecall-0.10.0/tests/test_cli_context.py +23 -0
ccrecall-0.10.0/tests/test_content.py +377 -0
ccrecall-0.10.0/tests/test_context_injection.py +738 -0
ccrecall-0.10.0/tests/test_db.py +826 -0
ccrecall-0.10.0/tests/test_embeddings.py +110 -0
ccrecall-0.10.0/tests/test_formatting.py +283 -0
ccrecall-0.10.0/tests/test_fusion.py +62 -0
ccrecall-0.10.0/tests/test_import_pipeline.py +699 -0
ccrecall-0.10.0/tests/test_ingest_token_data.py +620 -0
ccrecall-0.10.0/tests/test_integration.py +267 -0
ccrecall-0.10.0/tests/test_onboarding.py +164 -0
ccrecall-0.10.0/tests/test_parsing.py +383 -0
ccrecall-0.10.0/tests/test_project_ops.py +132 -0
ccrecall-0.10.0/tests/test_recent_chats.py +158 -0
ccrecall-0.10.0/tests/test_search.py +909 -0
ccrecall-0.10.0/tests/test_security.py +92 -0
ccrecall-0.10.0/tests/test_serialization.py +58 -0
ccrecall-0.10.0/tests/test_session_ops.py +690 -0
ccrecall-0.10.0/tests/test_session_tail.py +276 -0
ccrecall-0.10.0/tests/test_summarizer.py +667 -0
ccrecall-0.10.0/tests/test_sync_hook.py +641 -0
ccrecall-0.10.0/tests/test_token_insights.py +530 -0
ccrecall-0.10.0/tests/test_token_output.py +211 -0
ccrecall-0.10.0/tests/test_token_parser.py +280 -0
ccrecall-0.10.0/tests/test_write_config.py +186 -0

ccrecall-0.10.0/LICENSE ADDED Viewed

@@ -0,0 +1,21 @@
+MIT License
+Copyright (c) 2026 Jessica Smith
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

ccrecall-0.10.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,244 @@
+Metadata-Version: 2.4
+Name: ccrecall
+Version: 0.10.0
+Summary: Conversation history and semantic search for Claude Code
+Author-email: Jessica Smith <12jessicasmith34@gmail.com>
+License-Expression: MIT
+Project-URL: Homepage, https://github.com/NodeJSmith/claude-code-recall
+Project-URL: Issues, https://github.com/NodeJSmith/claude-code-recall/issues
+Project-URL: Changelog, https://github.com/NodeJSmith/claude-code-recall/blob/main/CHANGELOG.md
+Keywords: claude-code,conversation-history,search,recall,transcripts,semantic-search
+Classifier: Development Status :: 4 - Beta
+Classifier: Environment :: Console
+Classifier: Intended Audience :: Developers
+Classifier: Operating System :: OS Independent
+Classifier: Programming Language :: Python :: 3
+Classifier: Programming Language :: Python :: 3.10
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Programming Language :: Python :: 3.13
+Classifier: Programming Language :: Python :: 3.14
+Classifier: Topic :: Utilities
+Classifier: Topic :: Software Development :: Libraries :: Python Modules
+Requires-Python: >=3.10
+Description-Content-Type: text/markdown
+License-File: LICENSE
+Requires-Dist: sqlite-vec==0.1.9
+Requires-Dist: fastembed==0.8.0
+Requires-Dist: numpy==2.2.6; python_version < "3.11"
+Requires-Dist: numpy==2.4.6; python_version >= "3.11"
+Requires-Dist: whenever==0.10.0
+Requires-Dist: pydantic==2.13.4
+Requires-Dist: cyclopts>=4.16
+Dynamic: license-file
+# ccrecall
+**Conversation history and semantic search for Claude Code.**
+ccrecall stores your Claude Code sessions in a local SQLite database so you can recall past conversations, search across them by keyword and meaning, and get automatic context on session start. Everything runs on your machine — no data leaves it.
+> ccrecall is an independent, community project for [Claude Code](https://docs.anthropic.com/en/docs/claude-code). It is not affiliated with, endorsed by, or sponsored by Anthropic.
+## What it does
+Every time a Claude Code session ends, the conversation is synced to `~/.ccrecall/conversations.db`. On your next session start, Claude automatically gets a summary of what you were last working on. You can also search past sessions by keyword or pull recent ones at any time.
+## Install
+ccrecall has two parts: a **Python package** (the `ccrecall` CLI plus the hook binaries) and a **Claude Code plugin** (the `/ccr-*` skills and the hook wiring). Install both.
+**1. Install the package** — puts `ccrecall` and the hook commands on your PATH:
+```bash
+uv tool install ccrecall
+```
+(`pipx install ccrecall` or `pip install ccrecall` work too.)
+**2. Enable the plugin** — ccrecall ships as a Claude Code plugin. The repo doubles as a single-plugin marketplace, so from inside Claude Code:
+```
+/plugin marketplace add NodeJSmith/claude-code-recall
+/plugin install ccrecall@claude-code-recall
+```
+That registers the skills and wires the SessionStart / Stop / SessionEnd hooks (`hooks/hooks.json`) — both are auto-discovered from the plugin's directory layout. Reload with `/reload-plugins` if they don't appear immediately.
+> Plugin skills are namespaced under the plugin name, so the skills below are invoked as `/ccrecall:ccr-recall`, `/ccrecall:ccr-resume`, and `/ccrecall:ccr-tokens`. The hook commands degrade gracefully — each is guarded by `command -v … || true`, so if the package isn't installed (or isn't yet on PATH) the hook is a silent no-op rather than a broken session.
+## First-run setup
+On your first session after installing, Claude will notice that `~/.ccrecall/config.json` doesn't exist and walk you through a brief onboarding. It asks a single question — **session context injection**: should Claude automatically recall what you were working on last session?
+Your choice gets written to `~/.ccrecall/config.json`. You can edit that file directly at any time to change settings.
+To skip the walkthrough and use recommended defaults immediately:
+```bash
+ccrecall write-config --defaults
+```
+## Semantic search
+Search results are fused from two signals: keyword full-text search (FTS5 → FTS4 → LIKE fallback) and vector similarity from a locally-running embedding model. The two ranked lists are merged with Reciprocal Rank Fusion (RRF), so results that rank well in both signals appear first.
+The embedding model is [jina-embeddings-v2-small-en](https://huggingface.co/jinaai/jina-embeddings-v2-small-en) (512-dim), running entirely on your machine via [fastembed](https://github.com/qdrant/fastembed). No data leaves your machine.
+### Coverage
+New sessions are embedded automatically as they sync (embed-on-write), so coverage builds forward on its own. Only **active-leaf** branches are embedded — at most one active leaf per session (maintained by sync/import), not its abandoned forks/retries. The flag isn't DB-enforced, but sync/import marks exactly one branch `is_active=1` per session. The search path only ever returns active leaves, so embedding inactive forks would just produce vectors that can never surface.
+### Optional: seed historical conversations
+Embedding runs on CPU via fastembed. jina-v2-small-en is light — a few milliseconds for a short summary, up to ~400ms for a long one — but seeding a large history (~2k active leaves) is still a bounded chunk of work, and a parallel run can thrash a small or shared box. It is therefore **opt-in** — it is *not* auto-spawned on SessionStart — so it never fires unbidden. Run it yourself when you want to seed:
+```bash
+ccrecall backfill embeddings              # all active leaves, all history
+ccrecall backfill embeddings --days 14    # only the last 14 days
+ccrecall backfill embeddings --limit 500  # cap this run at 500 branches
+ccrecall backfill embeddings --threads 4  # use 4 inference threads (idle machine)
+```
+It runs at low scheduling priority (`nice`) and a single inference thread by default so it yields to interactive work. Tune the thread count with `--threads` (e.g. `--threads 4` on an idle workstation to finish faster). Progress prints to stderr (one line per batch); the run is resumable — re-running skips already-embedded branches.
+### Flags
+| Flag | Effect |
+|------|--------|
+| `--keyword-only` | Skip the embedding step entirely, use keyword search only |
+| `--status` | Print diagnostic info (vec extension loaded, model name, embedded vs. total summarized (embeddable) branch count) and exit 0 |
+### Runtime deps
+The semantic search path depends on three packages:
+- `sqlite-vec` — SQLite extension for vector KNN queries
+- `fastembed` — downloads and runs the embedding model (manages onnxruntime + tokenization)
+- `numpy` — vector math (normalization)
+These are included in the package dependencies. If fastembed fails to import (e.g. ABI mismatch on an unusual platform), search falls back silently to keyword-only mode.
+### Degradation
+Semantic fusion is automatically disabled when:
+- The embedding model can't be loaded (e.g. a first-run download failed and no cached copy exists)
+- `fastembed` cannot be imported
+- `sqlite-vec` cannot be loaded on the connection (e.g. Python built without loadable extensions)
+In all cases, search falls back to keyword-only and returns results normally. Use `ccrecall search --status` to check which path is active.
+## Skills
+| Skill | Trigger | What it does |
+|---|---|---|
+| `/ccr-recall` | "what did we discuss", "continue where we left off", "search my conversations" | Lets Claude search or browse your past sessions on demand |
+| `/ccr-resume` | "pick up where we left off after /clear", a stop, or an unanswered question | Reconstructs the prior session's intent from its transcript tail and surfaces any unresolved decision |
+| `/ccr-tokens` | "analyze Claude token usage", "how much am I spending on Claude" | Full cost + workflow analytics report with an interactive HTML dashboard |
+## Entry points
+### Hooks (run automatically — don't call these manually)
+These are wired by the plugin's `hooks/hooks.json` and fire on their respective Claude Code events.
+| Entry point | Event | What it does |
+|---|---|---|
+| `ccrecall-setup` | SessionStart | Creates `~/.ccrecall/` if needed, opens the DB to apply any pending migrations, then spawns `ccrecall import` and `ccrecall backfill summaries` as background processes |
+| `ccrecall-onboarding` | SessionStart (startup only) | One-time first-run onboarding. Injects setup instructions into Claude's context if `config.json` is missing or onboarding hasn't been completed. Silent no-op after that |
+| `ccrecall-context` | SessionStart (startup + clear) | Injects a summary of your most recent session into Claude's context so it knows what you were working on. On `/clear`, reads a handoff file to link directly to the session you just cleared from |
+| `ccrecall-clear-handoff` | SessionEnd (clear only) | Writes a small handoff file so the next session start knows which session to link to after a `/clear`. Without this, context injection falls back to a "most recent session" heuristic |
+| `ccrecall-sync` | Stop | Syncs the current session to the DB in a detached background process. Runs on every session end |
+> These are kept as separate console scripts (rather than `ccrecall hook …` subcommands) on purpose: hooks fire on every session boundary, and a direct entry point avoids eagerly importing the full CLI command surface on the hot path.
+### Internal helpers (spawned by hooks — don't call these manually)
+| Entry point | What it does |
+|---|---|
+| `ccrecall sync-current` | Syncs a single session file to the DB. Called by `ccrecall-sync` with the session ID from stdin |
+| `ccrecall import` | Full import of all JSONL files in `~/.claude/projects/`. Skips files that haven't changed since last import (file hash check). Run on first install and whenever new sessions need backfilling |
+| `ccrecall backfill summaries` | Generates context summaries for any DB branches that don't have one yet. Runs in the background after `ccrecall-setup` |
+| `ccrecall write-config` | Writes `~/.ccrecall/config.json`. Called by Claude during onboarding to persist your settings choices. You can also call it directly — run `ccrecall write-config --help` for flags |
+### Skill CLIs (called from skill files — can also be used directly)
+These are the `ccrecall` subcommands the `/ccr-*` skills invoke. You can run them from the terminal too.
+| Entry point | What it does |
+|---|---|
+| `ccrecall recent` | Prints recent sessions from the DB in markdown (default) or JSON. Used by `/ccr-recall` |
+| `ccrecall search` | Searches sessions by keyword fused with vector similarity (FTS5 → FTS4 → LIKE fallback, RRF-fused with jina embeddings when available). Used by `/ccr-recall` |
+| `ccrecall tail` | Reads the tail of a prior session's transcript to recover the last instruction and any unanswered question. Used by `/ccr-resume` |
+| `ccrecall backfill embeddings` | Opt-in seeding of embeddings for historical active-leaf branches (jina-v2-small-en via fastembed). Not auto-spawned. Supports `--days N` / `--limit N` / `--threads N`; throttled via `nice` + a single inference thread by default. Resumable |
+| `ccrecall tokens` | Parses JSONL files for token usage analytics — cost, cache hits, model mix, skill/agent/hook patterns. Populates analytics tables and builds `~/.ccrecall/dashboard.html`. Used by `/ccr-tokens` |
+## Data flow
+```
+Session ends
+  └─ ccrecall-sync (Stop hook)
+       └─ ccrecall sync-current (background)
+            └─ writes to ~/.ccrecall/conversations.db
+            └─ embeds the active leaf via jina if model available (drops silently on failure)
+/clear (SessionEnd)
+  └─ ccrecall-clear-handoff
+       └─ writes a handoff file naming the session being cleared
+            (so the next SessionStart links to it instead of guessing)
+Session starts
+  └─ ccrecall-setup (SessionStart)
+  │    └─ ccrecall import (background, first run / new files)
+  │         └─ embeds each new active leaf via jina if model available
+  │    └─ ccrecall backfill summaries (background, if summaries missing)
+  │    └─ (embedding backfill is NOT auto-spawned — opt-in via ccrecall backfill embeddings)
+  ├─ ccrecall-onboarding (SessionStart, startup only — one-time)
+  └─ ccrecall-context (SessionStart, startup + clear)
+       └─ injects last session summary into Claude's context
+```
+## Config file
+`~/.ccrecall/config.json` — written by `ccrecall write-config` during onboarding:
+```json
+{
+  "onboarding_completed": true,
+  "onboarding_version": 1,
+  "auto_inject_context": true
+}
+```
+Onboarding sets `auto_inject_context`. The remaining settings are tunable by editing `config.json` directly:
+| Key | Type | Default | Effect |
+|---|---|---|---|
+| `auto_inject_context` | bool | `true` | Inject a summary of your previous session at session start. |
+| `max_context_sessions` | int | `2` | How many recent sessions to include in that injected context. |
+| `exclude_projects` | list[str] | `[]` | Project names to skip when **storing** conversations — excluded projects are not imported or synced. Matched against the project's directory name. This is write-side only: it prevents new data from being indexed; it does not remove or hide conversations already stored before the project was excluded. |
+| `logging_enabled` | bool | `false` | Write hook diagnostics (including swallowed hook exceptions) to `~/.ccrecall/ccrecall.log`. Useful for troubleshooting a misbehaving hook. |
+## Database
+`~/.ccrecall/conversations.db` — SQLite, WAL mode. Tables:
+- `sessions` — one row per conversation session
+- `branches` — one row per conversation branch (rewinding creates new branches)
+- `messages` — all messages, stored once per session regardless of branch
+- `branch_messages` — join table linking messages to branches
+- `import_log` — tracks which JSONL files have been imported and their hashes
+- `branch_vec` — vec0 virtual table (sqlite-vec) storing 512-dim jina embeddings for each branch, used for KNN search
+- `token_snapshots`, `turns`, `turn_tool_calls`, `session_metrics` — analytics tables populated by `ccrecall tokens`
+## Development
+```bash
+uv sync                       # install package + dev dependencies
+uv run pytest                 # run the test suite
+uvx prek run --all-files      # run the lint/format/type hooks
+```
+## License
+[MIT](LICENSE)

ccrecall-0.10.0/README.md ADDED Viewed

@@ -0,0 +1,210 @@
+# ccrecall
+**Conversation history and semantic search for Claude Code.**
+ccrecall stores your Claude Code sessions in a local SQLite database so you can recall past conversations, search across them by keyword and meaning, and get automatic context on session start. Everything runs on your machine — no data leaves it.
+> ccrecall is an independent, community project for [Claude Code](https://docs.anthropic.com/en/docs/claude-code). It is not affiliated with, endorsed by, or sponsored by Anthropic.
+## What it does
+Every time a Claude Code session ends, the conversation is synced to `~/.ccrecall/conversations.db`. On your next session start, Claude automatically gets a summary of what you were last working on. You can also search past sessions by keyword or pull recent ones at any time.
+## Install
+ccrecall has two parts: a **Python package** (the `ccrecall` CLI plus the hook binaries) and a **Claude Code plugin** (the `/ccr-*` skills and the hook wiring). Install both.
+**1. Install the package** — puts `ccrecall` and the hook commands on your PATH:
+```bash
+uv tool install ccrecall
+```
+(`pipx install ccrecall` or `pip install ccrecall` work too.)
+**2. Enable the plugin** — ccrecall ships as a Claude Code plugin. The repo doubles as a single-plugin marketplace, so from inside Claude Code:
+```
+/plugin marketplace add NodeJSmith/claude-code-recall
+/plugin install ccrecall@claude-code-recall
+```
+That registers the skills and wires the SessionStart / Stop / SessionEnd hooks (`hooks/hooks.json`) — both are auto-discovered from the plugin's directory layout. Reload with `/reload-plugins` if they don't appear immediately.
+> Plugin skills are namespaced under the plugin name, so the skills below are invoked as `/ccrecall:ccr-recall`, `/ccrecall:ccr-resume`, and `/ccrecall:ccr-tokens`. The hook commands degrade gracefully — each is guarded by `command -v … || true`, so if the package isn't installed (or isn't yet on PATH) the hook is a silent no-op rather than a broken session.
+## First-run setup
+On your first session after installing, Claude will notice that `~/.ccrecall/config.json` doesn't exist and walk you through a brief onboarding. It asks a single question — **session context injection**: should Claude automatically recall what you were working on last session?
+Your choice gets written to `~/.ccrecall/config.json`. You can edit that file directly at any time to change settings.
+To skip the walkthrough and use recommended defaults immediately:
+```bash
+ccrecall write-config --defaults
+```
+## Semantic search
+Search results are fused from two signals: keyword full-text search (FTS5 → FTS4 → LIKE fallback) and vector similarity from a locally-running embedding model. The two ranked lists are merged with Reciprocal Rank Fusion (RRF), so results that rank well in both signals appear first.
+The embedding model is [jina-embeddings-v2-small-en](https://huggingface.co/jinaai/jina-embeddings-v2-small-en) (512-dim), running entirely on your machine via [fastembed](https://github.com/qdrant/fastembed). No data leaves your machine.
+### Coverage
+New sessions are embedded automatically as they sync (embed-on-write), so coverage builds forward on its own. Only **active-leaf** branches are embedded — at most one active leaf per session (maintained by sync/import), not its abandoned forks/retries. The flag isn't DB-enforced, but sync/import marks exactly one branch `is_active=1` per session. The search path only ever returns active leaves, so embedding inactive forks would just produce vectors that can never surface.
+### Optional: seed historical conversations
+Embedding runs on CPU via fastembed. jina-v2-small-en is light — a few milliseconds for a short summary, up to ~400ms for a long one — but seeding a large history (~2k active leaves) is still a bounded chunk of work, and a parallel run can thrash a small or shared box. It is therefore **opt-in** — it is *not* auto-spawned on SessionStart — so it never fires unbidden. Run it yourself when you want to seed:
+```bash
+ccrecall backfill embeddings              # all active leaves, all history
+ccrecall backfill embeddings --days 14    # only the last 14 days
+ccrecall backfill embeddings --limit 500  # cap this run at 500 branches
+ccrecall backfill embeddings --threads 4  # use 4 inference threads (idle machine)
+```
+It runs at low scheduling priority (`nice`) and a single inference thread by default so it yields to interactive work. Tune the thread count with `--threads` (e.g. `--threads 4` on an idle workstation to finish faster). Progress prints to stderr (one line per batch); the run is resumable — re-running skips already-embedded branches.
+### Flags
+| Flag | Effect |
+|------|--------|
+| `--keyword-only` | Skip the embedding step entirely, use keyword search only |
+| `--status` | Print diagnostic info (vec extension loaded, model name, embedded vs. total summarized (embeddable) branch count) and exit 0 |
+### Runtime deps
+The semantic search path depends on three packages:
+- `sqlite-vec` — SQLite extension for vector KNN queries
+- `fastembed` — downloads and runs the embedding model (manages onnxruntime + tokenization)
+- `numpy` — vector math (normalization)
+These are included in the package dependencies. If fastembed fails to import (e.g. ABI mismatch on an unusual platform), search falls back silently to keyword-only mode.
+### Degradation
+Semantic fusion is automatically disabled when:
+- The embedding model can't be loaded (e.g. a first-run download failed and no cached copy exists)
+- `fastembed` cannot be imported
+- `sqlite-vec` cannot be loaded on the connection (e.g. Python built without loadable extensions)
+In all cases, search falls back to keyword-only and returns results normally. Use `ccrecall search --status` to check which path is active.
+## Skills
+| Skill | Trigger | What it does |
+|---|---|---|
+| `/ccr-recall` | "what did we discuss", "continue where we left off", "search my conversations" | Lets Claude search or browse your past sessions on demand |
+| `/ccr-resume` | "pick up where we left off after /clear", a stop, or an unanswered question | Reconstructs the prior session's intent from its transcript tail and surfaces any unresolved decision |
+| `/ccr-tokens` | "analyze Claude token usage", "how much am I spending on Claude" | Full cost + workflow analytics report with an interactive HTML dashboard |
+## Entry points
+### Hooks (run automatically — don't call these manually)
+These are wired by the plugin's `hooks/hooks.json` and fire on their respective Claude Code events.
+| Entry point | Event | What it does |
+|---|---|---|
+| `ccrecall-setup` | SessionStart | Creates `~/.ccrecall/` if needed, opens the DB to apply any pending migrations, then spawns `ccrecall import` and `ccrecall backfill summaries` as background processes |
+| `ccrecall-onboarding` | SessionStart (startup only) | One-time first-run onboarding. Injects setup instructions into Claude's context if `config.json` is missing or onboarding hasn't been completed. Silent no-op after that |
+| `ccrecall-context` | SessionStart (startup + clear) | Injects a summary of your most recent session into Claude's context so it knows what you were working on. On `/clear`, reads a handoff file to link directly to the session you just cleared from |
+| `ccrecall-clear-handoff` | SessionEnd (clear only) | Writes a small handoff file so the next session start knows which session to link to after a `/clear`. Without this, context injection falls back to a "most recent session" heuristic |
+| `ccrecall-sync` | Stop | Syncs the current session to the DB in a detached background process. Runs on every session end |
+> These are kept as separate console scripts (rather than `ccrecall hook …` subcommands) on purpose: hooks fire on every session boundary, and a direct entry point avoids eagerly importing the full CLI command surface on the hot path.
+### Internal helpers (spawned by hooks — don't call these manually)
+| Entry point | What it does |
+|---|---|
+| `ccrecall sync-current` | Syncs a single session file to the DB. Called by `ccrecall-sync` with the session ID from stdin |
+| `ccrecall import` | Full import of all JSONL files in `~/.claude/projects/`. Skips files that haven't changed since last import (file hash check). Run on first install and whenever new sessions need backfilling |
+| `ccrecall backfill summaries` | Generates context summaries for any DB branches that don't have one yet. Runs in the background after `ccrecall-setup` |
+| `ccrecall write-config` | Writes `~/.ccrecall/config.json`. Called by Claude during onboarding to persist your settings choices. You can also call it directly — run `ccrecall write-config --help` for flags |
+### Skill CLIs (called from skill files — can also be used directly)
+These are the `ccrecall` subcommands the `/ccr-*` skills invoke. You can run them from the terminal too.
+| Entry point | What it does |
+|---|---|
+| `ccrecall recent` | Prints recent sessions from the DB in markdown (default) or JSON. Used by `/ccr-recall` |
+| `ccrecall search` | Searches sessions by keyword fused with vector similarity (FTS5 → FTS4 → LIKE fallback, RRF-fused with jina embeddings when available). Used by `/ccr-recall` |
+| `ccrecall tail` | Reads the tail of a prior session's transcript to recover the last instruction and any unanswered question. Used by `/ccr-resume` |
+| `ccrecall backfill embeddings` | Opt-in seeding of embeddings for historical active-leaf branches (jina-v2-small-en via fastembed). Not auto-spawned. Supports `--days N` / `--limit N` / `--threads N`; throttled via `nice` + a single inference thread by default. Resumable |
+| `ccrecall tokens` | Parses JSONL files for token usage analytics — cost, cache hits, model mix, skill/agent/hook patterns. Populates analytics tables and builds `~/.ccrecall/dashboard.html`. Used by `/ccr-tokens` |
+## Data flow
+```
+Session ends
+  └─ ccrecall-sync (Stop hook)
+       └─ ccrecall sync-current (background)
+            └─ writes to ~/.ccrecall/conversations.db
+            └─ embeds the active leaf via jina if model available (drops silently on failure)
+/clear (SessionEnd)
+  └─ ccrecall-clear-handoff
+       └─ writes a handoff file naming the session being cleared
+            (so the next SessionStart links to it instead of guessing)
+Session starts
+  └─ ccrecall-setup (SessionStart)
+  │    └─ ccrecall import (background, first run / new files)
+  │         └─ embeds each new active leaf via jina if model available
+  │    └─ ccrecall backfill summaries (background, if summaries missing)
+  │    └─ (embedding backfill is NOT auto-spawned — opt-in via ccrecall backfill embeddings)
+  ├─ ccrecall-onboarding (SessionStart, startup only — one-time)
+  └─ ccrecall-context (SessionStart, startup + clear)
+       └─ injects last session summary into Claude's context
+```
+## Config file
+`~/.ccrecall/config.json` — written by `ccrecall write-config` during onboarding:
+```json
+{
+  "onboarding_completed": true,
+  "onboarding_version": 1,
+  "auto_inject_context": true
+}
+```
+Onboarding sets `auto_inject_context`. The remaining settings are tunable by editing `config.json` directly:
+| Key | Type | Default | Effect |
+|---|---|---|---|
+| `auto_inject_context` | bool | `true` | Inject a summary of your previous session at session start. |
+| `max_context_sessions` | int | `2` | How many recent sessions to include in that injected context. |
+| `exclude_projects` | list[str] | `[]` | Project names to skip when **storing** conversations — excluded projects are not imported or synced. Matched against the project's directory name. This is write-side only: it prevents new data from being indexed; it does not remove or hide conversations already stored before the project was excluded. |
+| `logging_enabled` | bool | `false` | Write hook diagnostics (including swallowed hook exceptions) to `~/.ccrecall/ccrecall.log`. Useful for troubleshooting a misbehaving hook. |
+## Database
+`~/.ccrecall/conversations.db` — SQLite, WAL mode. Tables:
+- `sessions` — one row per conversation session
+- `branches` — one row per conversation branch (rewinding creates new branches)
+- `messages` — all messages, stored once per session regardless of branch
+- `branch_messages` — join table linking messages to branches
+- `import_log` — tracks which JSONL files have been imported and their hashes
+- `branch_vec` — vec0 virtual table (sqlite-vec) storing 512-dim jina embeddings for each branch, used for KNN search
+- `token_snapshots`, `turns`, `turn_tool_calls`, `session_metrics` — analytics tables populated by `ccrecall tokens`
+## Development
+```bash
+uv sync                       # install package + dev dependencies
+uv run pytest                 # run the test suite
+uvx prek run --all-files      # run the lint/format/type hooks
+```
+## License
+[MIT](LICENSE)

ccrecall-0.10.0/pyproject.toml ADDED Viewed

@@ -0,0 +1,113 @@
+[build-system]
+requires = ["setuptools>=80", "wheel"]
+build-backend = "setuptools.build_meta"
+[project]
+name = "ccrecall"
+version = "0.10.0"
+description = "Conversation history and semantic search for Claude Code"
+readme = "README.md"
+requires-python = ">=3.10"
+license = "MIT"
+license-files = ["LICENSE"]
+authors = [{ name = "Jessica Smith", email = "12jessicasmith34@gmail.com" }]
+keywords = [
+    "claude-code",
+    "conversation-history",
+    "search",
+    "recall",
+    "transcripts",
+    "semantic-search",
+]
+classifiers = [
+    "Development Status :: 4 - Beta",
+    "Environment :: Console",
+    "Intended Audience :: Developers",
+    "Operating System :: OS Independent",
+    "Programming Language :: Python :: 3",
+    "Programming Language :: Python :: 3.10",
+    "Programming Language :: Python :: 3.11",
+    "Programming Language :: Python :: 3.12",
+    "Programming Language :: Python :: 3.13",
+    "Programming Language :: Python :: 3.14",
+    "Topic :: Utilities",
+    "Topic :: Software Development :: Libraries :: Python Modules",
+]
+# Pinned to the versions in uv.lock: `uv tool install` does not consult
+# uv.lock and resolves fresh, so an unbounded range would pull newer
+# ABI/runtime-breaking releases of these native wheels.
+# fastembed is the embedding engine — it owns the ONNX runtime + tokenizers and
+# the model download, so onnxruntime is left to fastembed's own constraint (an
+# explicit pin here fights its resolver) and reproducibility comes from uv.lock.
+# numpy is a direct dependency and uses Python-version markers. To re-sync after
+# a bump: `uv lock` then mirror the resolved versions here.
+dependencies = [
+    "sqlite-vec==0.1.9",
+    "fastembed==0.8.0",
+    "numpy==2.2.6; python_version < '3.11'",
+    "numpy==2.4.6; python_version >= '3.11'",
+    "whenever==0.10.0",
+    # Pin pydantic exactly so its native (Rust) pydantic-core dep resolves to a
+    # known ABI — same rationale as the native wheels above.
+    "pydantic==2.13.4",
+    "cyclopts>=4.16",
+]
+[project.urls]
+Homepage = "https://github.com/NodeJSmith/claude-code-recall"
+Issues = "https://github.com/NodeJSmith/claude-code-recall/issues"
+Changelog = "https://github.com/NodeJSmith/claude-code-recall/blob/main/CHANGELOG.md"
+[project.scripts]
+# Unified CLI — single entry point. Subcommands replace the former skill-facing
+# and helper cm-* tools.
+ccrecall                 = "ccrecall.cli:main"
+# Hook entry points (wired by the plugin's hooks/hooks.json). Kept as separate
+# console scripts rather than `ccrecall hook ...` subcommands on purpose: hooks
+# fire on every SessionStart/Stop, and routing through the full cyclopts app
+# eager-imports the whole command surface (fastembed/numpy/onnxruntime, ~1800ms)
+# vs ~440ms for a direct hook import. The no-lazy-imports rule forbids deferring
+# those imports, so a direct entry point per hook stays the fast path.
+ccrecall-setup           = "ccrecall.hooks.memory_setup:main"
+ccrecall-sync            = "ccrecall.hooks.memory_sync:main"
+ccrecall-context         = "ccrecall.hooks.memory_context:main"
+ccrecall-onboarding      = "ccrecall.hooks.onboarding:main"
+ccrecall-clear-handoff   = "ccrecall.hooks.clear_handoff:main"
+[tool.setuptools.packages.find]
+where = ["src"]
+[dependency-groups]
+dev = [
+    "pytest>=8.0",
+    "hypothesis>=6.0",
+    "pytest-cov>=7.0.0",
+    "coverage[toml]>=7.10.7",
+]
+[tool.pytest.ini_options]
+testpaths = ["tests"]
+[tool.coverage.run]
+branch = true          # measure branch coverage, not just lines
+source = ["ccrecall"]
+parallel = true        # suffix data files so per-Python-version CI shards combine cleanly
+relative_files = true  # stable paths across CI runners
+omit = ["*/__init__.py", "*/__main__.py"]
+[tool.coverage.report]
+show_missing = true
+skip_covered = true
+# fail_under = 80  # enable once a baseline is established; CI can override
+exclude_lines = [
+    "pragma: no cover",
+    "if TYPE_CHECKING:",
+    "if __name__ == .__main__.:",
+    "raise NotImplementedError",
+]
+[tool.coverage.html]
+directory = "htmlcov"
+[tool.coverage.xml]
+output = "coverage.xml"

ccrecall-0.10.0/setup.cfg ADDED Viewed

@@ -0,0 +1,4 @@
+[egg_info]
+tag_build =
+tag_date = 0

ccrecall-0.10.0/src/ccrecall/__init__.py ADDED Viewed

@@ -0,0 +1,18 @@
+"""
+ccrecall — conversation memory package for Claude Code.
+Submodules:
+  db                — Database connection, config/settings, vec operations, logging
+  schema            — Conversation DB schema constants (SCHEMA_*) and FTS detection
+  content           — Message content extraction and tool detection
+  parsing           — JSONL parsing, branch detection, metadata extraction
+  formatting        — Session formatting, time/path utilities
+  project_ops       — Shared project upsert logic (cwd strategy + JSONL-probe strategy)
+  session_ops       — Shared session import logic (used by sync and import pipelines)
+  token_schema      — Token ingest schema definitions, ensure_schema(), version management
+  token_parser      — Token JSONL parsing, data classes, session parsing, file discovery
+  token_analytics   — Session import and token_snapshots backfill
+  token_output      — Dashboard JSON output assembly (chart queries)
+  token_insights    — Trend analysis, insight generation, findings/recommendations
+  token_dashboard   — Token dashboard deployment and main() entry point
+"""