agentpack-cli 0.3.20__tar.gz → 0.3.21__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/PKG-INFO +90 -66
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/README.md +89 -65
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/pyproject.toml +1 -1
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/__init__.py +1 -1
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/analysis/ranking.py +410 -19
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/analysis/symbols.py +4 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/application/pack_service.py +52 -30
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/benchmark.py +1010 -24
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/diagnose_selection.py +1 -1
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/explain.py +11 -6
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/guard.py +4 -3
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/init.py +14 -16
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/migrate.py +4 -3
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/pack.py +6 -5
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/quickstart.py +5 -3
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/stats.py +2 -2
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/tune.py +1 -1
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/config.py +8 -4
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/context_pack.py +419 -38
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/models.py +4 -2
- agentpack_cli-0.3.21/src/agentpack/core/modes.py +23 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/mcp_server.py +2 -2
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/renderers/markdown.py +2 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/summaries/base.py +6 -2
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/.gitignore +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/LICENSE +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/adapters/__init__.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/adapters/antigravity.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/adapters/base.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/adapters/claude.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/adapters/codex.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/adapters/cursor.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/adapters/detect.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/adapters/generic.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/adapters/windsurf.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/analysis/__init__.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/analysis/dependency_graph.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/analysis/go_imports.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/analysis/java_imports.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/analysis/js_ts_imports.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/analysis/monorepo.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/analysis/naming_signals.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/analysis/python_ast.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/analysis/python_imports.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/analysis/repo_map.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/analysis/role_inference.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/analysis/rust_imports.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/analysis/task_classifier.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/analysis/tests.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/application/__init__.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/cli.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/__init__.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/_shared.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/ci_cmd.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/claude_cmd.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/compress_output.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/dashboard.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/dev_check.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/diff.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/doctor.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/eval_cmd.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/hook_cmd.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/ignore_cmd.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/install.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/learn.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/mcp_cmd.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/memory.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/monitor.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/next_cmd.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/perf.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/release_check.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/release_cmd.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/repair.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/retrieve.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/route.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/scan.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/skills.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/start_cmd.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/state_cmd.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/status.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/summarize.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/task_cmd.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/threads.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/verify_wheel.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/watch.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/workflow_cmd.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/commands/wrap.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/__init__.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/bootstrap.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/cache.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/changed_paths.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/diff.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/evals.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/execution_state.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/git.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/git_hooks.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/global_install.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/ignore.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/loop_protocol.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/merkle.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/pack_registry.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/redactor.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/scanner.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/snapshot.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/task_freshness.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/thread_context.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/token_estimator.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/core/vscode_tasks.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/dashboard/__init__.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/dashboard/collectors.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/dashboard/models.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/dashboard/renderers.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/data/agentpack.md +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/installers/__init__.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/installers/antigravity.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/installers/claude.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/installers/codex.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/installers/cursor.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/installers/windsurf.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/integrations/__init__.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/integrations/agents.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/integrations/git_hooks.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/integrations/global_install.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/integrations/platform.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/integrations/vscode_tasks.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/learning/__init__.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/learning/collector.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/learning/extractor.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/learning/feedback.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/learning/lesson_ranker.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/learning/models.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/learning/provider.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/learning/quality.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/learning/renderers.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/learning/skill_map.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/output_compression/__init__.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/output_compression/core.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/renderers/__init__.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/renderers/compact.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/renderers/receipts.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/router/__init__.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/router/discovery.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/router/models.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/router/parser.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/router/prompt_builder.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/router/scoring.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/router/service.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/router/skills_index.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/session/__init__.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/session/events.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/session/state.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/summaries/__init__.py +0 -0
- {agentpack_cli-0.3.20 → agentpack_cli-0.3.21}/src/agentpack/summaries/offline.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: agentpack-cli
|
|
3
|
-
Version: 0.3.20
|
|
3
|
+
Version: 0.3.21
|
|
4
4
|
Summary: Local MCP context router for Claude Code, Codex, Cursor, and AI coding agents.
|
|
5
5
|
License: MIT
|
|
6
6
|
License-File: LICENSE
|
|
@@ -49,14 +49,17 @@ Description-Content-Type: text/markdown
|
|
|
49
49
|
[License: MIT](https://opensource.org/licenses/MIT)
|
|
50
50
|
[CI](https://github.com/vishal2612200/agentpack/actions/workflows/ci.yml)
|
|
51
51
|
|
|
52
|
-
**Local
|
|
52
|
+
**Local context router for AI coding agents.**
|
|
53
53
|
|
|
54
|
-
Claude Code, Codex, Cursor, and other coding agents
|
|
54
|
+
AgentPack gives Claude Code, Codex, Cursor, and other coding agents a ranked starting map before they burn tool calls rediscovering your repo.
|
|
55
55
|
|
|
56
|
-
|
|
56
|
+
One workflow matters:
|
|
57
57
|
|
|
58
|
-
|
|
59
|
-
|
|
58
|
+
```text
|
|
59
|
+
route -> pack -> agent acts -> benchmark captures miss
|
|
60
|
+
```
|
|
61
|
+
|
|
62
|
+
First route the task to likely files, tests, rules, and skills:
|
|
60
63
|
|
|
61
64
|
```bash
|
|
62
65
|
pipx run --spec agentpack-cli agentpack route --task "fix auth token expiry"
|
|
@@ -64,68 +67,72 @@ pipx run --spec agentpack-cli agentpack route --task "fix auth token expiry"
|
|
|
64
67
|
|
|
65
68
|

|
|
66
69
|
|
|
67
|
-
> **Status: alpha (v0.3.
|
|
70
|
+
> **Status: alpha (v0.3.21).** Works, tested, and used in real sessions. Python and JavaScript/TypeScript are the best-supported languages. Current benchmarks are useful regression checks, not broad proof that AgentPack improves coding-agent success. API may change before 1.0.
|
|
68
71
|
>
|
|
69
72
|
> **Platform note:** macOS, Linux, and Windows are supported. Windows support targets PowerShell plus Git for Windows. `cmd.exe` and bare Git setups are not a supported path yet.
|
|
70
73
|
>
|
|
71
74
|
> **Name note:** PyPI package is `agentpack-cli`, npm package is `@vishal2612200/agentpack`, and the command is `agentpack`. This project is unrelated to AgentPack dataset papers or other repos with the same name.
|
|
72
75
|
|
|
73
|
-
## What's New in 0.3.20
|
|
76
|
+
## What's New in 0.3.21
|
|
74
77
|
|
|
75
|
-
`0.3.
|
|
76
|
-
|
|
77
|
-
|
|
78
|
-
|
|
78
|
+
`0.3.21` is a benchmark trust release. It keeps the current honest expanded
|
|
79
|
+
public-suite baseline at **57.0% recall / 50.6% token precision**, removes the
|
|
80
|
+
legacy minimal-mode surface in favor of `balanced`, improves benchmark
|
|
81
|
+
diagnostics and public-suite methodology, and documents the next release target:
|
|
82
|
+
**65%+ recall while holding 50%+ token precision**.
|
|
79
83
|
|
|
80
|
-
##
|
|
84
|
+
## Core Workflow
|
|
81
85
|
|
|
82
|
-
|
|
86
|
+
### 1. Route
|
|
83
87
|
|
|
84
|
-
|
|
85
|
-
Task: fix auth token expiry
|
|
88
|
+
Use the read-only router when you want quick orientation without writing files:
|
|
86
89
|
|
|
87
|
-
|
|
88
|
-
|
|
89
|
-
- opens nearby middleware and config
|
|
90
|
-
- may miss related tests
|
|
91
|
-
- spends early turns building a repo map
|
|
90
|
+
```bash
|
|
91
|
+
agentpack route --task "fix auth token expiry"
|
|
92
92
|
```
|
|
93
93
|
|
|
94
|
-
|
|
94
|
+
### 2. Pack
|
|
95
95
|
|
|
96
96
|
```bash
|
|
97
|
-
agentpack
|
|
97
|
+
agentpack task set "fix auth token expiry"
|
|
98
|
+
agentpack pack --task auto
|
|
98
99
|
```
|
|
99
100
|
|
|
100
|
-
|
|
101
|
-
|
|
102
|
-
fix auth token expiry
|
|
101
|
+
AgentPack writes `.agentpack/context.md` with selected files, omitted-file
|
|
102
|
+
receipts, task freshness, token stats, and suggested checks.
|
|
103
103
|
|
|
104
|
-
|
|
105
|
-
- tests/test_auth.py
|
|
106
|
-
- src/app/auth.py
|
|
107
|
-
- src/app/users.py
|
|
104
|
+
### 3. Agent Acts
|
|
108
105
|
|
|
109
|
-
|
|
110
|
-
|
|
106
|
+
Point the agent at the pack or use MCP tools. The agent still verifies code before
|
|
107
|
+
editing; AgentPack is a map, not a correctness proof.
|
|
108
|
+
|
|
109
|
+
### 4. Benchmark Captures Miss
|
|
110
|
+
|
|
111
|
+
After a task, capture the files that actually changed:
|
|
112
|
+
|
|
113
|
+
```bash
|
|
114
|
+
agentpack benchmark capture --since main --task "fix auth token expiry"
|
|
115
|
+
agentpack benchmark --misses
|
|
111
116
|
```
|
|
112
117
|
|
|
118
|
+
Miss diagnostics show whether a required file was ignored, scored too low,
|
|
119
|
+
ranked but cut by budget, or absent from scan.
|
|
120
|
+
|
|
113
121
|
## Features
|
|
114
122
|
|
|
115
|
-
- **
|
|
116
|
-
- **
|
|
117
|
-
- **
|
|
118
|
-
- **
|
|
119
|
-
- **
|
|
120
|
-
- **Task router**: MCP and CLI surfaces route a task to relevant files, scoped rules, installed skills, suggested commands, and safety warnings without executing skills automatically.
|
|
121
|
-
- **Reversible registry and learning layer**: retrieves packed context by block ID, writes developer lessons, and feeds bounded selected-file miss feedback into future ranking.
|
|
122
|
-
- **Runtime scorecard and output compression**: `perf --history` tracks activity, while `compress-output` preserves failures, paths, diffs, and search hits from noisy logs.
|
|
123
|
-
- **Agent integrations**: installs Claude Code, Cursor, Windsurf, Codex, Antigravity, VS Code tasks, git hooks, and MCP configuration.
|
|
124
|
-
- **Local and measurable**: no API calls for scan, summarize, rank, pack, stats, or benchmark; quality is measured with expected-file evals.
|
|
123
|
+
- **Route**: read-only task map with relevant files, tests, rules, skills, commands, and warnings.
|
|
124
|
+
- **Pack**: budgeted context with `full`, `diff`, `symbols`, `skeleton`, or `summary` file views.
|
|
125
|
+
- **Act**: CLI, markdown, MCP, and agent integrations for Claude Code, Codex, Cursor, Windsurf, Antigravity, and generic agents.
|
|
126
|
+
- **Benchmark**: expected-file recall, token precision, miss diagnostics, public commit suites, and E2E A/B reports.
|
|
127
|
+
- **Local**: no cloud indexing, embeddings, or API calls for scan, summarize, rank, pack, stats, or benchmark.
|
|
125
128
|
|
|
126
129
|
## Benchmark Proof
|
|
127
130
|
|
|
128
|
-
Latest
|
|
131
|
+
Latest published v0.3.20 release table: 8 pinned public commits from Pallets
|
|
132
|
+
Click, ItsDangerous, and MarkupSafe, scored against files actually changed by
|
|
133
|
+
each commit. The public manifest now also supports 100+ sampled historical
|
|
134
|
+
commits across Python, TypeScript, Go, Java, and monorepo repos for broader
|
|
135
|
+
release runs.
|
|
129
136
|
|
|
130
137
|
| Metric | Result |
|
|
131
138
|
|---|---:|
|
|
@@ -134,19 +141,48 @@ Latest public release gate: 8 real commits from Pallets Click, ItsDangerous, and
|
|
|
134
141
|
| Pack p50 | 1,450 tokens |
|
|
135
142
|
| Pack p95 | 3,805 tokens |
|
|
136
143
|
|
|
137
|
-
Full table: [`benchmarks/results/2026-
|
|
144
|
+
Full v0.3.20 table: [`benchmarks/results/2026-06-11-public.md`](benchmarks/results/2026-06-11-public.md). This is scoped benchmark evidence, not a universal quality claim.
|
|
145
|
+
The expanded 109-case public suite is the current optimization baseline:
|
|
146
|
+
**57.0% recall / 50.6% token precision**. It is broader and harder than the
|
|
147
|
+
8-case published table, and recall remains the active improvement target.
|
|
148
|
+
Reproduce the expanded public suite:
|
|
149
|
+
|
|
150
|
+
```bash
|
|
151
|
+
agentpack benchmark --public-suite --reproduce v0.3.20
|
|
152
|
+
```
|
|
153
|
+
|
|
154
|
+
Benchmark methodology lives under [`benchmarks/results/v0.3.20/`](benchmarks/results/v0.3.20/methodology.md).
|
|
155
|
+
|
|
156
|
+
### Next Release Benchmark Target
|
|
157
|
+
|
|
158
|
+
The next benchmark release target is to raise the expanded public suite from the
|
|
159
|
+
current **57.0% recall / 50.6% token precision** baseline to **65%+ recall**
|
|
160
|
+
while keeping token precision at **50%+**. The target should be measured on the
|
|
161
|
+
same 100+ public historical-commit suite, with per-language slices published so
|
|
162
|
+
precision gains are not hiding TypeScript, Go, Java, or monorepo regressions.
|
|
163
|
+
|
|
164
|
+
Decision gate for the next public table:
|
|
165
|
+
|
|
166
|
+
- full-suite recall is at least 65.0%
|
|
167
|
+
- full-suite token precision is at least 50.0%
|
|
168
|
+
- no major language or task slice loses more than 2 recall points
|
|
169
|
+
- Vite/TypeScript, Gin/Go, and NestJS monorepo misses are reported separately
|
|
170
|
+
- any AgentPack-vs-no-AgentPack A/B claim includes task success, tool calls,
|
|
171
|
+
token cost, and time-to-first-correct-file
|
|
172
|
+
|
|
173
|
+
## Trust
|
|
174
|
+
|
|
175
|
+
AgentPack is MIT licensed, local-first, and uses PyPI Trusted Publishing plus
|
|
176
|
+
npm provenance for release artifacts. See [`SECURITY.md`](SECURITY.md),
|
|
177
|
+
[`docs/privacy.md`](docs/privacy.md), [`docs/threat-model.md`](docs/threat-model.md),
|
|
178
|
+
and [`docs/data-flow.md`](docs/data-flow.md).
|
|
138
179
|
|
|
139
180
|
## Use Cases
|
|
140
181
|
|
|
141
|
-
|
|
142
|
-
- [MCP
|
|
143
|
-
|
|
144
|
-
|
|
145
|
-
- [Reduce Claude Code token usage](docs/reduce-claude-code-token-usage.md)
|
|
146
|
-
- [How AgentPack works](docs/how-agentpack-works.md)
|
|
147
|
-
- [AgentPack vs Repomix](docs/agentpack-vs-repomix.md)
|
|
148
|
-
- [AgentPack vs Augment Context Engine](docs/agentpack-vs-augment-context-engine.md)
|
|
149
|
-
- [Docs index](docs/index.md)
|
|
182
|
+
Start with the [docs index](docs/index.md), or jump to guides for
|
|
183
|
+
[Claude Code](docs/claude-code-context-engine.md), [MCP](docs/mcp-context-engine.md),
|
|
184
|
+
[Cursor](docs/cursor-context-packing.md), [token usage](docs/reduce-claude-code-token-usage.md),
|
|
185
|
+
and [how AgentPack works](docs/how-agentpack-works.md).
|
|
150
186
|
|
|
151
187
|
## Install
|
|
152
188
|
|
|
@@ -274,7 +310,7 @@ budget = 8000
|
|
|
274
310
|
output = ".agentpack/context.md"
|
|
275
311
|
```
|
|
276
312
|
|
|
277
|
-
Use `agentpack pack --mode lite` when you want a cheap ranked map before deeper file reads. Use
|
|
313
|
+
Use `agentpack pack --mode lite` when you want a cheap ranked map before deeper file reads. Use the default `balanced` mode for normal agent work and benchmark claims. Use `deep` when the task needs broader docs and source context.
|
|
278
314
|
|
|
279
315
|
Use `.agentignore` to remove generated output, vendored code, large exports, or files that repeatedly appear as ranking noise. AgentPack imports obvious generated/noisy entries from gitignore sources during init, but repository-specific outputs should still be added by hand.
|
|
280
316
|
|
|
@@ -391,18 +427,6 @@ THREAD=codex-local make context-thread
|
|
|
391
427
|
AGENTPACK_THREAD_ID=codex-local make context-thread
|
|
392
428
|
```
|
|
393
429
|
|
|
394
|
-
## Benchmark Proof
|
|
395
|
-
|
|
396
|
-
AgentPack is best treated as a ranked starting map. It can reduce repeated orientation work, but the agent and reviewer still own correctness.
|
|
397
|
-
|
|
398
|
-
Use real repo evals instead of trusting compression numbers:
|
|
399
|
-
|
|
400
|
-
```bash
|
|
401
|
-
agentpack benchmark --release-gate
|
|
402
|
-
```
|
|
403
|
-
|
|
404
|
-
Current benchmark evidence is documented in [`benchmarks/README.md`](benchmarks/README.md) and the generated tables under `benchmarks/results/`. Treat these as scoped evidence for the included cases, not a universal performance claim.
|
|
405
|
-
|
|
406
430
|
## What A Pack Contains
|
|
407
431
|
|
|
408
432
|
Rendered packs are meant to be readable by humans and directly useful to agents. A typical pack includes:
|
|
@@ -8,14 +8,17 @@
|
|
|
8
8
|
[License: MIT](https://opensource.org/licenses/MIT)
|
|
9
9
|
[CI](https://github.com/vishal2612200/agentpack/actions/workflows/ci.yml)
|
|
10
10
|
|
|
11
|
-
**Local
|
|
11
|
+
**Local context router for AI coding agents.**
|
|
12
12
|
|
|
13
|
-
Claude Code, Codex, Cursor, and other coding agents
|
|
13
|
+
AgentPack gives Claude Code, Codex, Cursor, and other coding agents a ranked starting map before they burn tool calls rediscovering your repo.
|
|
14
14
|
|
|
15
|
-
|
|
15
|
+
One workflow matters:
|
|
16
16
|
|
|
17
|
-
|
|
18
|
-
|
|
17
|
+
```text
|
|
18
|
+
route -> pack -> agent acts -> benchmark captures miss
|
|
19
|
+
```
|
|
20
|
+
|
|
21
|
+
First route the task to likely files, tests, rules, and skills:
|
|
19
22
|
|
|
20
23
|
```bash
|
|
21
24
|
pipx run --spec agentpack-cli agentpack route --task "fix auth token expiry"
|
|
@@ -23,68 +26,72 @@ pipx run --spec agentpack-cli agentpack route --task "fix auth token expiry"
|
|
|
23
26
|
|
|
24
27
|

|
|
25
28
|
|
|
26
|
-
> **Status: alpha (v0.3.
|
|
29
|
+
> **Status: alpha (v0.3.21).** Works, tested, and used in real sessions. Python and JavaScript/TypeScript are the best-supported languages. Current benchmarks are useful regression checks, not broad proof that AgentPack improves coding-agent success. API may change before 1.0.
|
|
27
30
|
>
|
|
28
31
|
> **Platform note:** macOS, Linux, and Windows are supported. Windows support targets PowerShell plus Git for Windows. `cmd.exe` and bare Git setups are not a supported path yet.
|
|
29
32
|
>
|
|
30
33
|
> **Name note:** PyPI package is `agentpack-cli`, npm package is `@vishal2612200/agentpack`, and the command is `agentpack`. This project is unrelated to AgentPack dataset papers or other repos with the same name.
|
|
31
34
|
|
|
32
|
-
## What's New in 0.3.20
|
|
35
|
+
## What's New in 0.3.21
|
|
33
36
|
|
|
34
|
-
`0.3.
|
|
35
|
-
|
|
36
|
-
|
|
37
|
-
|
|
37
|
+
`0.3.21` is a benchmark trust release. It keeps the current honest expanded
|
|
38
|
+
public-suite baseline at **57.0% recall / 50.6% token precision**, removes the
|
|
39
|
+
legacy minimal-mode surface in favor of `balanced`, improves benchmark
|
|
40
|
+
diagnostics and public-suite methodology, and documents the next release target:
|
|
41
|
+
**65%+ recall while holding 50%+ token precision**.
|
|
38
42
|
|
|
39
|
-
##
|
|
43
|
+
## Core Workflow
|
|
40
44
|
|
|
41
|
-
|
|
45
|
+
### 1. Route
|
|
42
46
|
|
|
43
|
-
|
|
44
|
-
Task: fix auth token expiry
|
|
47
|
+
Use the read-only router when you want quick orientation without writing files:
|
|
45
48
|
|
|
46
|
-
|
|
47
|
-
|
|
48
|
-
- opens nearby middleware and config
|
|
49
|
-
- may miss related tests
|
|
50
|
-
- spends early turns building a repo map
|
|
49
|
+
```bash
|
|
50
|
+
agentpack route --task "fix auth token expiry"
|
|
51
51
|
```
|
|
52
52
|
|
|
53
|
-
|
|
53
|
+
### 2. Pack
|
|
54
54
|
|
|
55
55
|
```bash
|
|
56
|
-
agentpack
|
|
56
|
+
agentpack task set "fix auth token expiry"
|
|
57
|
+
agentpack pack --task auto
|
|
57
58
|
```
|
|
58
59
|
|
|
59
|
-
|
|
60
|
-
|
|
61
|
-
fix auth token expiry
|
|
60
|
+
AgentPack writes `.agentpack/context.md` with selected files, omitted-file
|
|
61
|
+
receipts, task freshness, token stats, and suggested checks.
|
|
62
62
|
|
|
63
|
-
|
|
64
|
-
- tests/test_auth.py
|
|
65
|
-
- src/app/auth.py
|
|
66
|
-
- src/app/users.py
|
|
63
|
+
### 3. Agent Acts
|
|
67
64
|
|
|
68
|
-
|
|
69
|
-
|
|
65
|
+
Point the agent at the pack or use MCP tools. The agent still verifies code before
|
|
66
|
+
editing; AgentPack is a map, not a correctness proof.
|
|
67
|
+
|
|
68
|
+
### 4. Benchmark Captures Miss
|
|
69
|
+
|
|
70
|
+
After a task, capture the files that actually changed:
|
|
71
|
+
|
|
72
|
+
```bash
|
|
73
|
+
agentpack benchmark capture --since main --task "fix auth token expiry"
|
|
74
|
+
agentpack benchmark --misses
|
|
70
75
|
```
|
|
71
76
|
|
|
77
|
+
Miss diagnostics show whether a required file was ignored, scored too low,
|
|
78
|
+
ranked but cut by budget, or absent from scan.
|
|
79
|
+
|
|
72
80
|
## Features
|
|
73
81
|
|
|
74
|
-
- **
|
|
75
|
-
- **
|
|
76
|
-
- **
|
|
77
|
-
- **
|
|
78
|
-
- **
|
|
79
|
-
- **Task router**: MCP and CLI surfaces route a task to relevant files, scoped rules, installed skills, suggested commands, and safety warnings without executing skills automatically.
|
|
80
|
-
- **Reversible registry and learning layer**: retrieves packed context by block ID, writes developer lessons, and feeds bounded selected-file miss feedback into future ranking.
|
|
81
|
-
- **Runtime scorecard and output compression**: `perf --history` tracks activity, while `compress-output` preserves failures, paths, diffs, and search hits from noisy logs.
|
|
82
|
-
- **Agent integrations**: installs Claude Code, Cursor, Windsurf, Codex, Antigravity, VS Code tasks, git hooks, and MCP configuration.
|
|
83
|
-
- **Local and measurable**: no API calls for scan, summarize, rank, pack, stats, or benchmark; quality is measured with expected-file evals.
|
|
82
|
+
- **Route**: read-only task map with relevant files, tests, rules, skills, commands, and warnings.
|
|
83
|
+
- **Pack**: budgeted context with `full`, `diff`, `symbols`, `skeleton`, or `summary` file views.
|
|
84
|
+
- **Act**: CLI, markdown, MCP, and agent integrations for Claude Code, Codex, Cursor, Windsurf, Antigravity, and generic agents.
|
|
85
|
+
- **Benchmark**: expected-file recall, token precision, miss diagnostics, public commit suites, and E2E A/B reports.
|
|
86
|
+
- **Local**: no cloud indexing, embeddings, or API calls for scan, summarize, rank, pack, stats, or benchmark.
|
|
84
87
|
|
|
85
88
|
## Benchmark Proof
|
|
86
89
|
|
|
87
|
-
Latest
|
|
90
|
+
Latest published v0.3.20 release table: 8 pinned public commits from Pallets
|
|
91
|
+
Click, ItsDangerous, and MarkupSafe, scored against files actually changed by
|
|
92
|
+
each commit. The public manifest now also supports 100+ sampled historical
|
|
93
|
+
commits across Python, TypeScript, Go, Java, and monorepo repos for broader
|
|
94
|
+
release runs.
|
|
88
95
|
|
|
89
96
|
| Metric | Result |
|
|
90
97
|
|---|---:|
|
|
@@ -93,19 +100,48 @@ Latest public release gate: 8 real commits from Pallets Click, ItsDangerous, and
|
|
|
93
100
|
| Pack p50 | 1,450 tokens |
|
|
94
101
|
| Pack p95 | 3,805 tokens |
|
|
95
102
|
|
|
96
|
-
Full table: [`benchmarks/results/2026-
|
|
103
|
+
Full v0.3.20 table: [`benchmarks/results/2026-06-11-public.md`](benchmarks/results/2026-06-11-public.md). This is scoped benchmark evidence, not a universal quality claim.
|
|
104
|
+
The expanded 109-case public suite is the current optimization baseline:
|
|
105
|
+
**57.0% recall / 50.6% token precision**. It is broader and harder than the
|
|
106
|
+
8-case published table, and recall remains the active improvement target.
|
|
107
|
+
Reproduce the expanded public suite:
|
|
108
|
+
|
|
109
|
+
```bash
|
|
110
|
+
agentpack benchmark --public-suite --reproduce v0.3.20
|
|
111
|
+
```
|
|
112
|
+
|
|
113
|
+
Benchmark methodology is documented in [`benchmarks/results/v0.3.20/methodology.md`](benchmarks/results/v0.3.20/methodology.md).
|
|
114
|
+
|
|
115
|
+
### Next Release Benchmark Target
|
|
116
|
+
|
|
117
|
+
The next benchmark release target is to raise expanded public suite results from the
|
|
118
|
+
current **57.0% recall / 50.6% token precision** baseline to **65%+ recall**
|
|
119
|
+
while keeping token precision at **50%+**. The target should be measured on the
|
|
120
|
+
same 100+ public historical-commit suite, with per-language slices published so
|
|
121
|
+
precision gains are not hiding TypeScript, Go, Java, or monorepo regressions.
|
|
122
|
+
|
|
123
|
+
Decision gate for the next public table:
|
|
124
|
+
|
|
125
|
+
- full-suite recall is at least 65.0%
|
|
126
|
+
- full-suite token precision is at least 50.0%
|
|
127
|
+
- no major language or task slice loses more than 2 percentage points of recall
|
|
128
|
+
- Vite/TypeScript, Gin/Go, and NestJS monorepo misses are reported separately
|
|
129
|
+
- any AgentPack-vs-no-AgentPack A/B claim includes task success, tool calls,
|
|
130
|
+
token cost, and time-to-first-correct-file
|
|
131
|
+
|
|
132
|
+
## Trust
|
|
133
|
+
|
|
134
|
+
AgentPack is MIT-licensed, local-first, and uses PyPI Trusted Publishing plus
|
|
135
|
+
npm provenance for release artifacts. See [`SECURITY.md`](SECURITY.md),
|
|
136
|
+
[`docs/privacy.md`](docs/privacy.md), [`docs/threat-model.md`](docs/threat-model.md),
|
|
137
|
+
and [`docs/data-flow.md`](docs/data-flow.md).
|
|
97
138
|
|
|
98
139
|
## Use Cases
|
|
99
140
|
|
|
100
|
-
|
|
101
|
-
- [MCP
|
|
102
|
-
|
|
103
|
-
|
|
104
|
-
- [Reduce Claude Code token usage](docs/reduce-claude-code-token-usage.md)
|
|
105
|
-
- [How AgentPack works](docs/how-agentpack-works.md)
|
|
106
|
-
- [AgentPack vs Repomix](docs/agentpack-vs-repomix.md)
|
|
107
|
-
- [AgentPack vs Augment Context Engine](docs/agentpack-vs-augment-context-engine.md)
|
|
108
|
-
- [Docs index](docs/index.md)
|
|
141
|
+
Start with the [docs index](docs/index.md), or jump to guides for
|
|
142
|
+
[Claude Code](docs/claude-code-context-engine.md), [MCP](docs/mcp-context-engine.md),
|
|
143
|
+
[Cursor](docs/cursor-context-packing.md), [token usage](docs/reduce-claude-code-token-usage.md),
|
|
144
|
+
and [how AgentPack works](docs/how-agentpack-works.md).
|
|
109
145
|
|
|
110
146
|
## Install
|
|
111
147
|
|
|
@@ -233,7 +269,7 @@ budget = 8000
|
|
|
233
269
|
output = ".agentpack/context.md"
|
|
234
270
|
```
|
|
235
271
|
|
|
236
|
-
Use `agentpack pack --mode lite` when you want a cheap ranked map before deeper file reads. Use
|
|
272
|
+
Use `agentpack pack --mode lite` when you want a cheap ranked map before deeper file reads. Use the default `balanced` mode for normal agent work and benchmark claims. Use `deep` when the task needs broader docs and source context.
|
|
237
273
|
|
|
238
274
|
Use `.agentignore` to remove generated output, vendored code, large exports, or files that repeatedly appear as ranking noise. AgentPack imports obvious generated/noisy entries from gitignore sources during init, but repository-specific outputs should still be added by hand.
|
|
239
275
|
|
|
@@ -350,18 +386,6 @@ THREAD=codex-local make context-thread
|
|
|
350
386
|
AGENTPACK_THREAD_ID=codex-local make context-thread
|
|
351
387
|
```
|
|
352
388
|
|
|
353
|
-
## Benchmark Proof
|
|
354
|
-
|
|
355
|
-
AgentPack is best treated as a ranked starting map. It can reduce repeated orientation work, but the agent and reviewer still own correctness.
|
|
356
|
-
|
|
357
|
-
Use real repo evals instead of trusting compression numbers:
|
|
358
|
-
|
|
359
|
-
```bash
|
|
360
|
-
agentpack benchmark --release-gate
|
|
361
|
-
```
|
|
362
|
-
|
|
363
|
-
Current benchmark evidence is documented in [`benchmarks/README.md`](benchmarks/README.md) and the generated tables under `benchmarks/results/`. Treat these as scoped evidence for the included cases, not a universal performance claim.
|
|
364
|
-
|
|
365
389
|
## What A Pack Contains
|
|
366
390
|
|
|
367
391
|
Rendered packs are meant to be readable by humans and directly useful to agents. A typical pack includes:
|