agentpack-cli 0.3.19__tar.gz → 0.3.21__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/PKG-INFO +88 -90
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/README.md +87 -89
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/pyproject.toml +1 -1
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/__init__.py +1 -1
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/ranking.py +410 -19
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/symbols.py +4 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/application/pack_service.py +52 -30
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/benchmark.py +1010 -24
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/diagnose_selection.py +1 -1
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/explain.py +11 -6
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/guard.py +4 -3
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/init.py +14 -16
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/migrate.py +4 -3
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/pack.py +6 -5
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/quickstart.py +5 -3
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/stats.py +2 -2
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/tune.py +1 -1
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/config.py +8 -4
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/context_pack.py +419 -38
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/models.py +4 -2
- agentpack_cli-0.3.21/src/agentpack/core/modes.py +23 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/dashboard/collectors.py +68 -4
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/dashboard/renderers.py +180 -56
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/mcp_server.py +2 -2
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/renderers/markdown.py +2 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/router/parser.py +197 -17
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/router/skills_index.py +4 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/summaries/base.py +6 -2
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/.gitignore +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/LICENSE +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/__init__.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/antigravity.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/base.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/claude.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/codex.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/cursor.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/detect.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/generic.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/windsurf.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/__init__.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/dependency_graph.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/go_imports.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/java_imports.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/js_ts_imports.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/monorepo.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/naming_signals.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/python_ast.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/python_imports.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/repo_map.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/role_inference.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/rust_imports.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/task_classifier.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/tests.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/application/__init__.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/cli.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/__init__.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/_shared.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/ci_cmd.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/claude_cmd.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/compress_output.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/dashboard.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/dev_check.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/diff.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/doctor.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/eval_cmd.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/hook_cmd.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/ignore_cmd.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/install.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/learn.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/mcp_cmd.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/memory.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/monitor.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/next_cmd.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/perf.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/release_check.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/release_cmd.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/repair.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/retrieve.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/route.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/scan.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/skills.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/start_cmd.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/state_cmd.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/status.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/summarize.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/task_cmd.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/threads.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/verify_wheel.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/watch.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/workflow_cmd.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/wrap.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/__init__.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/bootstrap.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/cache.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/changed_paths.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/diff.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/evals.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/execution_state.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/git.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/git_hooks.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/global_install.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/ignore.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/loop_protocol.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/merkle.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/pack_registry.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/redactor.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/scanner.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/snapshot.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/task_freshness.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/thread_context.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/token_estimator.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/vscode_tasks.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/dashboard/__init__.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/dashboard/models.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/data/agentpack.md +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/installers/__init__.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/installers/antigravity.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/installers/claude.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/installers/codex.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/installers/cursor.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/installers/windsurf.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/integrations/__init__.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/integrations/agents.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/integrations/git_hooks.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/integrations/global_install.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/integrations/platform.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/integrations/vscode_tasks.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/__init__.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/collector.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/extractor.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/feedback.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/lesson_ranker.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/models.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/provider.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/quality.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/renderers.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/skill_map.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/output_compression/__init__.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/output_compression/core.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/renderers/__init__.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/renderers/compact.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/renderers/receipts.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/router/__init__.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/router/discovery.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/router/models.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/router/prompt_builder.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/router/scoring.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/router/service.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/session/__init__.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/session/events.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/session/state.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/summaries/__init__.py +0 -0
- {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/summaries/offline.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: agentpack-cli
|
|
3
|
-
Version: 0.3.19
|
|
3
|
+
Version: 0.3.21
|
|
4
4
|
Summary: Local MCP context router for Claude Code, Codex, Cursor, and AI coding agents.
|
|
5
5
|
License: MIT
|
|
6
6
|
License-File: LICENSE
|
|
@@ -49,15 +49,17 @@ Description-Content-Type: text/markdown
|
|
|
49
49
|
[](https://opensource.org/licenses/MIT)
|
|
50
50
|
[](https://github.com/vishal2612200/agentpack/actions/workflows/ci.yml)
|
|
51
51
|
|
|
52
|
-
**Local
|
|
52
|
+
**Local context router for AI coding agents.**
|
|
53
53
|
|
|
54
|
-
Claude Code, Codex, Cursor, and other coding agents
|
|
54
|
+
AgentPack gives Claude Code, Codex, Cursor, and other coding agents a ranked starting map before they burn tool calls rediscovering your repo.
|
|
55
55
|
|
|
56
|
-
|
|
56
|
+
One workflow matters:
|
|
57
57
|
|
|
58
|
-
|
|
58
|
+
```text
|
|
59
|
+
route -> pack -> agent acts -> benchmark captures miss
|
|
60
|
+
```
|
|
59
61
|
|
|
60
|
-
|
|
62
|
+
First route the task to likely files, tests, rules, and skills:
|
|
61
63
|
|
|
62
64
|
```bash
|
|
63
65
|
pipx run --spec agentpack-cli agentpack route --task "fix auth token expiry"
|
|
@@ -65,94 +67,72 @@ pipx run --spec agentpack-cli agentpack route --task "fix auth token expiry"
|
|
|
65
67
|
|
|
66
68
|

|
|
67
69
|
|
|
68
|
-
> **Status: alpha (v0.3.
|
|
70
|
+
> **Status: alpha (v0.3.21).** Works, tested, and used in real sessions. Python and JavaScript/TypeScript are the best-supported languages. Current benchmarks are useful regression checks, not broad proof that AgentPack improves coding-agent success. API may change before 1.0.
|
|
69
71
|
>
|
|
70
72
|
> **Platform note:** macOS, Linux, and Windows are supported. Windows support targets PowerShell plus Git for Windows. `cmd.exe` and bare Git setups are not a supported path yet.
|
|
71
73
|
>
|
|
72
74
|
> **Name note:** PyPI package is `agentpack-cli`, npm package is `@vishal2612200/agentpack`, and the command is `agentpack`. This project is unrelated to AgentPack dataset papers or other repos with the same name.
|
|
73
75
|
|
|
74
|
-
## What's New in 0.3.
|
|
76
|
+
## What's New in 0.3.21
|
|
75
77
|
|
|
76
|
-
`0.3.
|
|
77
|
-
|
|
78
|
-
|
|
78
|
+
`0.3.21` is a benchmark trust release. It keeps the current honest expanded
|
|
79
|
+
public-suite baseline at **57.0% recall / 50.6% token precision**, removes the
|
|
80
|
+
legacy minimal-mode surface in favor of `balanced`, improves benchmark
|
|
81
|
+
diagnostics and public-suite methodology, and documents the next release target:
|
|
82
|
+
**65%+ recall while holding 50%+ token precision**.
|
|
79
83
|
|
|
80
|
-
##
|
|
84
|
+
## Core Workflow
|
|
81
85
|
|
|
82
|
-
|
|
83
|
-
frontmatter, confidence thresholds, negative triggers, diversity-aware ranking,
|
|
84
|
-
and a pull-based MCP `get_skill` flow. Skill benchmark cases can declare
|
|
85
|
-
`expected_skills` and `avoid_skills`, and `agentpack skills feedback` records
|
|
86
|
-
local outcome signals for future routing.
|
|
86
|
+
### 1. Route
|
|
87
87
|
|
|
88
|
-
|
|
88
|
+
Use the read-only router when you want quick orientation without writing files:
|
|
89
89
|
|
|
90
|
-
|
|
91
|
-
|
|
92
|
-
|
|
90
|
+
```bash
|
|
91
|
+
agentpack route --task "fix auth token expiry"
|
|
92
|
+
```
|
|
93
93
|
|
|
94
|
-
|
|
95
|
-
AgentPack sends a bounded, redacted report JSON on stdin and accepts
|
|
96
|
-
LearningReport-compatible JSON fields on stdout. No hosted service is called
|
|
97
|
-
unless your command does it.
|
|
98
|
-
- `agentpack learn --dashboard` writes a static
|
|
99
|
-
`.agentpack/learning-dashboard.html` for IDE/browser review.
|
|
100
|
-
- `agentpack learn --team-export` writes `.agentpack/team-lessons.md`, a
|
|
101
|
-
shareable lesson file that omits personal skill history.
|
|
102
|
-
- `agentpack learn --feedback`, `--skills`, and `--drills` close the loop from
|
|
103
|
-
a task summary to skill memory and next-practice prompts.
|
|
104
|
-
- `agentpack dev-check` and `agentpack release-check` now print bounded failure
|
|
105
|
-
excerpts, so CI shows the failing test instead of only a red stage name.
|
|
94
|
+
### 2. Pack
|
|
106
95
|
|
|
107
|
-
|
|
96
|
+
```bash
|
|
97
|
+
agentpack task set "fix auth token expiry"
|
|
98
|
+
agentpack pack --task auto
|
|
99
|
+
```
|
|
108
100
|
|
|
109
|
-
|
|
101
|
+
AgentPack writes `.agentpack/context.md` with selected files, omitted-file
|
|
102
|
+
receipts, task freshness, token stats, and suggested checks.
|
|
110
103
|
|
|
111
|
-
|
|
112
|
-
Task: fix auth token expiry
|
|
104
|
+
### 3. Agent Acts
|
|
113
105
|
|
|
114
|
-
Agent
|
|
115
|
-
|
|
116
|
-
- opens nearby middleware and config
|
|
117
|
-
- may miss related tests
|
|
118
|
-
- spends early turns building a repo map
|
|
119
|
-
```
|
|
106
|
+
Point the agent at the pack or use MCP tools. The agent still verifies code before
|
|
107
|
+
editing; AgentPack is a map, not a correctness proof.
|
|
120
108
|
|
|
121
|
-
|
|
109
|
+
### 4. Benchmark Captures Miss
|
|
110
|
+
|
|
111
|
+
After a task, capture the files that actually changed:
|
|
122
112
|
|
|
123
113
|
```bash
|
|
124
|
-
agentpack
|
|
114
|
+
agentpack benchmark capture --since main --task "fix auth token expiry"
|
|
115
|
+
agentpack benchmark --misses
|
|
125
116
|
```
|
|
126
117
|
|
|
127
|
-
|
|
128
|
-
|
|
129
|
-
fix auth token expiry
|
|
130
|
-
|
|
131
|
-
Relevant files:
|
|
132
|
-
- tests/test_auth.py
|
|
133
|
-
- src/app/auth.py
|
|
134
|
-
- src/app/users.py
|
|
135
|
-
|
|
136
|
-
Suggested commands:
|
|
137
|
-
- pytest tests/test_auth.py -q
|
|
138
|
-
```
|
|
118
|
+
Miss diagnostics show whether a required file was ignored, scored too low,
|
|
119
|
+
ranked but cut by budget, or absent from scan.
|
|
139
120
|
|
|
140
121
|
## Features
|
|
141
122
|
|
|
142
|
-
- **
|
|
143
|
-
- **
|
|
144
|
-
- **
|
|
145
|
-
- **
|
|
146
|
-
- **
|
|
147
|
-
- **Task router**: MCP and CLI surfaces route a task to relevant files, scoped rules, installed skills, suggested commands, and safety warnings without executing skills automatically.
|
|
148
|
-
- **Reversible registry and learning layer**: retrieves packed context by block ID, writes developer lessons, and feeds bounded selected-file miss feedback into future ranking.
|
|
149
|
-
- **Runtime scorecard and output compression**: `perf --history` tracks activity, while `compress-output` preserves failures, paths, diffs, and search hits from noisy logs.
|
|
150
|
-
- **Agent integrations**: installs Claude Code, Cursor, Windsurf, Codex, Antigravity, VS Code tasks, git hooks, and MCP configuration.
|
|
151
|
-
- **Local and measurable**: no API calls for scan, summarize, rank, pack, stats, or benchmark; quality is measured with expected-file evals.
|
|
123
|
+
- **Route**: read-only task map with relevant files, tests, rules, skills, commands, and warnings.
|
|
124
|
+
- **Pack**: budgeted context with `full`, `diff`, `symbols`, `skeleton`, or `summary` file views.
|
|
125
|
+
- **Act**: CLI, markdown, MCP, and agent integrations for Claude Code, Codex, Cursor, Windsurf, Antigravity, and generic agents.
|
|
126
|
+
- **Benchmark**: expected-file recall, token precision, miss diagnostics, public commit suites, and E2E A/B reports.
|
|
127
|
+
- **Local**: no cloud indexing, embeddings, or API calls for scan, summarize, rank, pack, stats, or benchmark.
|
|
152
128
|
|
|
153
129
|
## Benchmark Proof
|
|
154
130
|
|
|
155
|
-
Latest
|
|
131
|
+
Latest published v0.3.20 release table: 8 pinned public commits from Pallets
|
|
132
|
+
Click, ItsDangerous, and MarkupSafe, scored against files actually changed by
|
|
133
|
+
each commit. The public manifest now also supports 100+ sampled historical
|
|
134
|
+
commits across Python, TypeScript, Go, Java, and monorepo repos for broader
|
|
135
|
+
release runs.
|
|
156
136
|
|
|
157
137
|
| Metric | Result |
|
|
158
138
|
|---|---:|
|
|
@@ -161,18 +141,48 @@ Latest public release gate: 8 real commits from Pallets Click, ItsDangerous, and
|
|
|
161
141
|
| Pack p50 | 1,450 tokens |
|
|
162
142
|
| Pack p95 | 3,805 tokens |
|
|
163
143
|
|
|
164
|
-
Full table: [`benchmarks/results/2026-
|
|
144
|
+
Full v0.3.20 table: [`benchmarks/results/2026-06-11-public.md`](benchmarks/results/2026-06-11-public.md). This is scoped benchmark evidence, not a universal quality claim.
|
|
145
|
+
The expanded 109-case public suite is the current optimization baseline:
|
|
146
|
+
**57.0% recall / 50.6% token precision**. It is broader and harder than the
|
|
147
|
+
8-case published table, and recall remains the active improvement target.
|
|
148
|
+
Reproduce the expanded public suite:
|
|
149
|
+
|
|
150
|
+
```bash
|
|
151
|
+
agentpack benchmark --public-suite --reproduce v0.3.20
|
|
152
|
+
```
|
|
153
|
+
|
|
154
|
+
Benchmark methodology lives under [`benchmarks/results/v0.3.20/`](benchmarks/results/v0.3.20/methodology.md).
|
|
155
|
+
|
|
156
|
+
### Next Release Benchmark Target
|
|
157
|
+
|
|
158
|
+
The next benchmark release target is to raise the expanded public suite from the
|
|
159
|
+
current **57.0% recall / 50.6% token precision** baseline to **65%+ recall**
|
|
160
|
+
while keeping token precision at **50%+**. The target should be measured on the
|
|
161
|
+
same 100+ public historical-commit suite, with per-language slices published so
|
|
162
|
+
precision gains are not hiding TypeScript, Go, Java, or monorepo regressions.
|
|
163
|
+
|
|
164
|
+
Decision gate for the next public table:
|
|
165
|
+
|
|
166
|
+
- full-suite recall is at least 65.0%
|
|
167
|
+
- full-suite token precision is at least 50.0%
|
|
168
|
+
- no major language or task slice loses more than 2 recall points
|
|
169
|
+
- Vite/TypeScript, Gin/Go, and NestJS monorepo misses are reported separately
|
|
170
|
+
- any AgentPack-vs-no-AgentPack A/B claim includes task success, tool calls,
|
|
171
|
+
token cost, and time-to-first-correct-file
|
|
172
|
+
|
|
173
|
+
## Trust
|
|
174
|
+
|
|
175
|
+
AgentPack is MIT licensed, local-first, and uses PyPI Trusted Publishing plus
|
|
176
|
+
npm provenance for release artifacts. See [`SECURITY.md`](SECURITY.md),
|
|
177
|
+
[`docs/privacy.md`](docs/privacy.md), [`docs/threat-model.md`](docs/threat-model.md),
|
|
178
|
+
and [`docs/data-flow.md`](docs/data-flow.md).
|
|
165
179
|
|
|
166
180
|
## Use Cases
|
|
167
181
|
|
|
168
|
-
|
|
169
|
-
- [MCP
|
|
170
|
-
|
|
171
|
-
|
|
172
|
-
- [Reduce Claude Code token usage](docs/reduce-claude-code-token-usage.md)
|
|
173
|
-
- [AgentPack vs Repomix](docs/agentpack-vs-repomix.md)
|
|
174
|
-
- [AgentPack vs Augment Context Engine](docs/agentpack-vs-augment-context-engine.md)
|
|
175
|
-
- [Docs index](docs/index.md)
|
|
182
|
+
Start with the [docs index](docs/index.md), or jump to guides for
|
|
183
|
+
[Claude Code](docs/claude-code-context-engine.md), [MCP](docs/mcp-context-engine.md),
|
|
184
|
+
[Cursor](docs/cursor-context-packing.md), [token usage](docs/reduce-claude-code-token-usage.md),
|
|
185
|
+
and [how AgentPack works](docs/how-agentpack-works.md).
|
|
176
186
|
|
|
177
187
|
## Install
|
|
178
188
|
|
|
@@ -300,7 +310,7 @@ budget = 8000
|
|
|
300
310
|
output = ".agentpack/context.md"
|
|
301
311
|
```
|
|
302
312
|
|
|
303
|
-
Use `agentpack pack --mode lite` when you want a cheap ranked map before deeper file reads. Use
|
|
313
|
+
Use `agentpack pack --mode lite` when you want a cheap ranked map before deeper file reads. Use the default `balanced` mode for normal agent work and benchmark claims. Use `deep` when the task needs broader docs and source context.
|
|
304
314
|
|
|
305
315
|
Use `.agentignore` to remove generated output, vendored code, large exports, or files that repeatedly appear as ranking noise. AgentPack imports obvious generated/noisy entries from gitignore sources during init, but repository-specific outputs should still be added by hand.
|
|
306
316
|
|
|
@@ -417,18 +427,6 @@ THREAD=codex-local make context-thread
|
|
|
417
427
|
AGENTPACK_THREAD_ID=codex-local make context-thread
|
|
418
428
|
```
|
|
419
429
|
|
|
420
|
-
## Benchmark Proof
|
|
421
|
-
|
|
422
|
-
AgentPack is best treated as a ranked starting map. It can reduce repeated orientation work, but the agent and reviewer still own correctness.
|
|
423
|
-
|
|
424
|
-
Use real repo evals instead of trusting compression numbers:
|
|
425
|
-
|
|
426
|
-
```bash
|
|
427
|
-
agentpack benchmark --release-gate
|
|
428
|
-
```
|
|
429
|
-
|
|
430
|
-
Current benchmark evidence is documented in [`benchmarks/README.md`](benchmarks/README.md) and the generated tables under `benchmarks/results/`. Treat these as scoped evidence for the included cases, not a universal performance claim.
|
|
431
|
-
|
|
432
430
|
## What A Pack Contains
|
|
433
431
|
|
|
434
432
|
Rendered packs are meant to be readable by humans and directly useful to agents. A typical pack includes:
|
|
@@ -8,15 +8,17 @@
|
|
|
8
8
|
[](https://opensource.org/licenses/MIT)
|
|
9
9
|
[](https://github.com/vishal2612200/agentpack/actions/workflows/ci.yml)
|
|
10
10
|
|
|
11
|
-
**Local
|
|
11
|
+
**Local context router for AI coding agents.**
|
|
12
12
|
|
|
13
|
-
Claude Code, Codex, Cursor, and other coding agents
|
|
13
|
+
AgentPack gives Claude Code, Codex, Cursor, and other coding agents a ranked starting map before they burn tool calls rediscovering your repo.
|
|
14
14
|
|
|
15
|
-
|
|
15
|
+
One workflow matters:
|
|
16
16
|
|
|
17
|
-
|
|
17
|
+
```text
|
|
18
|
+
route -> pack -> agent acts -> benchmark captures miss
|
|
19
|
+
```
|
|
18
20
|
|
|
19
|
-
|
|
21
|
+
First route the task to likely files, tests, rules, and skills:
|
|
20
22
|
|
|
21
23
|
```bash
|
|
22
24
|
pipx run --spec agentpack-cli agentpack route --task "fix auth token expiry"
|
|
@@ -24,94 +26,72 @@ pipx run --spec agentpack-cli agentpack route --task "fix auth token expiry"
|
|
|
24
26
|
|
|
25
27
|

|
|
26
28
|
|
|
27
|
-
> **Status: alpha (v0.3.
|
|
29
|
+
> **Status: alpha (v0.3.21).** Works, tested, and used in real sessions. Python and JavaScript/TypeScript are the best-supported languages. Current benchmarks are useful regression checks, not broad proof that AgentPack improves coding-agent success. API may change before 1.0.
|
|
28
30
|
>
|
|
29
31
|
> **Platform note:** macOS, Linux, and Windows are supported. Windows support targets PowerShell plus Git for Windows. `cmd.exe` and bare Git setups are not a supported path yet.
|
|
30
32
|
>
|
|
31
33
|
> **Name note:** PyPI package is `agentpack-cli`, npm package is `@vishal2612200/agentpack`, and the command is `agentpack`. This project is unrelated to AgentPack dataset papers or other repos with the same name.
|
|
32
34
|
|
|
33
|
-
## What's New in 0.3.
|
|
35
|
+
## What's New in 0.3.21
|
|
34
36
|
|
|
35
|
-
`0.3.
|
|
36
|
-
|
|
37
|
-
|
|
37
|
+
`0.3.21` is a benchmark trust release. It keeps the current honest expanded
|
|
38
|
+
public-suite baseline at **57.0% recall / 50.6% token precision**, removes the
|
|
39
|
+
legacy minimal-mode surface in favor of `balanced`, improves benchmark
|
|
40
|
+
diagnostics and public-suite methodology, and documents the next release target:
|
|
41
|
+
**65%+ recall while holding 50%+ token precision**.
|
|
38
42
|
|
|
39
|
-
##
|
|
43
|
+
## Core Workflow
|
|
40
44
|
|
|
41
|
-
|
|
42
|
-
frontmatter, confidence thresholds, negative triggers, diversity-aware ranking,
|
|
43
|
-
and a pull-based MCP `get_skill` flow. Skill benchmark cases can declare
|
|
44
|
-
`expected_skills` and `avoid_skills`, and `agentpack skills feedback` records
|
|
45
|
-
local outcome signals for future routing.
|
|
45
|
+
### 1. Route
|
|
46
46
|
|
|
47
|
-
|
|
47
|
+
Use the read-only router when you want quick orientation without writing files:
|
|
48
48
|
|
|
49
|
-
|
|
50
|
-
|
|
51
|
-
|
|
49
|
+
```bash
|
|
50
|
+
agentpack route --task "fix auth token expiry"
|
|
51
|
+
```
|
|
52
52
|
|
|
53
|
-
|
|
54
|
-
AgentPack sends a bounded, redacted report JSON on stdin and accepts
|
|
55
|
-
LearningReport-compatible JSON fields on stdout. No hosted service is called
|
|
56
|
-
unless your command does it.
|
|
57
|
-
- `agentpack learn --dashboard` writes a static
|
|
58
|
-
`.agentpack/learning-dashboard.html` for IDE/browser review.
|
|
59
|
-
- `agentpack learn --team-export` writes `.agentpack/team-lessons.md`, a
|
|
60
|
-
shareable lesson file that omits personal skill history.
|
|
61
|
-
- `agentpack learn --feedback`, `--skills`, and `--drills` close the loop from
|
|
62
|
-
a task summary to skill memory and next-practice prompts.
|
|
63
|
-
- `agentpack dev-check` and `agentpack release-check` now print bounded failure
|
|
64
|
-
excerpts, so CI shows the failing test instead of only a red stage name.
|
|
53
|
+
### 2. Pack
|
|
65
54
|
|
|
66
|
-
|
|
55
|
+
```bash
|
|
56
|
+
agentpack task set "fix auth token expiry"
|
|
57
|
+
agentpack pack --task auto
|
|
58
|
+
```
|
|
67
59
|
|
|
68
|
-
|
|
60
|
+
AgentPack writes `.agentpack/context.md` with selected files, omitted-file
|
|
61
|
+
receipts, task freshness, token stats, and suggested checks.
|
|
69
62
|
|
|
70
|
-
|
|
71
|
-
Task: fix auth token expiry
|
|
63
|
+
### 3. Agent Acts
|
|
72
64
|
|
|
73
|
-
Agent
|
|
74
|
-
|
|
75
|
-
- opens nearby middleware and config
|
|
76
|
-
- may miss related tests
|
|
77
|
-
- spends early turns building a repo map
|
|
78
|
-
```
|
|
65
|
+
Point the agent at the pack or use MCP tools. The agent still verifies code before
|
|
66
|
+
editing; AgentPack is a map, not a correctness proof.
|
|
79
67
|
|
|
80
|
-
|
|
68
|
+
### 4. Benchmark Captures Miss
|
|
69
|
+
|
|
70
|
+
After a task, capture the files that actually changed:
|
|
81
71
|
|
|
82
72
|
```bash
|
|
83
|
-
agentpack
|
|
73
|
+
agentpack benchmark capture --since main --task "fix auth token expiry"
|
|
74
|
+
agentpack benchmark --misses
|
|
84
75
|
```
|
|
85
76
|
|
|
86
|
-
|
|
87
|
-
|
|
88
|
-
fix auth token expiry
|
|
89
|
-
|
|
90
|
-
Relevant files:
|
|
91
|
-
- tests/test_auth.py
|
|
92
|
-
- src/app/auth.py
|
|
93
|
-
- src/app/users.py
|
|
94
|
-
|
|
95
|
-
Suggested commands:
|
|
96
|
-
- pytest tests/test_auth.py -q
|
|
97
|
-
```
|
|
77
|
+
Miss diagnostics show whether a required file was ignored, scored too low,
|
|
78
|
+
ranked but cut by budget, or absent from scan.
|
|
98
79
|
|
|
99
80
|
## Features
|
|
100
81
|
|
|
101
|
-
- **
|
|
102
|
-
- **
|
|
103
|
-
- **
|
|
104
|
-
- **
|
|
105
|
-
- **
|
|
106
|
-
- **Task router**: MCP and CLI surfaces route a task to relevant files, scoped rules, installed skills, suggested commands, and safety warnings without executing skills automatically.
|
|
107
|
-
- **Reversible registry and learning layer**: retrieves packed context by block ID, writes developer lessons, and feeds bounded selected-file miss feedback into future ranking.
|
|
108
|
-
- **Runtime scorecard and output compression**: `perf --history` tracks activity, while `compress-output` preserves failures, paths, diffs, and search hits from noisy logs.
|
|
109
|
-
- **Agent integrations**: installs Claude Code, Cursor, Windsurf, Codex, Antigravity, VS Code tasks, git hooks, and MCP configuration.
|
|
110
|
-
- **Local and measurable**: no API calls for scan, summarize, rank, pack, stats, or benchmark; quality is measured with expected-file evals.
|
|
82
|
+
- **Route**: read-only task map with relevant files, tests, rules, skills, commands, and warnings.
|
|
83
|
+
- **Pack**: budgeted context with `full`, `diff`, `symbols`, `skeleton`, or `summary` file views.
|
|
84
|
+
- **Act**: CLI, markdown, MCP, and agent integrations for Claude Code, Codex, Cursor, Windsurf, Antigravity, and generic agents.
|
|
85
|
+
- **Benchmark**: expected-file recall, token precision, miss diagnostics, public commit suites, and E2E A/B reports.
|
|
86
|
+
- **Local**: no cloud indexing, embeddings, or API calls for scan, summarize, rank, pack, stats, or benchmark.
|
|
111
87
|
|
|
112
88
|
## Benchmark Proof
|
|
113
89
|
|
|
114
|
-
Latest
|
|
90
|
+
Latest published v0.3.20 release table: 8 pinned public commits from Pallets
|
|
91
|
+
Click, ItsDangerous, and MarkupSafe, scored against files actually changed by
|
|
92
|
+
each commit. The public manifest now also supports 100+ sampled historical
|
|
93
|
+
commits across Python, TypeScript, Go, Java, and monorepo repos for broader
|
|
94
|
+
release runs.
|
|
115
95
|
|
|
116
96
|
| Metric | Result |
|
|
117
97
|
|---|---:|
|
|
@@ -120,18 +100,48 @@ Latest public release gate: 8 real commits from Pallets Click, ItsDangerous, and
|
|
|
120
100
|
| Pack p50 | 1,450 tokens |
|
|
121
101
|
| Pack p95 | 3,805 tokens |
|
|
122
102
|
|
|
123
|
-
Full table: [`benchmarks/results/2026-
|
|
103
|
+
Full v0.3.20 table: [`benchmarks/results/2026-06-11-public.md`](benchmarks/results/2026-06-11-public.md). This is scoped benchmark evidence, not a universal quality claim.
|
|
104
|
+
The expanded 109-case public suite is the current optimization baseline:
|
|
105
|
+
**57.0% recall / 50.6% token precision**. It is broader and harder than the
|
|
106
|
+
8-case published table, and recall remains the active improvement target.
|
|
107
|
+
Reproduce the expanded public suite:
|
|
108
|
+
|
|
109
|
+
```bash
|
|
110
|
+
agentpack benchmark --public-suite --reproduce v0.3.20
|
|
111
|
+
```
|
|
112
|
+
|
|
113
|
+
Benchmark methodology lives in [`benchmarks/results/v0.3.20/methodology.md`](benchmarks/results/v0.3.20/methodology.md).
|
|
114
|
+
|
|
115
|
+
### Next Release Benchmark Target
|
|
116
|
+
|
|
117
|
+
The next benchmark release target is to raise the expanded public suite from the
|
|
118
|
+
current **57.0% recall / 50.6% token precision** baseline to **65%+ recall**
|
|
119
|
+
while keeping token precision at **50%+**. The target should be measured on the
|
|
120
|
+
same 100+ public historical-commit suite, with per-language slices published so
|
|
121
|
+
precision gains are not hiding TypeScript, Go, Java, or monorepo regressions.
|
|
122
|
+
|
|
123
|
+
Decision gate for the next public table:
|
|
124
|
+
|
|
125
|
+
- full-suite recall is at least 65.0%
|
|
126
|
+
- full-suite token precision is at least 50.0%
|
|
127
|
+
- no major language or task slice loses more than 2 percentage points of recall
|
|
128
|
+
- Vite/TypeScript, Gin/Go, and NestJS monorepo misses are reported separately
|
|
129
|
+
- any AgentPack-vs-no-AgentPack A/B claim includes task success, tool calls,
|
|
130
|
+
token cost, and time-to-first-correct-file
|
|
131
|
+
|
|
132
|
+
## Trust
|
|
133
|
+
|
|
134
|
+
AgentPack is MIT-licensed, local-first, and uses PyPI Trusted Publishing plus
|
|
135
|
+
npm provenance for release artifacts. See [`SECURITY.md`](SECURITY.md),
|
|
136
|
+
[`docs/privacy.md`](docs/privacy.md), [`docs/threat-model.md`](docs/threat-model.md),
|
|
137
|
+
and [`docs/data-flow.md`](docs/data-flow.md).
|
|
124
138
|
|
|
125
139
|
## Use Cases
|
|
126
140
|
|
|
127
|
-
|
|
128
|
-
- [MCP
|
|
129
|
-
|
|
130
|
-
|
|
131
|
-
- [Reduce Claude Code token usage](docs/reduce-claude-code-token-usage.md)
|
|
132
|
-
- [AgentPack vs Repomix](docs/agentpack-vs-repomix.md)
|
|
133
|
-
- [AgentPack vs Augment Context Engine](docs/agentpack-vs-augment-context-engine.md)
|
|
134
|
-
- [Docs index](docs/index.md)
|
|
141
|
+
Start with the [docs index](docs/index.md), or jump to guides for
|
|
142
|
+
[Claude Code](docs/claude-code-context-engine.md), [MCP](docs/mcp-context-engine.md),
|
|
143
|
+
[Cursor](docs/cursor-context-packing.md), [token usage](docs/reduce-claude-code-token-usage.md),
|
|
144
|
+
and [how AgentPack works](docs/how-agentpack-works.md).
|
|
135
145
|
|
|
136
146
|
## Install
|
|
137
147
|
|
|
@@ -259,7 +269,7 @@ budget = 8000
|
|
|
259
269
|
output = ".agentpack/context.md"
|
|
260
270
|
```
|
|
261
271
|
|
|
262
|
-
Use `agentpack pack --mode lite` when you want a cheap ranked map before deeper file reads. Use
|
|
272
|
+
Use `agentpack pack --mode lite` when you want a cheap ranked map before deeper file reads. Use the default `balanced` mode for normal agent work and benchmark claims. Use `deep` when the task needs broader docs and source context.
|
|
263
273
|
|
|
264
274
|
Use `.agentignore` to remove generated output, vendored code, large exports, or files that repeatedly appear as ranking noise. AgentPack imports obvious generated/noisy entries from gitignore sources during init, but repository-specific outputs should still be added by hand.
|
|
265
275
|
|
|
@@ -376,18 +386,6 @@ THREAD=codex-local make context-thread
|
|
|
376
386
|
AGENTPACK_THREAD_ID=codex-local make context-thread
|
|
377
387
|
```
|
|
378
388
|
|
|
379
|
-
## Benchmark Proof
|
|
380
|
-
|
|
381
|
-
AgentPack is best treated as a ranked starting map. It can reduce repeated orientation work, but the agent and reviewer still own correctness.
|
|
382
|
-
|
|
383
|
-
Use real repo evals instead of trusting compression numbers:
|
|
384
|
-
|
|
385
|
-
```bash
|
|
386
|
-
agentpack benchmark --release-gate
|
|
387
|
-
```
|
|
388
|
-
|
|
389
|
-
Current benchmark evidence is documented in [`benchmarks/README.md`](benchmarks/README.md) and the generated tables under `benchmarks/results/`. Treat these as scoped evidence for the included cases, not a universal performance claim.
|
|
390
|
-
|
|
391
389
|
## What A Pack Contains
|
|
392
390
|
|
|
393
391
|
Rendered packs are meant to be readable by humans and directly useful to agents. A typical pack includes:
|