agentpack-cli 0.3.19__tar.gz → 0.3.21__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (153) hide show
  1. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/PKG-INFO +88 -90
  2. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/README.md +87 -89
  3. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/pyproject.toml +1 -1
  4. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/__init__.py +1 -1
  5. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/ranking.py +410 -19
  6. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/symbols.py +4 -0
  7. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/application/pack_service.py +52 -30
  8. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/benchmark.py +1010 -24
  9. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/diagnose_selection.py +1 -1
  10. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/explain.py +11 -6
  11. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/guard.py +4 -3
  12. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/init.py +14 -16
  13. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/migrate.py +4 -3
  14. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/pack.py +6 -5
  15. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/quickstart.py +5 -3
  16. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/stats.py +2 -2
  17. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/tune.py +1 -1
  18. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/config.py +8 -4
  19. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/context_pack.py +419 -38
  20. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/models.py +4 -2
  21. agentpack_cli-0.3.21/src/agentpack/core/modes.py +23 -0
  22. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/dashboard/collectors.py +68 -4
  23. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/dashboard/renderers.py +180 -56
  24. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/mcp_server.py +2 -2
  25. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/renderers/markdown.py +2 -0
  26. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/router/parser.py +197 -17
  27. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/router/skills_index.py +4 -0
  28. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/summaries/base.py +6 -2
  29. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/.gitignore +0 -0
  30. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/LICENSE +0 -0
  31. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/__init__.py +0 -0
  32. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/antigravity.py +0 -0
  33. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/base.py +0 -0
  34. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/claude.py +0 -0
  35. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/codex.py +0 -0
  36. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/cursor.py +0 -0
  37. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/detect.py +0 -0
  38. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/generic.py +0 -0
  39. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/adapters/windsurf.py +0 -0
  40. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/__init__.py +0 -0
  41. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/dependency_graph.py +0 -0
  42. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/go_imports.py +0 -0
  43. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/java_imports.py +0 -0
  44. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/js_ts_imports.py +0 -0
  45. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/monorepo.py +0 -0
  46. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/naming_signals.py +0 -0
  47. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/python_ast.py +0 -0
  48. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/python_imports.py +0 -0
  49. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/repo_map.py +0 -0
  50. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/role_inference.py +0 -0
  51. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/rust_imports.py +0 -0
  52. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/task_classifier.py +0 -0
  53. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/analysis/tests.py +0 -0
  54. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/application/__init__.py +0 -0
  55. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/cli.py +0 -0
  56. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/__init__.py +0 -0
  57. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/_shared.py +0 -0
  58. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/ci_cmd.py +0 -0
  59. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/claude_cmd.py +0 -0
  60. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/compress_output.py +0 -0
  61. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/dashboard.py +0 -0
  62. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/dev_check.py +0 -0
  63. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/diff.py +0 -0
  64. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/doctor.py +0 -0
  65. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/eval_cmd.py +0 -0
  66. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/hook_cmd.py +0 -0
  67. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/ignore_cmd.py +0 -0
  68. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/install.py +0 -0
  69. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/learn.py +0 -0
  70. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/mcp_cmd.py +0 -0
  71. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/memory.py +0 -0
  72. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/monitor.py +0 -0
  73. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/next_cmd.py +0 -0
  74. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/perf.py +0 -0
  75. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/release_check.py +0 -0
  76. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/release_cmd.py +0 -0
  77. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/repair.py +0 -0
  78. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/retrieve.py +0 -0
  79. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/route.py +0 -0
  80. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/scan.py +0 -0
  81. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/skills.py +0 -0
  82. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/start_cmd.py +0 -0
  83. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/state_cmd.py +0 -0
  84. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/status.py +0 -0
  85. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/summarize.py +0 -0
  86. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/task_cmd.py +0 -0
  87. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/threads.py +0 -0
  88. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/verify_wheel.py +0 -0
  89. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/watch.py +0 -0
  90. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/workflow_cmd.py +0 -0
  91. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/commands/wrap.py +0 -0
  92. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/__init__.py +0 -0
  93. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/bootstrap.py +0 -0
  94. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/cache.py +0 -0
  95. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/changed_paths.py +0 -0
  96. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/diff.py +0 -0
  97. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/evals.py +0 -0
  98. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/execution_state.py +0 -0
  99. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/git.py +0 -0
  100. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/git_hooks.py +0 -0
  101. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/global_install.py +0 -0
  102. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/ignore.py +0 -0
  103. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/loop_protocol.py +0 -0
  104. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/merkle.py +0 -0
  105. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/pack_registry.py +0 -0
  106. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/redactor.py +0 -0
  107. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/scanner.py +0 -0
  108. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/snapshot.py +0 -0
  109. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/task_freshness.py +0 -0
  110. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/thread_context.py +0 -0
  111. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/token_estimator.py +0 -0
  112. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/core/vscode_tasks.py +0 -0
  113. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/dashboard/__init__.py +0 -0
  114. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/dashboard/models.py +0 -0
  115. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/data/agentpack.md +0 -0
  116. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/installers/__init__.py +0 -0
  117. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/installers/antigravity.py +0 -0
  118. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/installers/claude.py +0 -0
  119. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/installers/codex.py +0 -0
  120. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/installers/cursor.py +0 -0
  121. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/installers/windsurf.py +0 -0
  122. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/integrations/__init__.py +0 -0
  123. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/integrations/agents.py +0 -0
  124. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/integrations/git_hooks.py +0 -0
  125. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/integrations/global_install.py +0 -0
  126. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/integrations/platform.py +0 -0
  127. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/integrations/vscode_tasks.py +0 -0
  128. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/__init__.py +0 -0
  129. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/collector.py +0 -0
  130. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/extractor.py +0 -0
  131. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/feedback.py +0 -0
  132. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/lesson_ranker.py +0 -0
  133. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/models.py +0 -0
  134. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/provider.py +0 -0
  135. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/quality.py +0 -0
  136. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/renderers.py +0 -0
  137. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/learning/skill_map.py +0 -0
  138. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/output_compression/__init__.py +0 -0
  139. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/output_compression/core.py +0 -0
  140. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/renderers/__init__.py +0 -0
  141. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/renderers/compact.py +0 -0
  142. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/renderers/receipts.py +0 -0
  143. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/router/__init__.py +0 -0
  144. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/router/discovery.py +0 -0
  145. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/router/models.py +0 -0
  146. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/router/prompt_builder.py +0 -0
  147. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/router/scoring.py +0 -0
  148. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/router/service.py +0 -0
  149. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/session/__init__.py +0 -0
  150. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/session/events.py +0 -0
  151. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/session/state.py +0 -0
  152. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/summaries/__init__.py +0 -0
  153. {agentpack_cli-0.3.19 → agentpack_cli-0.3.21}/src/agentpack/summaries/offline.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: agentpack-cli
3
- Version: 0.3.19
3
+ Version: 0.3.21
4
4
  Summary: Local MCP context router for Claude Code, Codex, Cursor, and AI coding agents.
5
5
  License: MIT
6
6
  License-File: LICENSE
@@ -49,15 +49,17 @@ Description-Content-Type: text/markdown
49
49
  [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
50
50
  [![CI](https://github.com/vishal2612200/agentpack/actions/workflows/ci.yml/badge.svg)](https://github.com/vishal2612200/agentpack/actions/workflows/ci.yml)
51
51
 
52
- **Local MCP context router for AI coding agents.**
52
+ **Local context router for AI coding agents.**
53
53
 
54
- Claude Code, Codex, Cursor, and other coding agents can waste tool calls rediscovering your repo before they make the edit you asked for.
54
+ AgentPack gives Claude Code, Codex, Cursor, and other coding agents a ranked starting map before they burn tool calls rediscovering your repo.
55
55
 
56
- AgentPack gives them a ranked map of likely relevant files, tests, rules, and skills for each task. It analyzes your repo locally and packages compact context for CLI and MCP workflows.
56
+ One workflow matters:
57
57
 
58
- How it works: AgentPack compresses repo context into ranked packs, caches scans/summaries/pack metadata for fast refreshes, and retrieves exact file or symbol blocks later when an agent needs more detail. Rendered packs also put stable instructions before volatile task, timestamp, git, and file sections so provider prompt-prefix caches can reuse the front of repeated refreshes. No cloud indexing, embeddings, or API calls are required for scan, summarize, rank, pack, stats, or benchmark.
58
+ ```text
59
+ route -> pack -> agent acts -> benchmark captures miss
60
+ ```
59
61
 
60
- Try the read-only task router without writing context files:
62
+ First route the task to likely files, tests, rules, and skills:
61
63
 
62
64
  ```bash
63
65
  pipx run --spec agentpack-cli agentpack route --task "fix auth token expiry"
@@ -65,94 +67,72 @@ pipx run --spec agentpack-cli agentpack route --task "fix auth token expiry"
65
67
 
66
68
  ![AgentPack route demo](docs/assets/agentpack-route-demo.svg)
67
69
 
68
- > **Status: alpha (v0.3.16).** Works, tested, and used in real sessions. Python and JavaScript/TypeScript are the best-supported languages. Current benchmarks are useful regression checks, not broad proof that AgentPack improves coding-agent success. API may change before 1.0.
70
+ > **Status: alpha (v0.3.21).** Works, tested, and used in real sessions. Python and JavaScript/TypeScript are the best-supported languages. Current benchmarks are useful regression checks, not broad proof that AgentPack improves coding-agent success. API may change before 1.0.
69
71
  >
70
72
  > **Platform note:** macOS, Linux, and Windows are supported. Windows support targets PowerShell plus Git for Windows. `cmd.exe` and bare Git setups are not a supported path yet.
71
73
  >
72
74
  > **Name note:** PyPI package is `agentpack-cli`, npm package is `@vishal2612200/agentpack`, and the command is `agentpack`. This project is unrelated to AgentPack dataset papers or other repos with the same name.
73
75
 
74
- ## What's New in 0.3.16
76
+ ## What's New in 0.3.21
75
77
 
76
- `0.3.16` bundles `watchdog` in normal installs so `agentpack watch` uses native
77
- filesystem events by default instead of polling after `pipx`, `pip`, or npm
78
- wrapper installation.
78
+ `0.3.21` is a benchmark trust release. It keeps the current honest expanded
79
+ public-suite baseline at **57.0% recall / 50.6% token precision**, removes the
80
+ legacy minimal-mode surface in favor of `balanced`, improves benchmark
81
+ diagnostics and public-suite methodology, and documents the next release target:
82
+ **65%+ recall while holding 50%+ token precision**.
79
83
 
80
- ## What's New in 0.3.15
84
+ ## Core Workflow
81
85
 
82
- AgentPack Router now recommends skills with stronger local signals: richer
83
- frontmatter, confidence thresholds, negative triggers, diversity-aware ranking,
84
- and a pull-based MCP `get_skill` flow. Skill benchmark cases can declare
85
- `expected_skills` and `avoid_skills`, and `agentpack skills feedback` records
86
- local outcome signals for future routing.
86
+ ### 1. Route
87
87
 
88
- ## What's New in 0.3.14
88
+ Use the read-only router when you want quick orientation without writing files:
89
89
 
90
- AgentPack Learn now covers both sides of AI-assisted development: the coding
91
- agent gets compact future-agent lessons, and the developer gets task-specific
92
- learning notes, skill evidence, and practice follow-up.
90
+ ```bash
91
+ agentpack route --task "fix auth token expiry"
92
+ ```
93
93
 
94
- - `agentpack learn --provider-command` adds an opt-in local provider bridge:
95
- AgentPack sends a bounded, redacted report JSON on stdin and accepts
96
- LearningReport-compatible JSON fields on stdout. No hosted service is called
97
- unless your command does it.
98
- - `agentpack learn --dashboard` writes a static
99
- `.agentpack/learning-dashboard.html` for IDE/browser review.
100
- - `agentpack learn --team-export` writes `.agentpack/team-lessons.md`, a
101
- shareable lesson file that omits personal skill history.
102
- - `agentpack learn --feedback`, `--skills`, and `--drills` close the loop from
103
- a task summary to skill memory and next-practice prompts.
104
- - `agentpack dev-check` and `agentpack release-check` now print bounded failure
105
- excerpts, so CI shows the failing test instead of only a red stage name.
94
+ ### 2. Pack
106
95
 
107
- ## Before vs After
96
+ ```bash
97
+ agentpack task set "fix auth token expiry"
98
+ agentpack pack --task auto
99
+ ```
108
100
 
109
- Without AgentPack, a cold coding-agent session often starts with manual repo orientation:
101
+ AgentPack writes `.agentpack/context.md` with selected files, omitted-file
102
+ receipts, task freshness, token stats, and suggested checks.
110
103
 
111
- ```text
112
- Task: fix auth token expiry
104
+ ### 3. Agent Acts
113
105
 
114
- Agent:
115
- - searches for auth files
116
- - opens nearby middleware and config
117
- - may miss related tests
118
- - spends early turns building a repo map
119
- ```
106
+ Point the agent at the pack or use MCP tools. Agent still verifies code before
107
+ editing; AgentPack is map, not correctness proof.
120
108
 
121
- With AgentPack:
109
+ ### 4. Benchmark Captures Miss
110
+
111
+ After a task, capture the files that actually changed:
122
112
 
123
113
  ```bash
124
- agentpack route --task "fix auth token expiry"
114
+ agentpack benchmark capture --since main --task "fix auth token expiry"
115
+ agentpack benchmark --misses
125
116
  ```
126
117
 
127
- ```text
128
- Task:
129
- fix auth token expiry
130
-
131
- Relevant files:
132
- - tests/test_auth.py
133
- - src/app/auth.py
134
- - src/app/users.py
135
-
136
- Suggested commands:
137
- - pytest tests/test_auth.py -q
138
- ```
118
+ Miss diagnostics show whether a required file was ignored, scored too low,
119
+ ranked but cut by budget, or absent from scan.
139
120
 
140
121
  ## Features
141
122
 
142
- - **Task-focused packing**: ranks files from git changes, task terms, symbols, imports, related tests, configs, churn, repo history, and deterministic offline summaries.
143
- - **Budget-aware compression**: emits `full`, `diff`, `symbols`, `skeleton`, or `summary` views instead of all-or-nothing file dumps.
144
- - **Rendered-token accounting and reserve buckets**: budgets against actual markdown while protecting changed files, tests, docs, and dependencies.
145
- - **Execution state**: optional task state files and git-derived fallback status show whether work is planned, in progress, blocked, done, committed, or committed but not pushed.
146
- - **Thread-scoped context**: explicit `--thread <id>` or `--thread auto` isolates task/context files for multiple agents in one repo and warns on same-branch file overlap.
147
- - **Task router**: MCP and CLI surfaces route a task to relevant files, scoped rules, installed skills, suggested commands, and safety warnings without executing skills automatically.
148
- - **Reversible registry and learning layer**: retrieves packed context by block ID, writes developer lessons, and feeds bounded selected-file miss feedback into future ranking.
149
- - **Runtime scorecard and output compression**: `perf --history` tracks activity, while `compress-output` preserves failures, paths, diffs, and search hits from noisy logs.
150
- - **Agent integrations**: installs Claude Code, Cursor, Windsurf, Codex, Antigravity, VS Code tasks, git hooks, and MCP configuration.
151
- - **Local and measurable**: no API calls for scan, summarize, rank, pack, stats, or benchmark; quality is measured with expected-file evals.
123
+ - **Route**: read-only task map with relevant files, tests, rules, skills, commands, and warnings.
124
+ - **Pack**: budgeted context with `full`, `diff`, `symbols`, `skeleton`, or `summary` file views.
125
+ - **Act**: CLI, markdown, MCP, and agent integrations for Claude Code, Codex, Cursor, Windsurf, Antigravity, and generic agents.
126
+ - **Benchmark**: expected-file recall, token precision, miss diagnostics, public commit suites, and E2E A/B reports.
127
+ - **Local**: no cloud indexing, embeddings, or API calls for scan, summarize, rank, pack, stats, or benchmark.
152
128
 
153
129
  ## Benchmark Proof
154
130
 
155
- Latest public release gate: 8 real commits from Pallets Click, ItsDangerous, and MarkupSafe, scored against files actually changed by each commit.
131
+ Latest published v0.3.20 release table: 8 pinned public commits from Pallets
132
+ Click, ItsDangerous, and MarkupSafe, scored against files actually changed by
133
+ each commit. The public manifest now also supports 100+ sampled historical
134
+ commits across Python, TypeScript, Go, Java, and monorepo repos for broader
135
+ release runs.
156
136
 
157
137
  | Metric | Result |
158
138
  |---|---:|
@@ -161,18 +141,48 @@ Latest public release gate: 8 real commits from Pallets Click, ItsDangerous, and
161
141
  | Pack p50 | 1,450 tokens |
162
142
  | Pack p95 | 3,805 tokens |
163
143
 
164
- Full table: [`benchmarks/results/2026-05-27-public.md`](benchmarks/results/2026-05-27-public.md). This is public smoke proof, not a claim of universal ranking quality; expand cases for your own repo with `agentpack benchmark capture`.
144
+ Full v0.3.20 table: [`benchmarks/results/2026-06-11-public.md`](benchmarks/results/2026-06-11-public.md). This is scoped benchmark evidence, not a universal quality claim.
145
+ The expanded 109-case public suite is the current optimization baseline:
146
+ **57.0% recall / 50.6% token precision**. It is broader and harder than the
147
+ 8-case published table, and recall remains the active improvement target.
148
+ Reproduce the expanded public suite:
149
+
150
+ ```bash
151
+ agentpack benchmark --public-suite --reproduce v0.3.20
152
+ ```
153
+
154
+ Benchmark methodology lives under [`benchmarks/results/v0.3.20/`](benchmarks/results/v0.3.20/methodology.md).
155
+
156
+ ### Next Release Benchmark Target
157
+
158
+ The next benchmark release target is to raise the expanded public suite from the
159
+ current **57.0% recall / 50.6% token precision** baseline to **65%+ recall**
160
+ while keeping token precision at **50%+**. The target should be measured on the
161
+ same 100+ public historical-commit suite, with per-language slices published so
162
+ precision gains are not hiding TypeScript, Go, Java, or monorepo regressions.
163
+
164
+ Decision gate for the next public table:
165
+
166
+ - full-suite recall is at least 65.0%
167
+ - full-suite token precision is at least 50.0%
168
+ - no major language or task slice loses more than 2 recall points
169
+ - Vite/TypeScript, Gin/Go, and NestJS monorepo misses are reported separately
170
+ - any AgentPack-vs-no-AgentPack A/B claim includes task success, tool calls,
171
+ token cost, and time-to-first-correct-file
172
+
173
+ ## Trust
174
+
175
+ AgentPack is MIT licensed, local-first, and uses PyPI Trusted Publishing plus
176
+ npm provenance for release artifacts. See [`SECURITY.md`](SECURITY.md),
177
+ [`docs/privacy.md`](docs/privacy.md), [`docs/threat-model.md`](docs/threat-model.md),
178
+ and [`docs/data-flow.md`](docs/data-flow.md).
165
179
 
166
180
  ## Use Cases
167
181
 
168
- - [Claude Code context engine](docs/claude-code-context-engine.md)
169
- - [MCP context engine](docs/mcp-context-engine.md)
170
- - [Cursor context packing](docs/cursor-context-packing.md)
171
- - [AI coding agent context packing](docs/ai-coding-agent-context.md)
172
- - [Reduce Claude Code token usage](docs/reduce-claude-code-token-usage.md)
173
- - [AgentPack vs Repomix](docs/agentpack-vs-repomix.md)
174
- - [AgentPack vs Augment Context Engine](docs/agentpack-vs-augment-context-engine.md)
175
- - [Docs index](docs/index.md)
182
+ Start with the [docs index](docs/index.md), or jump to guides for
183
+ [Claude Code](docs/claude-code-context-engine.md), [MCP](docs/mcp-context-engine.md),
184
+ [Cursor](docs/cursor-context-packing.md), [token usage](docs/reduce-claude-code-token-usage.md),
185
+ and [how AgentPack works](docs/how-agentpack-works.md).
176
186
 
177
187
  ## Install
178
188
 
@@ -300,7 +310,7 @@ budget = 8000
300
310
  output = ".agentpack/context.md"
301
311
  ```
302
312
 
303
- Use `agentpack pack --mode lite` when you want a cheap ranked map before deeper file reads. Use `minimal`, `balanced`, or `deep` when you want progressively more file content in the generated pack.
313
+ Use `agentpack pack --mode lite` when you want a cheap ranked map before deeper file reads. Use the default `balanced` mode for normal agent work and benchmark claims. Use `deep` when the task needs broader docs and source context.
304
314
 
305
315
  Use `.agentignore` to remove generated output, vendored code, large exports, or files that repeatedly appear as ranking noise. AgentPack imports obvious generated/noisy entries from gitignore sources during init, but repository-specific outputs should still be added by hand.
306
316
 
@@ -417,18 +427,6 @@ THREAD=codex-local make context-thread
417
427
  AGENTPACK_THREAD_ID=codex-local make context-thread
418
428
  ```
419
429
 
420
- ## Benchmark Proof
421
-
422
- AgentPack is best treated as a ranked starting map. It can reduce repeated orientation work, but the agent and reviewer still own correctness.
423
-
424
- Use real repo evals instead of trusting compression numbers:
425
-
426
- ```bash
427
- agentpack benchmark --release-gate
428
- ```
429
-
430
- Current benchmark evidence is documented in [`benchmarks/README.md`](benchmarks/README.md) and the generated tables under `benchmarks/results/`. Treat these as scoped evidence for the included cases, not a universal performance claim.
431
-
432
430
  ## What A Pack Contains
433
431
 
434
432
  Rendered packs are meant to be readable by humans and directly useful to agents. A typical pack includes:
@@ -8,15 +8,17 @@
8
8
  [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
9
9
  [![CI](https://github.com/vishal2612200/agentpack/actions/workflows/ci.yml/badge.svg)](https://github.com/vishal2612200/agentpack/actions/workflows/ci.yml)
10
10
 
11
- **Local MCP context router for AI coding agents.**
11
+ **Local context router for AI coding agents.**
12
12
 
13
- Claude Code, Codex, Cursor, and other coding agents can waste tool calls rediscovering your repo before they make the edit you asked for.
13
+ AgentPack gives Claude Code, Codex, Cursor, and other coding agents a ranked starting map before they burn tool calls rediscovering your repo.
14
14
 
15
- AgentPack gives them a ranked map of likely relevant files, tests, rules, and skills for each task. It analyzes your repo locally and packages compact context for CLI and MCP workflows.
15
+ One workflow matters:
16
16
 
17
- How it works: AgentPack compresses repo context into ranked packs, caches scans/summaries/pack metadata for fast refreshes, and retrieves exact file or symbol blocks later when an agent needs more detail. Rendered packs also put stable instructions before volatile task, timestamp, git, and file sections so provider prompt-prefix caches can reuse the front of repeated refreshes. No cloud indexing, embeddings, or API calls are required for scan, summarize, rank, pack, stats, or benchmark.
17
+ ```text
18
+ route -> pack -> agent acts -> benchmark captures miss
19
+ ```
18
20
 
19
- Try the read-only task router without writing context files:
21
+ First route the task to likely files, tests, rules, and skills:
20
22
 
21
23
  ```bash
22
24
  pipx run --spec agentpack-cli agentpack route --task "fix auth token expiry"
@@ -24,94 +26,72 @@ pipx run --spec agentpack-cli agentpack route --task "fix auth token expiry"
24
26
 
25
27
  ![AgentPack route demo](docs/assets/agentpack-route-demo.svg)
26
28
 
27
- > **Status: alpha (v0.3.16).** Works, tested, and used in real sessions. Python and JavaScript/TypeScript are the best-supported languages. Current benchmarks are useful regression checks, not broad proof that AgentPack improves coding-agent success. API may change before 1.0.
29
+ > **Status: alpha (v0.3.21).** Works, tested, and used in real sessions. Python and JavaScript/TypeScript are the best-supported languages. Current benchmarks are useful regression checks, not broad proof that AgentPack improves coding-agent success. API may change before 1.0.
28
30
  >
29
31
  > **Platform note:** macOS, Linux, and Windows are supported. Windows support targets PowerShell plus Git for Windows. `cmd.exe` and bare Git setups are not a supported path yet.
30
32
  >
31
33
  > **Name note:** PyPI package is `agentpack-cli`, npm package is `@vishal2612200/agentpack`, and the command is `agentpack`. This project is unrelated to AgentPack dataset papers or other repos with the same name.
32
34
 
33
- ## What's New in 0.3.16
35
+ ## What's New in 0.3.21
34
36
 
35
- `0.3.16` bundles `watchdog` in normal installs so `agentpack watch` uses native
36
- filesystem events by default instead of polling after `pipx`, `pip`, or npm
37
- wrapper installation.
37
+ `0.3.21` is a benchmark trust release. It keeps the current honest expanded
38
+ public-suite baseline at **57.0% recall / 50.6% token precision**, removes the
39
+ legacy minimal-mode surface in favor of `balanced`, improves benchmark
40
+ diagnostics and public-suite methodology, and documents the next release target:
41
+ **65%+ recall while holding 50%+ token precision**.
38
42
 
39
- ## What's New in 0.3.15
43
+ ## Core Workflow
40
44
 
41
- AgentPack Router now recommends skills with stronger local signals: richer
42
- frontmatter, confidence thresholds, negative triggers, diversity-aware ranking,
43
- and a pull-based MCP `get_skill` flow. Skill benchmark cases can declare
44
- `expected_skills` and `avoid_skills`, and `agentpack skills feedback` records
45
- local outcome signals for future routing.
45
+ ### 1. Route
46
46
 
47
- ## What's New in 0.3.14
47
+ Use the read-only router when you want quick orientation without writing files:
48
48
 
49
- AgentPack Learn now covers both sides of AI-assisted development: the coding
50
- agent gets compact future-agent lessons, and the developer gets task-specific
51
- learning notes, skill evidence, and practice follow-up.
49
+ ```bash
50
+ agentpack route --task "fix auth token expiry"
51
+ ```
52
52
 
53
- - `agentpack learn --provider-command` adds an opt-in local provider bridge:
54
- AgentPack sends a bounded, redacted report JSON on stdin and accepts
55
- LearningReport-compatible JSON fields on stdout. No hosted service is called
56
- unless your command does it.
57
- - `agentpack learn --dashboard` writes a static
58
- `.agentpack/learning-dashboard.html` for IDE/browser review.
59
- - `agentpack learn --team-export` writes `.agentpack/team-lessons.md`, a
60
- shareable lesson file that omits personal skill history.
61
- - `agentpack learn --feedback`, `--skills`, and `--drills` close the loop from
62
- a task summary to skill memory and next-practice prompts.
63
- - `agentpack dev-check` and `agentpack release-check` now print bounded failure
64
- excerpts, so CI shows the failing test instead of only a red stage name.
53
+ ### 2. Pack
65
54
 
66
- ## Before vs After
55
+ ```bash
56
+ agentpack task set "fix auth token expiry"
57
+ agentpack pack --task auto
58
+ ```
67
59
 
68
- Without AgentPack, a cold coding-agent session often starts with manual repo orientation:
60
+ AgentPack writes `.agentpack/context.md` with selected files, omitted-file
61
+ receipts, task freshness, token stats, and suggested checks.
69
62
 
70
- ```text
71
- Task: fix auth token expiry
63
+ ### 3. Agent Acts
72
64
 
73
- Agent:
74
- - searches for auth files
75
- - opens nearby middleware and config
76
- - may miss related tests
77
- - spends early turns building a repo map
78
- ```
65
+ Point the agent at the pack or use MCP tools. Agent still verifies code before
66
+ editing; AgentPack is map, not correctness proof.
79
67
 
80
- With AgentPack:
68
+ ### 4. Benchmark Captures Miss
69
+
70
+ After a task, capture the files that actually changed:
81
71
 
82
72
  ```bash
83
- agentpack route --task "fix auth token expiry"
73
+ agentpack benchmark capture --since main --task "fix auth token expiry"
74
+ agentpack benchmark --misses
84
75
  ```
85
76
 
86
- ```text
87
- Task:
88
- fix auth token expiry
89
-
90
- Relevant files:
91
- - tests/test_auth.py
92
- - src/app/auth.py
93
- - src/app/users.py
94
-
95
- Suggested commands:
96
- - pytest tests/test_auth.py -q
97
- ```
77
+ Miss diagnostics show whether a required file was ignored, scored too low,
78
+ ranked but cut by budget, or absent from scan.
98
79
 
99
80
  ## Features
100
81
 
101
- - **Task-focused packing**: ranks files from git changes, task terms, symbols, imports, related tests, configs, churn, repo history, and deterministic offline summaries.
102
- - **Budget-aware compression**: emits `full`, `diff`, `symbols`, `skeleton`, or `summary` views instead of all-or-nothing file dumps.
103
- - **Rendered-token accounting and reserve buckets**: budgets against actual markdown while protecting changed files, tests, docs, and dependencies.
104
- - **Execution state**: optional task state files and git-derived fallback status show whether work is planned, in progress, blocked, done, committed, or committed but not pushed.
105
- - **Thread-scoped context**: explicit `--thread <id>` or `--thread auto` isolates task/context files for multiple agents in one repo and warns on same-branch file overlap.
106
- - **Task router**: MCP and CLI surfaces route a task to relevant files, scoped rules, installed skills, suggested commands, and safety warnings without executing skills automatically.
107
- - **Reversible registry and learning layer**: retrieves packed context by block ID, writes developer lessons, and feeds bounded selected-file miss feedback into future ranking.
108
- - **Runtime scorecard and output compression**: `perf --history` tracks activity, while `compress-output` preserves failures, paths, diffs, and search hits from noisy logs.
109
- - **Agent integrations**: installs Claude Code, Cursor, Windsurf, Codex, Antigravity, VS Code tasks, git hooks, and MCP configuration.
110
- - **Local and measurable**: no API calls for scan, summarize, rank, pack, stats, or benchmark; quality is measured with expected-file evals.
82
+ - **Route**: read-only task map with relevant files, tests, rules, skills, commands, and warnings.
83
+ - **Pack**: budgeted context with `full`, `diff`, `symbols`, `skeleton`, or `summary` file views.
84
+ - **Act**: CLI, markdown, MCP, and agent integrations for Claude Code, Codex, Cursor, Windsurf, Antigravity, and generic agents.
85
+ - **Benchmark**: expected-file recall, token precision, miss diagnostics, public commit suites, and E2E A/B reports.
86
+ - **Local**: no cloud indexing, embeddings, or API calls for scan, summarize, rank, pack, stats, or benchmark.
111
87
 
112
88
  ## Benchmark Proof
113
89
 
114
- Latest public release gate: 8 real commits from Pallets Click, ItsDangerous, and MarkupSafe, scored against files actually changed by each commit.
90
+ Latest published v0.3.20 release table: 8 pinned public commits from Pallets
91
+ Click, ItsDangerous, and MarkupSafe, scored against files actually changed by
92
+ each commit. The public manifest now also supports 100+ sampled historical
93
+ commits across Python, TypeScript, Go, Java, and monorepo repos for broader
94
+ release runs.
115
95
 
116
96
  | Metric | Result |
117
97
  |---|---:|
@@ -120,18 +100,48 @@ Latest public release gate: 8 real commits from Pallets Click, ItsDangerous, and
120
100
  | Pack p50 | 1,450 tokens |
121
101
  | Pack p95 | 3,805 tokens |
122
102
 
123
- Full table: [`benchmarks/results/2026-05-27-public.md`](benchmarks/results/2026-05-27-public.md). This is public smoke proof, not a claim of universal ranking quality; expand cases for your own repo with `agentpack benchmark capture`.
103
+ Full v0.3.20 table: [`benchmarks/results/2026-06-11-public.md`](benchmarks/results/2026-06-11-public.md). This is scoped benchmark evidence, not a universal quality claim.
104
+ The expanded 109-case public suite is the current optimization baseline:
105
+ **57.0% recall / 50.6% token precision**. It is broader and harder than the
106
+ 8-case published table, and recall remains the active improvement target.
107
+ Reproduce the expanded public suite:
108
+
109
+ ```bash
110
+ agentpack benchmark --public-suite --reproduce v0.3.20
111
+ ```
112
+
113
+ Benchmark methodology lives under [`benchmarks/results/v0.3.20/`](benchmarks/results/v0.3.20/methodology.md).
114
+
115
+ ### Next Release Benchmark Target
116
+
117
+ The next benchmark release target is to raise the expanded public suite from the
118
+ current **57.0% recall / 50.6% token precision** baseline to **65%+ recall**
119
+ while keeping token precision at **50%+**. The target should be measured on the
120
+ same 100+ public historical-commit suite, with per-language slices published so
121
+ precision gains are not hiding TypeScript, Go, Java, or monorepo regressions.
122
+
123
+ Decision gate for the next public table:
124
+
125
+ - full-suite recall is at least 65.0%
126
+ - full-suite token precision is at least 50.0%
127
+ - no major language or task slice loses more than 2 recall points
128
+ - Vite/TypeScript, Gin/Go, and NestJS monorepo misses are reported separately
129
+ - any AgentPack-vs-no-AgentPack A/B claim includes task success, tool calls,
130
+ token cost, and time-to-first-correct-file
131
+
132
+ ## Trust
133
+
134
+ AgentPack is MIT licensed, local-first, and uses PyPI Trusted Publishing plus
135
+ npm provenance for release artifacts. See [`SECURITY.md`](SECURITY.md),
136
+ [`docs/privacy.md`](docs/privacy.md), [`docs/threat-model.md`](docs/threat-model.md),
137
+ and [`docs/data-flow.md`](docs/data-flow.md).
124
138
 
125
139
  ## Use Cases
126
140
 
127
- - [Claude Code context engine](docs/claude-code-context-engine.md)
128
- - [MCP context engine](docs/mcp-context-engine.md)
129
- - [Cursor context packing](docs/cursor-context-packing.md)
130
- - [AI coding agent context packing](docs/ai-coding-agent-context.md)
131
- - [Reduce Claude Code token usage](docs/reduce-claude-code-token-usage.md)
132
- - [AgentPack vs Repomix](docs/agentpack-vs-repomix.md)
133
- - [AgentPack vs Augment Context Engine](docs/agentpack-vs-augment-context-engine.md)
134
- - [Docs index](docs/index.md)
141
+ Start with the [docs index](docs/index.md), or jump to guides for
142
+ [Claude Code](docs/claude-code-context-engine.md), [MCP](docs/mcp-context-engine.md),
143
+ [Cursor](docs/cursor-context-packing.md), [token usage](docs/reduce-claude-code-token-usage.md),
144
+ and [how AgentPack works](docs/how-agentpack-works.md).
135
145
 
136
146
  ## Install
137
147
 
@@ -259,7 +269,7 @@ budget = 8000
259
269
  output = ".agentpack/context.md"
260
270
  ```
261
271
 
262
- Use `agentpack pack --mode lite` when you want a cheap ranked map before deeper file reads. Use `minimal`, `balanced`, or `deep` when you want progressively more file content in the generated pack.
272
+ Use `agentpack pack --mode lite` when you want a cheap ranked map before deeper file reads. Use the default `balanced` mode for normal agent work and benchmark claims. Use `deep` when the task needs broader docs and source context.
263
273
 
264
274
  Use `.agentignore` to remove generated output, vendored code, large exports, or files that repeatedly appear as ranking noise. AgentPack imports obvious generated/noisy entries from gitignore sources during init, but repository-specific outputs should still be added by hand.
265
275
 
@@ -376,18 +386,6 @@ THREAD=codex-local make context-thread
376
386
  AGENTPACK_THREAD_ID=codex-local make context-thread
377
387
  ```
378
388
 
379
- ## Benchmark Proof
380
-
381
- AgentPack is best treated as a ranked starting map. It can reduce repeated orientation work, but the agent and reviewer still own correctness.
382
-
383
- Use real repo evals instead of trusting compression numbers:
384
-
385
- ```bash
386
- agentpack benchmark --release-gate
387
- ```
388
-
389
- Current benchmark evidence is documented in [`benchmarks/README.md`](benchmarks/README.md) and the generated tables under `benchmarks/results/`. Treat these as scoped evidence for the included cases, not a universal performance claim.
390
-
391
389
  ## What A Pack Contains
392
390
 
393
391
  Rendered packs are meant to be readable by humans and directly useful to agents. A typical pack includes:
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "agentpack-cli"
3
- version = "0.3.19"
3
+ version = "0.3.21"
4
4
  description = "Local MCP context router for Claude Code, Codex, Cursor, and AI coding agents."
5
5
  readme = "README.md"
6
6
  requires-python = ">=3.10"
@@ -1,3 +1,3 @@
1
1
  """AgentPack — task-aware context packing for AI coding agents."""
2
2
 
3
- __version__ = "0.3.19"
3
+ __version__ = "0.3.21"