npm - agentsys - Versions diffs - 5.13.4 → 6.0.0 - Mend

agentsys 5.13.4 → 6.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (39) hide show

package/.claude-plugin/marketplace.json +28 -28
package/.claude-plugin/plugin.json +1 -1
package/.codex-plugin/plugin.json +2 -3
package/AGENTS.md +8 -8
package/CHANGELOG.md +34 -0
package/README.md +11 -116
package/lib/binary/index.js +8 -2
package/lib/binary/shared-helpers.js +160 -0
package/lib/collectors/codebase.js +7 -2
package/lib/collectors/documentation.js +8 -2
package/lib/enhance/agent-patterns.js +17 -4
package/lib/enhance/auto-suppression.js +19 -7
package/lib/enhance/cross-file-analyzer.js +11 -4
package/lib/enhance/docs-patterns.js +6 -2
package/lib/enhance/fixer.js +22 -5
package/lib/enhance/skill-patterns.js +5 -5
package/lib/index.js +2 -0
package/lib/repo-intel/cache.js +171 -0
package/lib/repo-intel/converter.js +130 -0
package/lib/repo-intel/embed/binary.js +242 -0
package/lib/repo-intel/embed/index.js +26 -0
package/lib/repo-intel/embed/orchestrator.js +239 -0
package/lib/repo-intel/embed/preference.js +136 -0
package/lib/repo-intel/enrich.js +198 -0
package/lib/repo-intel/index.js +370 -0
package/lib/repo-intel/installer.js +78 -0
package/lib/repo-intel/queries.js +213 -13
package/lib/repo-intel/updater.js +104 -0
package/lib/repo-map/index.js +19 -254
package/package.json +1 -1
package/scripts/generate-docs.js +13 -18
package/scripts/plugins.txt +2 -2
package/site/assets/js/main.js +5 -13
package/site/content.json +6 -23
package/site/index.html +29 -77
package/site/ux-spec.md +7 -7
package/.kiro/agents/web-session.json +0 -12
package/.kiro/skills/web-auth/SKILL.md +0 -177
package/.kiro/skills/web-browse/SKILL.md +0 -516

package/.claude-plugin/marketplace.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "agentsys",
-  "description": "24 specialized plugins for AI workflow automation - task orchestration, PR workflow, slop detection, code review, drift detection, enhancement analysis, documentation sync, unified static analysis, durable memory, negative behavior memory, skill and system prompt curation, perf investigations, topic research, agent config linting, cross-tool AI consultation, structured AI debate, workflow pattern learning, codebase onboarding, contributor guidance, and Zig language support",
-  "version": "5.13.4",
+  "description": "26 specialized plugins for AI workflow automation - task orchestration, PR workflow, slop detection, code review, drift detection, enhancement analysis, documentation sync, unified static analysis, durable memory, negative behavior memory, skill and system prompt curation, perf investigations, topic research, agent config linting, cross-tool AI consultation, structured AI debate, workflow pattern learning, codebase onboarding, contributor guidance, Zig language support, Mojo language support, and Ada/SPARK language support",
+  "version": "6.0.0",
   "owner": {
     "name": "Avi Fenesh",
     "url": "https://github.com/avifenesh"
@@ -198,19 +198,6 @@
       "category": "productivity",
       "homepage": "https://github.com/agent-sh/learn"
     },
-    {
-      "name": "axiom",
-      "source": {
-        "source": "url",
-        "url": "https://github.com/agent-sh/axiom.git",
-        "ref": "v0.6.1",
-        "commit": "ba77271a4ff7084d2d567cf3173204390be80f3b"
-      },
-      "description": "Personal agent-native knowledge base: load thin context, query durable memories, create project scaffolds, and propose approved records",
-      "version": "0.6.1",
-      "category": "productivity",
-      "homepage": "https://github.com/agent-sh/axiom"
-    },
     {
       "name": "banthis",
       "source": {
@@ -262,19 +249,6 @@
       "category": "productivity",
       "homepage": "https://github.com/agent-sh/debate"
     },
-    {
-      "name": "web-ctl",
-      "source": {
-        "source": "url",
-        "url": "https://github.com/agent-sh/web-ctl.git",
-        "commit": "345e44bc8a7b373728afce6c0d94ef067b5abc82",
-        "ref": "v1.1.0"
-      },
-      "description": "Browser automation and web testing toolkit for AI agents - headless browser control, persistent sessions, auth handoff, and prompt injection defense",
-      "version": "1.1.0",
-      "category": "automation",
-      "homepage": "https://github.com/agent-sh/web-ctl"
-    },
     {
       "name": "skillers",
       "source": {
@@ -325,6 +299,32 @@
       "version": "0.1.0",
       "category": "development",
       "homepage": "https://github.com/agent-sh/zig-lsp"
+    },
+    {
+      "name": "mojo",
+      "source": {
+        "source": "url",
+        "url": "https://github.com/agent-sh/mojo.git",
+        "ref": "v0.2.0",
+        "commit": "4d6f5fe71e03380f8532a0a8419903f4f548a587"
+      },
+      "description": "Teach agents to write idiomatic, correct, performant, current Mojo (v1.0.0b1) - syntax, ownership and CPU/memory optimization (copies, SIMD, vectorize/parallelize), GPU kernels (DeviceContext/LayoutTensor), and Mojo/Python interop; prevents stale pre-2025 syntax",
+      "version": "0.2.0",
+      "category": "development",
+      "homepage": "https://github.com/agent-sh/mojo"
+    },
+    {
+      "name": "ada-spark",
+      "source": {
+        "source": "url",
+        "url": "https://github.com/agent-sh/ada-spark.git",
+        "ref": "v0.1.0",
+        "commit": "d84e4efbd22165d3739dc5002c8385737637890c"
+      },
+      "description": "Teach agents to write idiomatic, correct, current Ada and SPARK (Ada 2022) - contracts (aspects, Pre'Class), the Alire ecosystem, SPARK proof (AoRTE, assurance levels, ownership/borrow), embedded (Ravenscar/Jorvik), and GNAT/GNAT SAS tooling; blocks stale pre-2022 advice (GNAT Community, pragma contracts, CodePeer)",
+      "version": "0.1.0",
+      "category": "development",
+      "homepage": "https://github.com/agent-sh/ada-spark"
     }
   ]
 }

package/.claude-plugin/plugin.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "agentsys",
-  "version": "5.13.4",
+  "version": "6.0.0",
   "description": "Professional-grade slash commands for Claude Code with cross-platform support",
   "keywords": [
     "workflow",

package/.codex-plugin/plugin.json CHANGED Viewed

@@ -4,8 +4,8 @@
   "skills": "./adapters/codex/skills",
   "interface": {
     "displayName": "agentsys",
-    "shortDescription": "AI agent orchestration with 45 skills and 49 agents",
-    "longDescription": "Professional-grade slash commands for AI-powered development workflows. Includes /next-task (task discovery to production), /axiom (durable agent memory), /banthis (negative behavior memory), /skill-curator and /system-prompt-curator (agent configuration curation), /ship (commit to deploy), /audit-project (multi-agent code review), /deslop (AI slop cleanup), /perf (performance investigation), /enhance (config analysis), /consult (cross-tool AI consultation), and more.",
+    "shortDescription": "AI agent orchestration with 44 skills and 49 agents",
+    "longDescription": "Professional-grade slash commands for AI-powered development workflows. Includes /next-task (task discovery to production), /banthis (negative behavior memory), /skill-curator and /system-prompt-curator (agent configuration curation), /ship (commit to deploy), /audit-project (multi-agent code review), /deslop (AI slop cleanup), /perf (performance investigation), /enhance (config analysis), /consult (cross-tool AI consultation), and more.",
     "developerName": "Avi Fenesh",
     "category": "developer-tools",
     "capabilities": [
@@ -20,7 +20,6 @@
     "websiteUrl": "https://agent-sh.github.io/agent-sh.dev/",
     "defaultPrompt": [
       "What should I work on next?",
-      "Load my durable Axiom context",
       "Review this codebase"
     ]
   }

package/AGENTS.md CHANGED Viewed

@@ -76,7 +76,7 @@
 <!-- GEN:START:claude-architecture -->
 ```
 lib/          → Shared library (vendored to plugins)
-plugins/      → 24 plugins, 49 agents (39 file-based + 10 role-based), 45 skills
+plugins/      → 24 plugins, 49 agents (39 file-based + 10 role-based), 44 skills
 adapters/     → Platform adapters (opencode-plugin/, opencode/, codex/)
 checklists/   → Action checklists (9 files)
 bin/cli.js    → npm CLI installer
@@ -93,21 +93,21 @@ bin/cli.js    → npm CLI installer
 | drift-detect | 1 | 1 | Plan drift detection |
 | enhance | 8 | 9 | Code quality analyzers |
 | sync-docs | 1 | 1 | Documentation sync |
-| repo-intel | 1 | 1 | Unified static analysis |
-| axiom | 0 | 1 | Durable agent-native memory |
+| repo-intel | 3 | 1 | Unified static analysis |
 | banthis | 0 | 1 | Durable negative behavior memory |
 | perf | 6 | 8 | Performance investigation |
 | learn | 1 | 1 | Topic research and learning guides |
-| agnix | 1 | 1 | Agent config linting |
+| agnix | 0 | 1 | Agent config linting |
 | consult | 1 | 1 | Cross-tool AI consultation |
 | debate | 1 | 1 | Multi-perspective debate analysis |
-| web-ctl | 1 | 2 | Browser automation for AI agents |
 | skill-curator | 0 | 1 | Skill authoring and review |
 | system-prompt-curator | 0 | 1 | System prompt curation |
 | skillers | 2 | 2 | Workflow pattern learning |
 | onboard | 1 | 1 | Codebase onboarding |
 | can-i-help | 1 | 1 | Contributor guidance |
 | zig-lsp | 0 | 0 |  |
+| mojo | 0 | 1 |  |
+| ada-spark | 0 | 1 |  |
 <!-- GEN:END:claude-architecture -->
 **Pattern**: `Command → Agent → Skill` (orchestration → invocation → implementation)
@@ -176,7 +176,7 @@ agentsys                # Run installer
 <agents>
 ## Agents
-49 agents across 24 plugins (18 have agents; gate-and-ship is commands-only; axiom, banthis, skill-curator, and system-prompt-curator are skill/command-only; zig-lsp is config-only with no commands or agents). Key agents by model:
+49 agents across 24 plugins (16 have agents; gate-and-ship is commands-only; banthis, skill-curator, system-prompt-curator, and agnix are skill/command-only; zig-lsp is config-only with no commands or agents; mojo and ada-spark are skill-only). Key agents by model:
 | Model | Agents | Use Case |
 |-------|--------|----------|
@@ -190,7 +190,7 @@ See [README.md](./README.md#command-details) and [docs/reference/AGENTS.md](./do
 <skills>
 ## Skills
-45 skills across plugins. Agents invoke skills for reusable implementation.
+44 skills across plugins. Agents invoke skills for reusable implementation.
 | Category | Key Skills |
 |----------|------------|
@@ -198,7 +198,7 @@ See [README.md](./README.md#command-details) and [docs/reference/AGENTS.md](./do
 | Enhancement | `enhance-*` (9 skills for plugins, agents, docs, prompts, hooks), `skill-curator`, `system-prompt-curator` |
 | Performance | `baseline`, `benchmark`, `profile`, `theory-tester` |
 | Cleanup | `deslop`, `sync-docs`, `drift-analysis`, `repo-intel` |
-| Memory | `axiom`, `banthis` |
+| Memory | `banthis` |
 See [README.md](./README.md#skills) for full skill list.
 </skills>

package/CHANGELOG.md CHANGED Viewed

@@ -9,6 +9,40 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 ## [Unreleased]
+## [6.0.0] - 2026-05-29
+### Removed
+- **BREAKING: Dropped the `axiom` and `web-ctl` plugins from the marketplace** (#365). Both repositories were retired; their marketplace entries, `plugins.txt` rows, `.kiro` mirrors (`web-auth`, `web-browse`, `web-session`), and all site/docs references were scrubbed. Installable plugin count is now 24 (was 26). Users who previously installed `axiom` or `web-ctl` from the marketplace must remove them; they will no longer resolve.
+### Added
+- **Unified `repo-intel` core library** synced from agent-core (#373). The vendored `lib/repo-intel/` now exposes a single surface that folds the former `repo-map` lifecycle and the embedder into one module: `init`/`update`/`status`/`load`/`loadRaw`/`exists`, typed `queries.*`, LLM-augmentation write-path (`applyDescriptors`/`applySummary`), and an opt-in `embed` submodule (orchestrator, preference, binary resolver) for semantic search and duplicate detection. `lib/repo-map` remains as a deprecated compatibility shim. `lib/index.js` now exports `repoIntel` alongside `repoMap`.
+### Fixed
+- `skill-patterns` `side_effect_without_disable` now accepts both the YAML boolean `true` and the quoted string `"true"` for `disable-model-invocation`, so a frontmatter value of `"true"` is no longer wrongly re-flagged.
+- Bounded 19 polynomial-ReDoS regexes and closed 2 prototype-pollution sinks across the synced `collectors`/`enhance` lib (match semantics preserved; verified by equivalence testing).
+- Removed the stale `aiRatio` query test - the analyzer dropped AI-authorship attribution and the query no longer exists (#372).
+## [5.14.0] - 2026-05-21
+### Added
+- Registered the `ada-spark` skill plugin (`agent-sh/ada-spark` v0.1.0, pinned `v0.1.0` / `d84e4ef`) in the marketplace. Teaches agents to write idiomatic, correct, current Ada and SPARK (Ada 2022) - contracts (aspects, `Pre'Class`), the Alire ecosystem, SPARK proof (AoRTE, assurance levels, ownership/borrow), embedded (Ravenscar/Jorvik), and GNAT/GNAT SAS tooling; blocks stale pre-2022 advice (GNAT Community, pragma contracts, CodePeer). Mapped to the `Languages` skill category.
+- Registered the `mojo` skill plugin (`agent-sh/mojo` v0.2.0, pinned `v0.2.0` / `4d6f5fe`) in the marketplace. Teaches agents to write idiomatic, current Mojo (v1.0.0b1) - syntax, ownership and CPU/memory optimization, GPU kernels, and Mojo/Python interop; prevents stale pre-2025 syntax. Mapped to the `Languages` skill category.
+### Changed
+- Synced plugin/skill count surfaces across `README.md`, `AGENTS.md`, `docs/reference/AGENTS.md`, `docs/ARCHITECTURE.md`, `docs/CROSS_PLATFORM.md`, `site/content.json`, `site/index.html`, and `site/ux-spec.md` for the two new language plugins: plugins `24 -> 26`, skills `45 -> 47` (agents unchanged at 50). Added `ada-spark` and `mojo` to `STATIC_PLUGIN_AGENT_COUNTS`, `CATEGORY_MAP`, and `STATIC_SKILLS` in `scripts/generate-docs.js`, and to `scripts/plugins.txt`.
+## [5.13.5] - 2026-05-18
+### Changed
+- Updated `axiom` marketplace pin to `v0.6.2`, which ships the `SessionStart` plugin hook (`hooks/hooks.json` + `hooks/session-start.mjs`), the read-only `axiom before-any --detect-only` mode, an OpenCode `session.created` plugin scaffold, and the `BeforeAnyError` library refactor.
+### Fixed
+- Synced agent / skill / test / rule counts across `README.md`, `AGENTS.md`, `docs/reference/AGENTS.md`, `.codex-plugin/plugin.json`, `site/content.json`, `site/ux-spec.md`, and `site/index.html`. File-based agent count corrected `39 → 40` (total `49 → 50`), test count refreshed `3,513 → 3,518`, agnix references refreshed `399 → 423` rules and `126 → 129` auto-fixable. Updated `STATIC_PLUGIN_AGENT_COUNTS` in `scripts/generate-docs.js`: `repo-intel 1 → 3`, `agnix 1 → 0`.
+- Updated the `/axiom` section in `README.md` to document the new SessionStart hook, `--detect-only` flag, Codex plugin-hooks opt-in (`[features].plugin_hooks = true`), and the OpenCode scaffold limitation pending [sst/opencode#5409](https://github.com/sst/opencode/issues/5409).
+### Tests
+- Updated `__tests__/marketplace-standalone-contract.test.js` to pin the `axiom` expected version, ref, and commit at `v0.6.2 / e3f3fab`.
 ## [5.13.4] - 2026-05-18
 ### Changed

package/README.md CHANGED Viewed

@@ -19,7 +19,7 @@
 </p>
 <p align="center">
-  <b>24 plugins · 49 agents · 45 skills (across all repos) · 30k lines of lib code · 3,513 tests · 5 platforms</b><br>
+  <b>24 plugins · 49 agents · 44 skills (across all repos) · 30k lines of lib code · 3,518 tests · 5 platforms</b><br>
   <em>Plugins distributed as standalone repos under <a href="https://github.com/agent-sh">agent-sh</a> org - agentsys is the marketplace &amp; installer</em>
 </p>
@@ -41,11 +41,11 @@
 AI models can write code. That's not the hard part anymore. The hard part is everything around it - task selection, branch management, code review, artifact cleanup, CI, PR comments, deployment. **AgentSys is the runtime that orchestrates agents to handle all of it** - structured pipelines, gated phases, specialized agents, and persistent state that survives session boundaries.
 ---
-> Building custom skills, agents, hooks, or MCP tools? [agnix](https://github.com/agent-sh/agnix) is the CLI + LSP linter that catches config errors before they fail silently - real-time IDE validation, auto suggestions, auto-fix, and 399 rules for Claude Code, Codex, OpenCode, Cursor, Kiro, Copilot, Gemini CLI, Cline, Windsurf, Roo Code, Amp, and more.
+> Building custom skills, agents, hooks, or MCP tools? [agnix](https://github.com/agent-sh/agnix) is the CLI + LSP linter that catches config errors before they fail silently - real-time IDE validation, auto suggestions, auto-fix, and 423 rules for Claude Code, Codex, OpenCode, Cursor, Kiro, Copilot, Gemini CLI, Cline, Windsurf, Roo Code, Amp, and more.
 ## What This Is
-An agent orchestration system - 24 plugins, 49 agents (39 file-based + 10 role-based specialists in audit-project), and 45 skills that compose into structured pipelines for software development. Each plugin lives in its own standalone repo under the [agent-sh](https://github.com/agent-sh) org. agentsys is the marketplace and installer that ties them together.
+An agent orchestration system - 24 plugins, 49 agents (39 file-based + 10 role-based specialists in audit-project), and 44 skills that compose into structured pipelines for software development. Each plugin lives in its own standalone repo under the [agent-sh](https://github.com/agent-sh) org. agentsys is the marketplace and installer that ties them together.
 Each agent has a single responsibility, a specific model assignment, and defined inputs/outputs. Pipelines enforce phase gates so agents can't skip steps. State persists across sessions so work survives interruptions.
@@ -118,9 +118,8 @@ The investment shifts from model spend to pipeline design. Better prompts, riche
 | [`/next-task`](#next-task) | Task workflow: discovery, implementation, PR, merge |
 | [`/prepare-delivery`](#prepare-delivery) | Pre-ship quality gates: deslop, review, validation, docs sync |
 | [`/gate-and-ship`](#gate-and-ship) | Quality gates then ship (/prepare-delivery + /ship) |
-| [`/axiom`](#axiom) | Durable memory: load, query, list, bootstrap projects, and record approved knowledge |
 | [`/banthis`](#banthis) | Durable negative memory: persist banned agent behaviors |
-| [`/agnix`](#agnix) | Lint agent configurations (399 rules) |
+| [`/agnix`](#agnix) | Lint agent configurations (423 rules) |
 | [`/ship`](#ship) | PR creation, CI monitoring, merge |
 | [`/deslop`](#deslop) | Clean AI slop patterns |
 | [`/perf`](#perf) | Performance investigation with baselines and profiling |
@@ -132,7 +131,6 @@ The investment shifts from model spend to pipeline design. Better prompts, riche
 | [`/learn`](#learn) | Research topics, create learning guides |
 | [`/consult`](#consult) | Cross-tool AI consultation |
 | [`/debate`](#debate) | Structured debate between AI tools |
-| [`/web-ctl`](#web-ctl) | Browser automation for AI agents |
 | [`/release`](#release) | Versioned release with ecosystem detection |
 | [`/skillers`](#skillers) | Workflow pattern learning and automation |
 | [`/skill-curator`](#skill-curator) | Create and improve reliable SKILL.md files |
@@ -146,7 +144,7 @@ Each command works standalone. Together, they compose into end-to-end pipelines.
 ## Skills
-45 skills included across the plugins:
+44 skills included across the plugins:
 | Category | Skills |
 |----------|--------|
@@ -158,10 +156,9 @@ Each command works standalone. Together, they compose into end-to-end pipelines.
 | **Code Review** | `audit-project` |
 | **AI Collaboration** | `consult`, `debate`, `learn`, `recommend`, `skillers-compact` |
 | **Onboarding** | `can-i-help`, `onboard` |
-| **Web** | `web-auth`, `web-browse` |
 | **Release** | `release` |
 | **Analysis** | `drift-analysis`, `repo-intel` |
-| **Memory** | `axiom`, `banthis` |
+| **Memory** | `banthis` |
 | **Linting** | `agnix` |
 **External skill plugins** (standalone repos, installed separately):
@@ -169,6 +166,8 @@ Each command works standalone. Together, they compose into end-to-end pipelines.
 | Category | Skills | Plugin |
 |----------|--------|--------|
 | **Message Queues** | `glide-mq`, `glide-mq-migrate-bullmq`, `glide-mq-migrate-bee` | [agent-sh/glidemq](https://github.com/agent-sh/glidemq) |
+| **Languages** | `mojo` | [agent-sh/mojo](https://github.com/agent-sh/mojo) |
+| **Languages** | `ada-spark` | [agent-sh/ada-spark](https://github.com/agent-sh/ada-spark) |
 Skills are the reusable implementation units. Agents invoke skills; commands orchestrate agents. When you install a plugin, its skills become available to all agents in that session.
@@ -181,7 +180,7 @@ Skills are the reusable implementation units. Agents invoke skills; commands orc
 | [The Approach](#the-approach) | Why it's built this way |
 | [Benchmarks](#benchmarks) | Sonnet + agentsys vs raw Opus |
 | [Commands](#commands) | All 24 commands overview |
-| [Skills](#skills) | 45 skills across plugins |
+| [Skills](#skills) | 44 skills across plugins |
 | [Skill-Only Plugins](#skill-only-plugins) | glide-mq and other non-command plugins |
 | [Command Details](#command-details) | Deep dive into each command |
 | [How Commands Work Together](#how-commands-work-together) | Standalone vs integrated |
@@ -312,35 +311,6 @@ Each piece runs independently - use `/prepare-delivery` alone to review before d
 ---
-### /axiom
-**Purpose:** Durable, queryable memory for agents. Load the smallest useful context, query project or global knowledge, and propose new records without bloating `AGENTS.md`.
-**[axiom](https://github.com/agent-sh/axiom)** is a standalone plugin and CLI. It creates a private `axiom-based` knowledge repo after explicit approval, keeps only thin context loaded automatically, and stores durable decisions, memories, preferences, and project notes in queryable files.
-**What it does:**
-| Command | Use |
-|---------|-----|
-| `axiom before-any --quiet` | Load global thin context at the start of meaningful work |
-| `axiom before-any --project <slug>` | Load project context and create missing project scaffolds |
-| `axiom query "<keyword>" --project <slug>` | Retrieve focused, source-backed project knowledge |
-| `axiom list --topics --project <slug>` | Explore what knowledge exists before querying |
-| `axiom record ...` | Propose a durable record through a temp clone, diff, and human approval |
-**Usage:**
-```bash
-/axiom before-any --quiet
-/axiom before-any --project flowfabric
-/axiom query "lease based" --project flowfabric
-/axiom record --project flowfabric --kind decision "Lease-based claiming v2" "We switched because it gives stronger safety during restarts."
-```
-**External tool:** Requires the [axiom CLI](https://github.com/agent-sh/axiom) from the plugin package.
----
 ### /banthis
 **Purpose:** Durable negative memory for repeated agent mistakes. Turn a user's "stop doing this" correction into a persistent rule in `CLAUDE.md` or `AGENTS.md`.
@@ -389,7 +359,7 @@ agnix catches these issues before they cause problems.
 | **Best Practices** | Tool restrictions, model selection, trigger phrase quality |
 | **Cross-Platform** | Compatibility across Claude Code, Codex, OpenCode, Cursor, Kiro, Copilot, Gemini CLI, Cline, Windsurf, Roo Code, Amp, and more |
-**399 validation rules** (126 auto-fixable) derived from:
+**423 validation rules** (129 auto-fixable) derived from:
 - Official tool specifications (Claude Code, Codex CLI, OpenCode, Cursor, Kiro, GitHub Copilot, Gemini CLI, Cline, Windsurf, Roo Code, Amp, and more)
 - Research papers on agent reliability and prompt injection
 - Real-world testing across 500+ repositories
@@ -895,81 +865,6 @@ agent-knowledge/
 **Agent:** debate-orchestrator (opus model for orchestration)
-### /web-ctl
-**Purpose:** Browser automation for AI agents - navigate, authenticate, and interact with web pages.
-**How it works:**
-Each invocation is a single Node.js process using Playwright. No daemon, no MCP server. Session state persists via Chrome's userDataDir with AES-256-GCM encrypted storage.
-```
-Agent calls skill -> node scripts/web-ctl.js <args> -> Playwright API -> JSON result
-```
-**Session lifecycle:**
-1. `session start <name>` - Create session (encrypted profile directory)
-2. `session auth <name> --url <login-url>` - Opens headed Chrome for human login (2FA, CAPTCHAs). Polls for success URL/selector, encrypts cookies on completion
-3. `run <name> <action>` - Headless actions using persisted cookies
-4. `session end <name>` - Cleanup
-**Actions:**
-| Action | Description | Key flag |
-|--------|-------------|----------|
-| `goto <url>` | Navigate to URL | |
-| `snapshot` | Get accessibility tree (primary page inspection) | |
-| `click <sel>` | Click element | `--wait-stable` |
-| `click-wait <sel>` | Click and wait for DOM + network stability | `--timeout <ms>` |
-| `type <sel> <text>` | Type with human-like delays | |
-| `read <sel>` | Read element text content | |
-| `fill <sel> <value>` | Clear field and set value | |
-| `wait <sel>` | Wait for element to appear | `--timeout <ms>` |
-| `evaluate <js>` | Execute JS in page context | `--allow-evaluate` |
-| `screenshot` | Full-page screenshot | `--path <file>` |
-| `network` | Capture network requests | `--filter <pattern>` |
-| `checkpoint` | Open headed browser for user (CAPTCHAs) | `--timeout <sec>` |
-`click-wait` waits for network idle + no DOM mutations for 500ms before returning. Cuts SPA interactions from multiple agent turns to one.
-**Error handling:**
-All errors return classified codes with actionable recovery suggestions:
-| Code | Recovery suggestion |
-|------|-------------------|
-| `element_not_found` | Snapshot included in response for selector discovery |
-| `timeout` | Increase `--timeout` |
-| `browser_closed` | `session start <name>` |
-| `network_error` | Check URL; verify cookies with `session status` |
-| `no_display` | Use `--vnc` flag |
-| `session_expired` | Re-authenticate |
-**Security:** Output sanitization (cookies/tokens redacted), prompt injection defense (`[PAGE_CONTENT: ...]` delimiters), AES-256-GCM encryption at rest, anti-bot measures (`webdriver=false`, random delays), read-only agent (no Write/Edit tools).
-**Selector syntax:** `role=button[name='Submit']`, `css=div.class`, `text=Click here`, `#id`
-**Usage:**
-```bash
-/web-ctl goto https://example.com
-/web-ctl auth twitter --url https://x.com/i/flow/login
-/web-ctl   # describe what you want to do, agent orchestrates it
-```
-**Install:**
-```bash
-agentsys install web-ctl
-npm install playwright
-npx playwright install chromium
-```
-**Agent:** web-session (sonnet model)
-**Skills:** web-auth (human-in-the-loop auth), web-browse (headless actions)
 ### /release
 > Versioned release with automatic ecosystem and tooling detection
@@ -1327,7 +1222,7 @@ The system is built on research, not guesswork.
 - Instruction following reliability
 **Testing:**
-- 3,513 tests passing
+- 3,518 tests passing
 - Drift-detect validated on 1,000+ repositories
 - E2E workflow testing across all commands
 - Cross-platform validation (Claude Code, OpenCode, Codex CLI, Cursor, Kiro)

package/lib/binary/index.js CHANGED Viewed

@@ -48,6 +48,12 @@ const { promisify } = require('util');
 const execFileAsync = promisify(cp.execFile);
+// repo-intel artifacts grow with history: a mature repo's JSON can exceed 20 MB
+// (agnix measured ~21 MB). Node's execFile default maxBuffer is 1 MB, which
+// silently fails init/update/query on any real repo with "stdout maxBuffer length
+// exceeded". Cap generously; callers can override via options.maxBuffer.
+const ANALYZER_MAX_BUFFER = 256 * 1024 * 1024;
 const { ANALYZER_MIN_VERSION, BINARY_NAME, GITHUB_REPO } = require('./version');
 const PLATFORM_MAP = {
@@ -957,7 +963,7 @@ function ensureBinarySync(options) {
  */
 function runAnalyzer(args, options) {
   const binPath = ensureBinarySync();
-  const opts = Object.assign({ encoding: 'utf8', windowsHide: true }, options);
+  const opts = Object.assign({ encoding: 'utf8', windowsHide: true, maxBuffer: ANALYZER_MAX_BUFFER }, options);
   if (!opts.stdio) opts.stdio = ['pipe', 'pipe', 'pipe'];
   const result = cp.execFileSync(binPath, args, opts);
   return typeof result === 'string' ? result : result.toString('utf8');
@@ -971,7 +977,7 @@ function runAnalyzer(args, options) {
  */
 async function runAnalyzerAsync(args, options) {
   const binPath = await ensureBinary();
-  const opts = Object.assign({ encoding: 'utf8', windowsHide: true }, options);
+  const opts = Object.assign({ encoding: 'utf8', windowsHide: true, maxBuffer: ANALYZER_MAX_BUFFER }, options);
   const result = await execFileAsync(binPath, args, opts);
   return result.stdout;
 }

package/lib/binary/shared-helpers.js ADDED Viewed

@@ -0,0 +1,160 @@
+'use strict';
+/**
+ * Shared HTTP + archive helpers used by both binary resolvers
+ * (`lib/binary/index.js` for `agent-analyzer`,
+ * `lib/repo-intel/embed/binary.js` for `agent-analyzer-embed`).
+ *
+ * Extracted to keep the two resolvers from drifting on HTTP redirect
+ * handling, GitHub auth, and archive extraction details — a single
+ * fix to e.g. the timeout policy or the redirect cap lands once and
+ * applies to both binaries.
+ *
+ * @module lib/binary/shared-helpers
+ */
+const fs = require('fs');
+const path = require('path');
+const os = require('os');
+const https = require('https');
+const cp = require('child_process');
+const DEFAULT_DOWNLOAD_TIMEOUT_MS = 30000;
+const MAX_REDIRECTS = 5;
+/**
+ * Fetch a URL into an in-memory Buffer following up to 5 redirects.
+ *
+ * Honors `GITHUB_TOKEN` / `GH_TOKEN` for authenticated requests
+ * (raises rate limit, lets private-repo asset URLs work). Stalled
+ * connections are killed by the per-request timeout — without this
+ * a stuck socket would hang the process indefinitely.
+ *
+ * @param {string} url
+ * @param {Object} [options]
+ * @param {string} [options.userAgent='agent-sh/binary-resolver']
+ * @param {number} [options.timeoutMs=30000] - per-request timeout
+ * @returns {Promise<Buffer>}
+ */
+function downloadToBuffer(url, options) {
+  const opts = options || {};
+  const userAgent = opts.userAgent || 'agent-sh/binary-resolver';
+  const timeoutMs = opts.timeoutMs || DEFAULT_DOWNLOAD_TIMEOUT_MS;
+  return new Promise(function (resolve, reject) {
+    const ghToken = process.env.GITHUB_TOKEN || process.env.GH_TOKEN;
+    function request(reqUrl, redirectCount) {
+      if (redirectCount > MAX_REDIRECTS) {
+        reject(new Error('Too many redirects fetching from ' + url));
+        return;
+      }
+      const headers = {
+        'User-Agent': userAgent,
+        'Accept': 'application/octet-stream'
+      };
+      if (ghToken) headers['Authorization'] = 'Bearer ' + ghToken;
+      const req = https.get(reqUrl, { headers: headers, timeout: timeoutMs }, function (res) {
+        const sc = res.statusCode;
+        if (sc === 301 || sc === 302 || sc === 307 || sc === 308) {
+          res.resume();
+          var loc = res.headers.location;
+          if (loc && !loc.startsWith('https://')) {
+            reject(new Error('Refusing non-HTTPS redirect to ' + loc));
+            return;
+          }
+          request(loc, redirectCount + 1);
+          return;
+        }
+        if (sc !== 200) {
+          res.resume();
+          const hint = sc === 403 ? ' (rate limited - set GITHUB_TOKEN env var)' : '';
+          reject(new Error('HTTP ' + sc + hint + ' fetching ' + reqUrl));
+          return;
+        }
+        const chunks = [];
+        res.on('data', function (chunk) { chunks.push(chunk); });
+        res.on('end', function () { resolve(Buffer.concat(chunks)); });
+        res.on('error', reject);
+      });
+      req.on('error', reject);
+      req.on('timeout', function () {
+        req.destroy();
+        reject(new Error('Timeout (' + timeoutMs + 'ms) fetching ' + reqUrl));
+      });
+    }
+    request(url, 0);
+  });
+}
+/**
+ * Extract a `.tar.gz` Buffer into `destDir` using the system `tar`.
+ * Available on Linux, macOS, and Windows (built into recent Win10/11).
+ *
+ * @param {Buffer} buf
+ * @param {string} destDir
+ * @returns {Promise<void>}
+ */
+function extractTarGz(buf, destDir) {
+  return new Promise(function (resolve, reject) {
+    const tarDest = process.platform === 'win32' ? destDir.replace(/\\/g, '/') : destDir;
+    const tar = cp.spawn('tar', ['xz', '-C', tarDest], {
+      stdio: ['pipe', 'pipe', 'pipe']
+    });
+    let stderr = '';
+    tar.stderr.on('data', function (d) { stderr += d; });
+    tar.stdin.write(buf);
+    tar.stdin.end();
+    tar.on('close', function (code) {
+      if (code !== 0) {
+        reject(new Error('tar extraction failed (code ' + code + '): ' + stderr));
+      } else {
+        resolve();
+      }
+    });
+    tar.on('error', reject);
+  });
+}
+/**
+ * Extract a `.zip` Buffer into `destDir` using PowerShell's
+ * `Expand-Archive` (Windows-only).
+ *
+ * @param {Buffer} buf
+ * @param {string} destDir
+ * @param {string} binaryName - used as the temp-dir prefix
+ * @returns {Promise<void>}
+ */
+function extractZip(buf, destDir, binaryName) {
+  return new Promise(function (resolve, reject) {
+    var tmpDir = fs.mkdtempSync(path.join(os.tmpdir(), binaryName + '-'));
+    var tmpZip = path.join(tmpDir, 'archive.zip');
+    fs.writeFileSync(tmpZip, buf);
+    var ps = cp.spawn(
+      'powershell',
+      ['-NoProfile', '-NonInteractive', '-Command',
+       'Expand-Archive', '-Path', tmpZip, '-DestinationPath', destDir, '-Force'],
+      { stdio: ['ignore', 'pipe', 'pipe'] }
+    );
+    var stderr = '';
+    ps.stderr.on('data', function (d) { stderr += d; });
+    ps.on('close', function (code) {
+      try { fs.rmSync(tmpDir, { recursive: true, force: true }); } catch (e) { /* ignore */ }
+      if (code !== 0) {
+        reject(new Error('zip extraction failed (code ' + code + '): ' + stderr));
+      } else {
+        resolve();
+      }
+    });
+    ps.on('error', reject);
+  });
+}
+module.exports = {
+  downloadToBuffer,
+  extractTarGz,
+  extractZip,
+  DEFAULT_DOWNLOAD_TIMEOUT_MS
+};

package/lib/collectors/codebase.js CHANGED Viewed

@@ -126,7 +126,10 @@ function extractSymbols(content) {
     symbols.functions.push(match[1]);
   }
-  const arrowPattern = /(?:const|let)\s+([a-zA-Z_$][a-zA-Z0-9_$]*)\s*=\s*(?:async\s*)?\([^)]*\)\s*=>/g;
+  // ReDoS fix: bound the unbounded \s* / async runs and the parameter list so the
+  // matcher cannot backtrack polynomially on pathological input. Bounds are large
+  // enough that all realistic source matches identically to the prior \s*/[^)]* form.
+  const arrowPattern = /(?:const|let)\s{1,1000}([a-zA-Z_$][a-zA-Z0-9_$]*)\s{0,1000}=\s{0,1000}(?:async\s{0,1000})?\([^)]{0,2000}\)\s{0,1000}=>/g;
   while ((match = arrowPattern.exec(content)) !== null) {
     symbols.functions.push(match[1]);
   }
@@ -141,7 +144,9 @@ function extractSymbols(content) {
     symbols.exports.push(match[1]);
   }
-  const moduleExportsPattern = /module\.exports\s*=\s*\{([^}]+)\}/;
+  // ReDoS fix: bound the \s* runs and capture length so the matcher stays linear;
+  // bounds exceed any realistic module.exports declaration so matches are unchanged.
+  const moduleExportsPattern = /module\.exports\s{0,1000}=\s{0,1000}\{([^}]{1,100000})\}/;
   const moduleMatch = content.match(moduleExportsPattern);
   if (moduleMatch) {
     const keys = moduleMatch[1].split(',').map(k => k.trim().split(':')[0].trim());