npm - @crown-dev-studios/review-council - Versions diffs - 0.1.0 - Mend

@crown-dev-studios/review-council 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (19) hide show

package/README.md +170 -0
package/SKILL.md +262 -0
package/dist/cli.js +9 -0
package/dist/interaction-queue.js +50 -0
package/dist/orchestrate-review-council.js +772 -0
package/dist/render-review-html.js +307 -0
package/dist/review-session.js +77 -0
package/dist/schemas.js +67 -0
package/dist/types.js +1 -0
package/package.json +48 -0
package/references/cli-integration.md +177 -0
package/references/output-contract.md +158 -0
package/schemas/judge-done.schema.json +48 -0
package/schemas/judge-verdict.schema.json +132 -0
package/schemas/review-done.schema.json +42 -0
package/schemas/review-findings.schema.json +114 -0
package/templates/judge.md +51 -0
package/templates/report.html +401 -0
package/templates/reviewer-export.md +50 -0

package/README.md ADDED Viewed

@@ -0,0 +1,170 @@
+# Review Council
+Review Council is a package-first CLI for multi-agent code review orchestration. It runs Claude, Codex, or other local reviewer CLIs against the same target, collects raw artifacts, runs a judge pass, and renders a static review bundle.
+Use it when you want:
+- side-by-side raw reviews before creating final todos
+- isolated reviewer runs or separate worktrees
+- a judge step that confirms, contests, or rejects findings
+- a static HTML report plus machine-readable JSON output
+## Status
+The orchestrator handles the happy path and common failure modes:
+- Stage timeouts with two-phase kill (SIGTERM then SIGKILL) prevent hung runs
+- Automatic retry with exponential backoff handles transient failures
+- Schema validation catches malformed reviewer and judge output
+- Interactive prompts from reviewer CLIs are detected and relayed to the user
+- Partial reviewer failure still allows the judge to run on available data
+- Failed stages surface stderr excerpts and validation errors in the HTML report
+## Requirements
+- Node.js 20+
+- `claude` and/or `codex` on `PATH`
+- a Git working tree to review
+- reviewer CLIs authenticated and able to run non-interactively when possible
+## Install
+Run it directly:
+```bash
+npx @crown-dev-studios/review-council --help
+```
+Other package install paths:
+```bash
+pnpm dlx @crown-dev-studios/review-council --help
+npm install -g @crown-dev-studios/review-council
+review-council --help
+```
+## Quick Start
+From the project root you want to review:
+```bash
+npx @crown-dev-studios/review-council \
+  --target "staged changes" \
+  --review-id staged-changes-review \
+  --claude-command 'claude -p --disable-slash-commands --permission-mode acceptEdits "$(cat "$CLAUDE_DIR/claude-review-export.md")" < /dev/null' \
+  --codex-command 'codex exec --sandbox workspace-write -o "$CODEX_DIR/last-message.txt" "$(cat "$CODEX_DIR/codex-review-export.md")"' \
+  --judge-command 'codex exec --sandbox workspace-write -o "$JUDGE_DIR/last-message.txt" "$(cat "$JUDGE_DIR/judge.md")"'
+```
+That writes a run bundle under `docs/reviews/<review-id>/runs/<run-id>/` in the project being reviewed. Pass `--review-id` explicitly when you want the same review to be easy to correlate across reruns.
+Main outputs:
+- `judge/summary.md`
+- `judge/verdict.json`
+- `bundle.json`
+- `index.html`
+## Skill Install
+Optional: install it as a slash-invocable skill by copying or symlinking this directory:
+```bash
+cp -R ~/src/review-council ~/.claude/skills/review-council
+cp -R ~/src/review-council ~/.codex/skills/review-council
+```
+The skill docs and the published package describe the same runtime: invoke `npx @crown-dev-studios/review-council ...` from the repo you want to review so outputs stay rooted in that caller repo.
+## CLI Options
+```
+--target <target>                 Review target label (required)
+--review-id <id>                  Stable review identifier
+--run-dir <dir>                   Output directory for this run
+--review-profile <id>             Reviewer prompt profile (default: default)
+--judge-profile <id>              Judge prompt profile (default: default)
+--claude-prompt-template <path>   Override Claude reviewer prompt template
+--codex-prompt-template <path>    Override Codex reviewer prompt template
+--judge-prompt-template <path>    Override judge prompt template
+--claude-command <command>        Shell command for the Claude reviewer
+--codex-command <command>         Shell command for the Codex reviewer
+--judge-command <command>         Shell command for the judge stage
+--allow-missing-sentinel          Treat exit code 0 as success without done.json
+--skip-judge                      Skip the judge stage
+--skip-html                       Skip HTML rendering
+--open-html                       Open index.html after rendering (macOS)
+--timeout <ms>                    Stage timeout in ms (default: 300000)
+--retries <n>                     Max retries per stage on failure (default: 2)
+```
+## Operating Notes
+- Use non-interactive reviewer commands when possible. Interactive prompts are detected and relayed to the user, but explicit non-interactive mode is more reliable.
+- Use `claude -p --disable-slash-commands --permission-mode acceptEdits ... < /dev/null` for Claude reviewer runs. This keeps the run in headless mode, disables skills, allows artifact writes into the stage directory without interactive approval prompts, and prevents Claude from waiting on stdin during fully non-interactive runs.
+- Codex reviewer and judge commands must run with a writable sandbox, for example `codex exec --sandbox workspace-write ...`, because they need to write review artifacts into the run directory.
+- `--skip-judge` disables judge prompt rendering, judge command validation, and judge execution.
+- Keep reviewer artifacts inside the run directory.
+- Every reviewer and judge JSON artifact should carry the same `review_id` and `run_id` as `run.json`.
+- Do not create authoritative files in `todos/` during raw review.
+- If you reuse `workflows-review`, run each reviewer in a separate worktree.
+## Failure Triage
+If a run fails or stalls, inspect:
+- `<run>/claude/status.json`
+- `<run>/codex/status.json`
+- `<run>/judge/status.json`
+- each stage's `stdout.log` and `stderr.log`
+The `status.json` for each stage includes `review_id`, `run_id`, `exit_code`, `timed_out`, `attempts`, `missing_artifacts`, `failure_reason`, and `validation_errors`. The HTML report surfaces missing artifacts, stderr excerpts, and validation errors for failed stages in a diagnostics section.
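+If a stage exits `0` but does not write `done.json`, the stage is incomplete and the run should be treated as failed, unless you passed `--allow-missing-sentinel`, which accepts exit code `0` as success without `done.json`.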
+## Development
+Contributor workflow from a source checkout:
+```bash
+cd ~/src/review-council
+pnpm install
+pnpm typecheck
+pnpm test
+```
+Package verification:
+```bash
+pnpm verify:package
+```
+That verification path:
+- builds `dist/`
+- inspects `npm pack --dry-run` output with a repo-local npm cache
+- installs the local tarball into a temporary caller repo
+- verifies `review-council --help` and a minimal end-to-end run
+First publish and post-publish checks:
+```bash
+pnpm release:manual
+npm view @crown-dev-studios/review-council version
+npx @crown-dev-studios/review-council --help
+```
+## Files
+- [SKILL.md](SKILL.md)
+- [references/cli-integration.md](references/cli-integration.md)
+- [references/output-contract.md](references/output-contract.md)
+- [src/cli.ts](src/cli.ts)
+- [src/orchestrate-review-council.ts](src/orchestrate-review-council.ts)
+- [src/render-review-html.ts](src/render-review-html.ts)
+- [src/interaction-queue.ts](src/interaction-queue.ts)
+- [src/review-session.ts](src/review-session.ts)
+- [src/schemas.ts](src/schemas.ts)
+- [src/types.ts](src/types.ts)
+- [test/package-smoke.test.mjs](test/package-smoke.test.mjs)
+- [test/validate-schema.test.ts](test/validate-schema.test.ts)

package/SKILL.md ADDED Viewed

@@ -0,0 +1,262 @@
+---
+name: review-council
+description: Orchestrate Claude, Codex, or other local CLI reviewers against the same target, wait for their exported findings, run a judge pass, and generate a static HTML plus markdown review bundle. Use when you want side-by-side raw reviews before creating final todos.
+argument-hint: [staged|branch main..HEAD|pr 123|commit abc123]
+disable-model-invocation: true
+---
+# Review Council
+## Purpose
+`/review-council` is the manual entrypoint for multi-agent code review orchestration.
+This directory is intended to be both a standalone skill repo and the source for the published npm package. The prompt templates, schemas, renderer, and orchestrator all live here.
+It is intentionally separate from `workflows-review`:
+- `workflows-review` is optimized for single-agent review and immediate todo creation
+- `review-council` is optimized for parallel raw review, adjudication, and artifact rendering
+Use this when you want:
+- a Claude review and a Codex review on the same target
+- isolated worktrees or isolated CLI runs per reviewer
+- raw reviewer artifacts stored outside `todos/`
+- a judge step that decides which findings are valid
+- a static HTML page next to the final markdown judge summary
+## Prerequisites
+- Node.js 20+
+- `claude` and/or `codex` on `PATH` for the stages you want to run
+- A Git working tree to review
+- Reviewer CLIs must already be authenticated and able to run non-interactively
+## Quick Start
+1. Put this directory somewhere stable, for example `~/src/review-council`.
+2. Optional: install it as a slash-invocable skill by copying or symlinking this directory to one or both skill locations:
+```bash
+cp -R ~/src/review-council ~/.claude/skills/review-council
+cp -R ~/src/review-council ~/.codex/skills/review-council
+```
+3. Review or customize the command templates in [cli-integration.md](references/cli-integration.md).
+No external `/review-export` command is required. The orchestrator renders self-contained prompt files into each stage directory before launching reviewer CLIs.
+4. From the project root you want to review, run the published CLI. By default it writes each run under `docs/reviews/<review-id>/runs/<run-id>/` in the current project:
+```bash
+npx @crown-dev-studios/review-council \
+  --target "staged changes" \
+  --review-id staged-changes-review \
+  --claude-command 'claude -p --disable-slash-commands --permission-mode acceptEdits "$(cat "$CLAUDE_DIR/claude-review-export.md")" < /dev/null' \
+  --codex-command 'codex exec --sandbox workspace-write -o "$CODEX_DIR/last-message.txt" "$(cat "$CODEX_DIR/codex-review-export.md")"' \
+  --judge-command 'codex exec --sandbox workspace-write -o "$JUDGE_DIR/last-message.txt" "$(cat "$JUDGE_DIR/judge.md")"' \
+  --timeout 300000 \
+  --retries 2
+```
+- `--timeout <ms>`: per-stage timeout (default 300000 — 5 minutes). On timeout the process receives SIGTERM, then SIGKILL after a 5-second grace period.
+- `--retries <n>`: max retries per stage on non-timeout failure (default 2). Uses exponential backoff starting at 2 seconds.
+- For Claude reviewer runs, use `claude -p --disable-slash-commands --permission-mode acceptEdits ... < /dev/null`. This keeps the run headless, disables skills, allows artifact writes into the stage directory without interactive approval prompts, and avoids stdin wait warnings.
+- When using Codex for reviewer or judge stages, include `--sandbox workspace-write` so it can write artifacts into the run directory.
+- `--skip-judge` disables judge prompt rendering, judge command validation, and judge execution.
+- Pass `--review-id` explicitly when you want the same review to be easy to correlate across reruns.
+If the package is already installed globally, `review-council --target ...` is equivalent.
+### Development from a Source Checkout
+The packaged CLI is the supported runtime. Contributor workflow remains source-first:
+```bash
+cd ~/src/review-council
+pnpm install
+pnpm typecheck
+pnpm test
+pnpm verify:package
+```
+A completed review run (with the judge and HTML stages enabled) produces:
+- `docs/reviews/<review-id>/runs/<run-id>/judge/summary.md`
+- `docs/reviews/<review-id>/runs/<run-id>/judge/verdict.json`
+- `docs/reviews/<review-id>/runs/<run-id>/bundle.json`
+- `docs/reviews/<review-id>/runs/<run-id>/index.html`
+### Example findings.json
+```json
+{
+  "review_id": "staged-changes-review",
+  "run_id": "20260318-143000123-abc12345",
+  "reviewer": "claude",
+  "target": "staged changes",
+  "generated_at": "2026-03-07T18:30:00Z",
+  "summary": "Found two issues: one SQL injection and one missing index.",
+  "findings": [
+    {
+      "id": "F001",
+      "title": "SQL injection in search endpoint",
+      "severity": "p1",
+      "confidence": "high",
+      "category": "security",
+      "description": "Unsanitized user input passed directly to raw SQL query.",
+      "evidence": "db.query(`SELECT * FROM users WHERE name = '${input}'`)",
+      "recommended_fix": "Use parameterized queries instead of string interpolation.",
+      "files": [
+        { "path": "src/routes/search.ts", "line": 42 }
+      ]
+    },
+    {
+      "id": "F002",
+      "title": "Missing index on users.email",
+      "severity": "p3",
+      "confidence": "medium",
+      "category": "performance",
+      "description": "The users.email column is queried frequently but has no index.",
+      "evidence": "Query plan shows sequential scan on users table.",
+      "recommended_fix": "Add a B-tree index on users.email.",
+      "files": [
+        { "path": "db/migrations/001_create_users.sql" }
+      ]
+    }
+  ]
+}
+```
+### Example verdict.json
+```json
+{
+  "review_id": "staged-changes-review",
+  "run_id": "20260318-143000123-abc12345",
+  "target": "staged changes",
+  "generated_at": "2026-03-07T18:45:00Z",
+  "overall_verdict": "needs-fixes",
+  "summary_markdown": "Two confirmed issues require attention before merge.",
+  "confirmed_findings": [
+    {
+      "title": "SQL injection in search endpoint",
+      "status": "confirmed",
+      "reason": "Both reviewers flagged unsanitized user input passed to raw query.",
+      "final_priority": "p1",
+      "reviewer_ids": ["claude", "codex"]
+    }
+  ],
+  "contested_findings": [
+    {
+      "title": "Missing index on users.email",
+      "status": "contested",
+      "reason": "Claude flagged as p2 but Codex noted the table has <1k rows.",
+      "final_priority": "p3",
+      "reviewer_ids": ["claude"]
+    }
+  ],
+  "rejected_findings": [
+    {
+      "title": "Unused import in helpers.ts",
+      "status": "rejected",
+      "reason": "Import is used in a type-only context; no runtime impact."
+    }
+  ],
+  "todo_recommendations": [
+    {
+      "title": "Parameterize search query to prevent SQL injection",
+      "priority": "p1",
+      "reason": "Confirmed by both reviewers as a security vulnerability."
+    }
+  ]
+}
+```
+## Workflow
+### Step 1: Choose the Review Target
+Normalize the target into one of these forms:
+- `staged changes`
+- `branch main..feature-branch`
+- `pr 123`
+- `commit abc123`
+### Step 2: Spawn Reviewer CLIs
+The parent agent is the orchestrator. It should not do the review itself.
+Its job is to:
+1. Create a run directory
+2. Spawn reviewer CLIs with explicit commands
+3. Wait for both reviewers to finish
+4. Confirm each reviewer wrote `done.json`
+5. Run the judge step
+6. Render HTML
+Use the environment variables documented in [cli-integration.md](references/cli-integration.md). Prefer the rendered stage prompt files under `$CLAUDE_DIR`, `$CODEX_DIR`, and `$JUDGE_DIR` over the source templates under `templates/`.
+### Step 3: Export Raw Reviewer Artifacts
+Each reviewer should write only raw artifacts:
+- `report.md`
+- `findings.json`
+- `done.json`
+Do not create authoritative todos during raw review.
+If you want to reuse the heuristics from `workflows-review`, copy its review bar and agent choices into the reviewer prompts, but stop before todo creation.
+### Step 4: Judge the Combined Result
+The judge reads both raw reviewer outputs and decides:
+- which findings are confirmed
+- which findings are contested
+- which findings are rejected
+- which findings are worth turning into final todos
+The judge writes:
+- `summary.md`
+- `verdict.json`
+- `done.json`
+### Step 5: Render the Reading View
+Render `index.html` after the judge completes.
+The HTML page should make these easy to scan:
+- judge summary
+- candidate findings from each reviewer
+- confirmed versus contested verdicts
+- raw markdown reports from Claude and Codex
+## Important Constraints
+- Do not run `workflows-review` twice in the same working tree if it will write directly to `todos/`
+- If you must reuse `workflows-review` unchanged, run each reviewer in a separate worktree so each run has its own local `todos/`
+- Keep final todo creation as a later, explicit step owned by the judge or a follow-up workflow
+- Interactive prompts from reviewer CLIs are detected and relayed to the user one at a time; explicit non-interactive commands such as `claude -p --disable-slash-commands --permission-mode acceptEdits < /dev/null` or `codex exec` remain the standard mode for raw review runs
+## Supporting Files
+- Output contract: [output-contract.md](references/output-contract.md)
+- CLI examples: [cli-integration.md](references/cli-integration.md)
+- Review schema: [review-findings.schema.json](schemas/review-findings.schema.json)
+- Judge schema: [judge-verdict.schema.json](schemas/judge-verdict.schema.json)
+- Reviewer template: [reviewer-export.md](templates/reviewer-export.md)
+- Judge template: [judge.md](templates/judge.md)
+- HTML template: [report.html](templates/report.html)
+- CLI entrypoint: [src/cli.ts](src/cli.ts)
+- Orchestrator runtime: [src/orchestrate-review-council.ts](src/orchestrate-review-council.ts)
+- Renderer: [src/render-review-html.ts](src/render-review-html.ts)
+- TypeScript package: [package.json](package.json)
+- TypeScript config: [tsconfig.json](tsconfig.json)

package/dist/cli.js ADDED Viewed

@@ -0,0 +1,9 @@
+#!/usr/bin/env node
+import { main } from "./orchestrate-review-council.js";
+try {
+    await main();
+}
+catch (error) {
+    console.error(error);
+    process.exit(1);
+}

package/dist/interaction-queue.js ADDED Viewed

@@ -0,0 +1,50 @@
+import { createInterface } from "node:readline";
+const queue = [];
+let processing = false;
+let readlineInterface = null;
+function getReadline() {
+    if (!readlineInterface) {
+        readlineInterface = createInterface({ input: process.stdin, output: process.stdout });
+    }
+    return readlineInterface;
+}
+function processNext() {
+    if (queue.length === 0) {
+        processing = false;
+        return;
+    }
+    processing = true;
+    const request = queue.shift();
+    if (!request) {
+        processing = false;
+        return;
+    }
+    const reader = getReadline();
+    process.stderr.write(`\n[${request.stage}] needs your input:\n${request.prompt}\n`);
+    reader.question("", (answer) => {
+        try {
+            request.stdinPipe.write(`${answer}\n`);
+        }
+        catch {
+            // The child process may exit before the response is written.
+        }
+        request.resolve();
+        processNext();
+    });
+}
+export function enqueue(request) {
+    queue.push(request);
+    if (!processing) {
+        processNext();
+    }
+}
+export function close() {
+    if (readlineInterface) {
+        readlineInterface.close();
+        readlineInterface = null;
+    }
+    processing = false;
+    for (const request of queue.splice(0)) {
+        request.resolve();
+    }
+}