npm - @agents-forge/aiqa - Versions diffs - 1.0.0 - Mend

@agents-forge/aiqa 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (43)

package/CLAUDE.md +112 -0
package/README.md +281 -0
package/dist/agent.d.ts +41 -0
package/dist/agent.d.ts.map +1 -0
package/dist/agent.js +485 -0
package/dist/agent.js.map +1 -0
package/dist/cli.d.ts +13 -0
package/dist/cli.d.ts.map +1 -0
package/dist/cli.js +195 -0
package/dist/cli.js.map +1 -0
package/dist/config.d.ts +59 -0
package/dist/config.d.ts.map +1 -0
package/dist/config.js +53 -0
package/dist/config.js.map +1 -0
package/dist/index.d.ts +18 -0
package/dist/index.d.ts.map +1 -0
package/dist/index.js +15 -0
package/dist/index.js.map +1 -0
package/dist/session.d.ts +50 -0
package/dist/session.d.ts.map +1 -0
package/dist/session.js +99 -0
package/dist/session.js.map +1 -0
package/dist/subagents/analyst.d.ts +3 -0
package/dist/subagents/analyst.d.ts.map +1 -0
package/dist/subagents/analyst.js +96 -0
package/dist/subagents/analyst.js.map +1 -0
package/dist/subagents/qa-engineer.d.ts +4 -0
package/dist/subagents/qa-engineer.d.ts.map +1 -0
package/dist/subagents/qa-engineer.js +139 -0
package/dist/subagents/qa-engineer.js.map +1 -0
package/dist/subagents/qa-planner.d.ts +3 -0
package/dist/subagents/qa-planner.d.ts.map +1 -0
package/dist/subagents/qa-planner.js +69 -0
package/dist/subagents/qa-planner.js.map +1 -0
package/dist/subagents/qa-reporter.d.ts +4 -0
package/dist/subagents/qa-reporter.d.ts.map +1 -0
package/dist/subagents/qa-reporter.js +94 -0
package/dist/subagents/qa-reporter.js.map +1 -0
package/dist/subagents/qa-reviewer.d.ts +3 -0
package/dist/subagents/qa-reviewer.d.ts.map +1 -0
package/dist/subagents/qa-reviewer.js +97 -0
package/dist/subagents/qa-reviewer.js.map +1 -0
package/package.json +65 -0

package/CLAUDE.md ADDED Viewed

@@ -0,0 +1,112 @@
+# AIQA — Claude Code Instructions
+Single unified AI Quality Engineering Pipeline.
+One command. One Claude session. Full QA suite.
+## Install
+```bash
+npm install @agents-forge/aiqa
+npm install --save-dev @playwright/test
+npm install -g @playwright/cli@latest
+playwright-cli install --skills
+npx playwright install chromium
+```
+## Authentication (auto-detected)
+1. `ANTHROPIC_API_KEY` in `.env`
+2. `claude login`
+3. `gh auth login`
+## CLI Usage
+```bash
+# Full pipeline
+npx @agents-forge/aiqa https://www.saucedemo.com
+# Smoke tests only
+npx @agents-forge/aiqa https://my-app.com --grep @smoke
+# Skip review gate
+npx @agents-forge/aiqa https://my-app.com --skip qa-reviewer
+# Resume after crash
+npx @agents-forge/aiqa https://my-app.com --resume
+# Custom output dir
+npx @agents-forge/aiqa https://my-app.com --dir ./aiqa-output
+# Interactive — prompts for the URL + an optional existing requirements doc
+npx @agents-forge/aiqa
+# Bring your own requirements: drop a .md in .aiqa/requirements/ first, then run.
+# The analyst still explores AND merges your doc with the discovered requirements.
+npx @agents-forge/aiqa https://my-app.com
+```
+## Programmatic Usage
+```typescript
+import { runAIQA } from "@agents-forge/aiqa";
+await runAIQA({
+  target: "https://my-app.com",
+  grep: "@smoke",
+  skip: ["qa-reviewer"],
+  cwd: process.cwd(),
+  verbose: false,
+  resume: false,
+  existingRequirements: ".aiqa/requirements/my-existing-reqs.md", // optional — analyst merges it in
+});
+```
+## Configuration — aiqa.config.ts
+Drop an `aiqa.config.ts` (or .mjs/.js/.json) in the project root for defaults. CLI flags
+override it. Loaded via jiti (no build step).
+```typescript
+import { defineConfig } from "@agents-forge/aiqa";
+export default defineConfig({
+  url: "https://my-app.com",
+  model: "claude-sonnet-4-6",
+  skip: ["qa-reviewer"],
+  paths: { base: ".aiqa", reports: "reports", testScripts: "test-scripts" },
+});
+```
+## How it works
+One Claude session runs all 5 specialist roles:
+1. **analyst** — playwright-cli explores site, captures .aiqa/snapshots/*.yml → requirements.md (if an existing requirements .md is provided, it explores AND merges it in: Part A existing + Part B discovered)
+2. **qa-planner** — reads requirements + snapshots → test_plan.md (risk-aware)
+3. **qa-engineer** — snapshot-aware test generation → test-cases/*.md + tests/*.spec.ts
+4. **qa-reviewer** — validates selectors against snapshots → review_report.md
+5. **qa-reporter** — runs tests, captures failure snapshots → summary_report.md
+## Output files
+All artifacts live under `.aiqa/`; only `playwright.config.ts` is written to the repo root.
+```
+.aiqa/
+├── session.json              ← pipeline state (enables --resume)
+├── auth-state.json           ← saved login session (if any)
+├── snapshots/
+│   ├── home.yml              ← playwright-cli accessibility trees
+│   └── ...
+├── requirements/
+│   └── requirements.md
+├── test-plan/
+│   └── test_plan.md
+├── test-cases/
+│   ├── login.md
+│   └── checkout.md
+├── test-scripts/
+│   ├── login.spec.ts
+│   └── checkout.spec.ts
+└── reports/
+    ├── review_report.md
+    ├── summary_report.md
+    ├── test-results/         ← results.json, results.xml, traces, screenshots
+    └── playwright-report/    ← HTML report
+playwright.config.ts          ← at repo root (so `npx playwright test` finds it)
+```
+## Troubleshooting
+- `playwright-cli not found` → `npm install -g @playwright/cli@latest`
+- Pipeline crashed → `npx @agents-forge/aiqa <url> --resume`
+- Auth failed → set `ANTHROPIC_API_KEY` or `claude login`
+- Browser not installed → `npx playwright install chromium`

package/README.md ADDED Viewed

@@ -0,0 +1,281 @@
+# 🤖 AIQA — AI-Assisted Quality Engineering
+[![npm version](https://img.shields.io/npm/v/@agents-forge/aiqa.svg)](https://www.npmjs.com/package/@agents-forge/aiqa)
+One command. One Claude session. Full AI-assisted QA suite — requirements, test plan, test cases, Playwright scripts, a selector-validated review, and an execution report.
+```bash
+npx @agents-forge/aiqa https://www.yourwebsite.com
+```
+---
+## What makes this different
+AIQA is a **Super Agent** — a single Claude session that orchestrates five specialist **subagents**, not a chain of disconnected tools. The Super Agent holds the whole pipeline in one context, so insights and snapshots flow in memory from one subagent to the next:
+```
+            ┌──────────────────────────────────────────────┐
+            │            AIQA — Super Agent                 │
+            │        (one Claude session, shared memory)    │
+            └──────────────────────────────────────────────┘
+                                  │
+   analyst → qa-planner → qa-engineer → qa-reviewer → qa-reporter
+   └──────────────────── subagents ───────────────────────────┘
+```
+### The subagents
+| Subagent | Role | Output |
+|---|---|---|
+| **analyst** | Explores the site with playwright-cli, captures accessibility snapshots of every page | `requirements.md` |
+| **qa-planner** | Uses snapshots to assess real UI complexity and assign risk-based priorities | `test_plan.md` |
+| **qa-engineer** | Generates test cases + Playwright scripts using actual element refs — no guessing | `test-cases/`, `test-scripts/` |
+| **qa-reviewer** | Validates every selector in the specs against the captured snapshots | `review_report.md` |
+| **qa-reporter** | Runs the suite, captures failure snapshots, writes the stakeholder report | `summary_report.md` |
+Every subagent works against the same **playwright-cli accessibility snapshots** the analyst captured — so the test scripts reference real DOM elements, and the reviewer can flag any selector that doesn't exist in the ground-truth snapshots.
+> 📐 For a deep dive into how the Super Agent orchestrates the subagents, the runtime flow, and the key design decisions, see **[docs/architecture.md](docs/architecture.md)**.
+---
+## Install
+```bash
+npm install @agents-forge/aiqa
+npm install --save-dev @playwright/test
+npm install -g @playwright/cli@latest
+playwright-cli install --skills
+npx playwright install chromium
+```
+---
+## Authentication
+Auto-detected — no config needed:
+| Method | Setup |
+|---|---|
+| Anthropic API key | `ANTHROPIC_API_KEY=sk-ant-...` in `.env` |
+| Claude subscription | `npm install -g @anthropic-ai/claude-code` → `claude login` |
+| GitHub Copilot | `gh auth login` |
+---
+## Usage
+```bash
+# Full pipeline — all five subagents
+npx @agents-forge/aiqa https://my-app.com
+# Smoke tests only
+npx @agents-forge/aiqa https://my-app.com --grep @smoke
+# Regression suite, written to a custom dir
+npx @agents-forge/aiqa https://my-app.com --grep @regression --dir ./aiqa-output
+# Skip the review subagent
+npx @agents-forge/aiqa https://my-app.com --skip qa-reviewer
+# Resume after a crash
+npx @agents-forge/aiqa https://my-app.com --resume
+# Interactive — prompts for the URL and an optional existing requirements doc
+npx @agents-forge/aiqa
+# Unattended / CI — don't prompt before overwriting playwright.config.ts
+npx @agents-forge/aiqa https://my-app.com --force
+# Inside VS Code — open the generated docs in Markdown preview when done
+npx @agents-forge/aiqa https://my-app.com --open
+# Verbose mode
+npx @agents-forge/aiqa https://my-app.com --verbose
+```
+---
+## Bring your own requirements (optional)
+You can seed the pipeline with an existing requirements document — the analyst still
+explores the site and then **merges** the two, rather than skipping exploration:
+1. Drop your requirements **`.md`** file into **`.aiqa/requirements/`** (the folder is
+   created for you on first run).
+2. Run AIQA normally (or just `npx @agents-forge/aiqa` and answer the prompts).
+3. The analyst explores the URL, then writes `.aiqa/requirements/requirements.md` with two
+   clearly-labelled parts:
+   - **Part A — Existing Requirements** (carried over from your doc, tagged `[existing]`)
+   - **Part B — Newly Discovered Requirements** (the additions found by exploring, tagged `[discovered]`)
+Nothing from your document is dropped, and the merge happens automatically — no mid-run prompt.
+> **Naming:** your doc can have any name. If you happen to name it `requirements.md` (the
+> same as the generated output), AIQA preserves your copy as `existing-requirements.md`
+> first, then writes the merged result to `requirements.md` — so your original is never lost.
+---
+## ⚠️ Installed into an existing project?
+AIQA writes everything it generates under `.aiqa/`. The only file placed at your repo
+root is `playwright.config.ts` (so `npx playwright test` can auto-discover it). Since
+AIQA is typically run **inside an existing project**, the Super Agent guards that one file:
+- If a `playwright.config.ts` **already exists**, AIQA asks **once, before the run**,
+  whether it may overwrite it.
+- Decline, and your existing config is left untouched — the pipeline runs against it as-is.
+- In a non-interactive shell (CI, piped) it **never silently overwrites** — pass
+  `--force` (or `force: true`) to opt in.
+- Use `--dir <path>` to run the whole pipeline (and its `.aiqa/` folder) in a different directory.
+---
+## What it produces
+Everything lands under `.aiqa/` so your repo root stays clean — only
+`playwright.config.ts` is written to the root (so `npx playwright test` finds it):
+```
+.aiqa/
+├── session.json                  ← pipeline state (resumable)
+├── auth-state.json               ← saved login session (if any)
+├── snapshots/
+│   ├── home.yml                  ← accessibility trees (ground truth)
+│   ├── login.yml
+│   └── failure-<test>.yml        ← captured on test failure
+├── requirements/
+│   └── requirements.md           ← analyst subagent: business analysis
+├── test-plan/
+│   └── test_plan.md              ← qa-planner subagent: strategy + risk analysis
+├── test-cases/
+│   ├── login.md                  ← qa-engineer subagent: plain-English test cases
+│   └── checkout.md
+├── test-scripts/
+│   ├── login.spec.ts             ← qa-engineer subagent: Playwright scripts (snapshot-accurate)
+│   └── checkout.spec.ts
+└── reports/
+    ├── review_report.md          ← qa-reviewer subagent: selector validation + quality review
+    ├── summary_report.md         ← qa-reporter subagent: stakeholder report
+    ├── test-results/             ← results.json, results.xml, traces, failure screenshots
+    └── playwright-report/        ← Playwright HTML report (npx playwright show-report .aiqa/reports/playwright-report)
+playwright.config.ts              ← multi-browser config at repo root (overwrite-guarded)
+```
+---
+## Programmatic Usage
+```typescript
+import { runAIQA } from "@agents-forge/aiqa";
+const result = await runAIQA({
+  target: "https://my-app.com",
+  grep: "@smoke",
+  skip: ["qa-reviewer"],          // skip any subagent by name
+  cwd: "./aiqa-output",
+  resume: false,
+  force: false,                    // true = skip the playwright.config.ts overwrite prompt
+  open: false,                     // true = open the docs in VS Code Markdown preview
+  existingRequirements: ".aiqa/requirements/my-reqs.md", // optional — analyst merges it in
+  model: "claude-sonnet-4-6",      // optional — Claude model id
+  paths: { reports: "reports" },   // optional — override .aiqa folder names
+  verbose: false,
+});
+console.log(`Passed: ${result.passed}`);
+console.log(`Session: ${result.sessionFile}`);
+```
+---
+## Configuration — `aiqa.config.ts`
+Drop an `aiqa.config.ts` (or `.mjs` / `.js` / `.json`) in your project root to set
+defaults. **CLI flags override the config file, which overrides the built-in defaults.**
+Loaded at runtime via [jiti](https://github.com/unjs/jiti) — no build step.
+```typescript
+import { defineConfig } from "@agents-forge/aiqa";
+export default defineConfig({
+  // Run defaults (any of these is overridden by the matching CLI flag)
+  url: "https://my-app.com",
+  grep: "@smoke",
+  skip: ["qa-reviewer"],
+  open: true,
+  force: false,
+  // Model
+  model: "claude-sonnet-4-6",
+  // Rename the .aiqa base + subfolders to taste
+  paths: {
+    base: ".aiqa",
+    requirements: "requirements",
+    plan: "test-plan",
+    testCases: "test-cases",
+    testScripts: "test-scripts",
+    reports: "reports",
+  },
+});
+```
+`defineConfig()` is optional but gives you typed autocomplete. Folder renames flow
+everywhere automatically — including the generated `playwright.config.ts` paths.
+---
+## Skipping subagents
+Each stage is a subagent you can skip by name (`analyst`, `qa-planner`, `qa-engineer`, `qa-reviewer`, `qa-reporter`):
+```bash
+# Analysis + planning only (no tests)
+npx @agents-forge/aiqa https://my-app.com --skip qa-engineer,qa-reviewer,qa-reporter
+# Skip the review subagent
+npx @agents-forge/aiqa https://my-app.com --skip qa-reviewer
+# Write tests but don't run them (skip the reporter subagent)
+npx @agents-forge/aiqa https://my-app.com --skip qa-reporter
+```
+---
+## Resumable pipeline
+If the Super Agent crashes mid-run:
+```bash
+npx @agents-forge/aiqa https://my-app.com --resume
+```
+The session file at `.aiqa/session.json` tracks which subagents completed. On
+`--resume`, any subagent whose output already exists on disk is marked done and
+skipped, so the pipeline picks up where it left off.
+---
+## Troubleshooting
+| Error | Fix |
+|---|---|
+| `playwright-cli not found` | `npm install -g @playwright/cli@latest` |
+| `Browser not installed` | `npx playwright install chromium` |
+| `Authentication failed` | Set `ANTHROPIC_API_KEY` or run `claude login` |
+| Pipeline crashed | Re-run with `--resume` |
+| Won't overwrite my config in CI | Pass `--force` (non-interactive runs never overwrite `playwright.config.ts` silently) |
+| Want to preview docs in VS Code | Run inside VS Code with `--open` (opens requirements / test plan / summary in Markdown preview) |
+| Want to run tests interactively | `npx playwright test --ui` |
+---
+## License
+MIT

package/dist/agent.d.ts ADDED Viewed

@@ -0,0 +1,41 @@
+import { type AIQAPaths } from "./config.js";
+export interface AIQAInput {
+    target: string;
+    grep?: string;
+    skip?: Array<"analyst" | "qa-planner" | "qa-engineer" | "qa-reviewer" | "qa-reporter">;
+    cwd?: string;
+    verbose?: boolean;
+    resume?: boolean;
+    /**
+     * Skip the interactive confirmation before overwriting an existing
+     * playwright.config.ts in the consumer's project. Useful for CI / fully
+     * unattended runs. Defaults to false (prompt before overwriting).
+     */
+    force?: boolean;
+    /**
+     * Path to an existing requirements .md document (e.g. dropped into
+     * .aiqa/requirements/). When set, the analyst still explores the site and
+     * then MERGES this document with the newly discovered requirements.
+     */
+    existingRequirements?: string;
+    /**
+     * When true (and running inside VS Code with the `code` CLI on PATH), open the
+     * generated markdown deliverables in VS Code's Markdown preview after the run.
+     * Adds a '*.md → preview' association to the project's .vscode/settings.json.
+     */
+    open?: boolean;
+    /** Claude model id (e.g. "claude-sonnet-4-6"). From aiqa.config.ts. */
+    model?: string;
+    /** Override .aiqa base + subfolder names. From aiqa.config.ts. */
+    paths?: AIQAPaths;
+}
+export interface AIQAResult {
+    sessionFile: string;
+    outputs: Record<string, string>;
+    passed: boolean;
+    totalDuration: number;
+}
+export type Provider = "anthropic" | "copilot";
+export declare function detectProvider(): Provider;
+export declare function runAIQA(input: AIQAInput): Promise<AIQAResult>;
+//# sourceMappingURL=agent.d.ts.map

package/dist/agent.d.ts.map ADDED Viewed

@@ -0,0 +1 @@

+ {"version":3,"file":"agent.d.ts","sourceRoot":"","sources":["../src/agent.ts"],"names":[],"mappings":"AAMA,OAAO,EAAgB,KAAK,SAAS,EAAE,MAAM,aAAa,CAAC;AAS3D,MAAM,WAAW,SAAS;IACxB,MAAM,EAAE,MAAM,CAAC;IACf,IAAI,CAAC,EAAE,MAAM,CAAC;IACd,IAAI,CAAC,EAAE,KAAK,CAAC,SAAS,GAAG,YAAY,GAAG,aAAa,GAAG,aAAa,GAAG,aAAa,CAAC,CAAC;IACvF,GAAG,CAAC,EAAE,MAAM,CAAC;IACb,OAAO,CAAC,EAAE,OAAO,CAAC;IAClB,MAAM,CAAC,EAAE,OAAO,CAAC;IACjB;;;;OAIG;IACH,KAAK,CAAC,EAAE,OAAO,CAAC;IAChB;;;;OAIG;IACH,oBAAoB,CAAC,EAAE,MAAM,CAAC;IAC9B;;;;OAIG;IACH,IAAI,CAAC,EAAE,OAAO,CAAC;IACf,uEAAuE;IACvE,KAAK,CAAC,EAAE,MAAM,CAAC;IACf,kEAAkE;IAClE,KAAK,CAAC,EAAE,SAAS,CAAC;CACnB;AAED,MAAM,WAAW,UAAU;IACzB,WAAW,EAAE,MAAM,CAAC;IACpB,OAAO,EAAE,MAAM,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;IAChC,MAAM,EAAE,OAAO,CAAC;IAChB,aAAa,EAAE,MAAM,CAAC;CACvB;AAED,MAAM,MAAM,QAAQ,GAAG,WAAW,GAAG,SAAS,CAAC;AAI/C,wBAAgB,cAAc,IAAI,QAAQ,CAQzC;AAgSD,wBAAsB,OAAO,CAAC,KAAK,EAAE,SAAS,GAAG,OAAO,CAAC,UAAU,CAAC,CAkMnE"}