npm - sentinelayer-cli - Versions diffs - 0.6.2 → 0.8.1 - Mend

sentinelayer-cli 0.6.2 → 0.8.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (280) hide show

package/README.md +1009 -996
package/bin/create-sentinelayer.js +5 -5
package/bin/sentinelayer-cli.js +4 -4
package/bin/sl.js +5 -5
package/package.json +64 -63
package/src/agents/ai-governance/index.js +12 -0
package/src/agents/ai-governance/tools/base.js +171 -0
package/src/agents/ai-governance/tools/eval-regression.js +47 -0
package/src/agents/ai-governance/tools/hitl-audit.js +81 -0
package/src/agents/ai-governance/tools/index.js +52 -0
package/src/agents/ai-governance/tools/prompt-drift.js +42 -0
package/src/agents/ai-governance/tools/provenance-check.js +69 -0
package/src/agents/backend/index.js +12 -0
package/src/agents/backend/tools/base.js +189 -0
package/src/agents/backend/tools/circuit-breaker-check.js +123 -0
package/src/agents/backend/tools/idempotency-audit.js +105 -0
package/src/agents/backend/tools/index.js +87 -0
package/src/agents/backend/tools/retry-audit.js +132 -0
package/src/agents/backend/tools/timeout-audit.js +144 -0
package/src/agents/code-quality/index.js +12 -0
package/src/agents/code-quality/tools/base.js +159 -0
package/src/agents/code-quality/tools/complexity-measure.js +197 -0
package/src/agents/code-quality/tools/coupling-analysis.js +81 -0
package/src/agents/code-quality/tools/cycle-detect.js +49 -0
package/src/agents/code-quality/tools/dep-graph.js +196 -0
package/src/agents/code-quality/tools/index.js +89 -0
package/src/agents/data-layer/index.js +12 -0
package/src/agents/data-layer/tools/base.js +181 -0
package/src/agents/data-layer/tools/index-audit.js +165 -0
package/src/agents/data-layer/tools/index.js +83 -0
package/src/agents/data-layer/tools/migration-scan.js +135 -0
package/src/agents/data-layer/tools/query-explain.js +120 -0
package/src/agents/data-layer/tools/tenancy-scan.js +166 -0
package/src/agents/documentation/index.js +12 -0
package/src/agents/documentation/tools/api-diff.js +91 -0
package/src/agents/documentation/tools/base.js +151 -0
package/src/agents/documentation/tools/dead-link-check.js +58 -0
package/src/agents/documentation/tools/docstring-coverage.js +78 -0
package/src/agents/documentation/tools/index.js +52 -0
package/src/agents/documentation/tools/readme-freshness.js +61 -0
package/src/agents/envelope/fix-cycle.js +45 -0
package/src/agents/envelope/index.js +31 -0
package/src/agents/envelope/loop.js +150 -0
package/src/agents/envelope/pulse.js +18 -0
package/src/agents/envelope/stream.js +40 -0
package/src/agents/infrastructure/index.js +12 -0
package/src/agents/infrastructure/tools/base.js +171 -0
package/src/agents/infrastructure/tools/checkov-run.js +32 -0
package/src/agents/infrastructure/tools/drift-detect.js +59 -0
package/src/agents/infrastructure/tools/iam-least-priv-check.js +78 -0
package/src/agents/infrastructure/tools/index.js +52 -0
package/src/agents/infrastructure/tools/tflint-run.js +31 -0
package/src/agents/jules/config/definition.js +160 -160
package/src/agents/jules/config/system-prompt.js +182 -182
package/src/agents/jules/error-intake.js +51 -51
package/src/agents/jules/fix-cycle.js +17 -17
package/src/agents/jules/loop.js +460 -450
package/src/agents/jules/pulse.js +10 -10
package/src/agents/jules/stream.js +187 -186
package/src/agents/jules/swarm/file-scanner.js +74 -74
package/src/agents/jules/swarm/index.js +11 -11
package/src/agents/jules/swarm/orchestrator.js +362 -362
package/src/agents/jules/swarm/pattern-hunter.js +123 -123
package/src/agents/jules/swarm/sub-agent.js +315 -309
package/src/agents/jules/tools/aidenid-email.js +189 -189
package/src/agents/jules/tools/auth-audit.js +1708 -1691
package/src/agents/jules/tools/dispatch.js +340 -335
package/src/agents/jules/tools/file-edit.js +2 -2
package/src/agents/jules/tools/file-read.js +2 -2
package/src/agents/jules/tools/frontend-analyze.js +570 -570
package/src/agents/jules/tools/glob.js +2 -2
package/src/agents/jules/tools/grep.js +2 -2
package/src/agents/jules/tools/index.js +29 -29
package/src/agents/jules/tools/path-guards.js +2 -2
package/src/agents/jules/tools/runtime-audit.js +507 -507
package/src/agents/jules/tools/shell.js +2 -2
package/src/agents/jules/tools/url-policy.js +100 -100
package/src/agents/mode.js +113 -0
package/src/agents/observability/index.js +12 -0
package/src/agents/observability/tools/alert-audit.js +39 -0
package/src/agents/observability/tools/base.js +181 -0
package/src/agents/observability/tools/dashboard-gap.js +42 -0
package/src/agents/observability/tools/index.js +54 -0
package/src/agents/observability/tools/log-schema-check.js +74 -0
package/src/agents/observability/tools/span-coverage.js +74 -0
package/src/agents/persona-visuals.js +102 -61
package/src/agents/release/index.js +12 -0
package/src/agents/release/tools/base.js +181 -0
package/src/agents/release/tools/changelog-diff.js +86 -0
package/src/agents/release/tools/feature-flag-audit.js +126 -0
package/src/agents/release/tools/index.js +61 -0
package/src/agents/release/tools/rollback-verify.js +129 -0
package/src/agents/release/tools/semver-check.js +109 -0
package/src/agents/reliability/index.js +12 -0
package/src/agents/reliability/tools/backpressure-check.js +129 -0
package/src/agents/reliability/tools/base.js +181 -0
package/src/agents/reliability/tools/chaos-probe.js +109 -0
package/src/agents/reliability/tools/graceful-degradation-check.js +114 -0
package/src/agents/reliability/tools/health-check-audit.js +111 -0
package/src/agents/reliability/tools/index.js +87 -0
package/src/agents/run-persona.js +109 -0
package/src/agents/security/index.js +12 -0
package/src/agents/security/tools/authz-audit.js +134 -0
package/src/agents/security/tools/base.js +190 -0
package/src/agents/security/tools/crypto-review.js +175 -0
package/src/agents/security/tools/index.js +97 -0
package/src/agents/security/tools/sast-scan.js +175 -0
package/src/agents/security/tools/secrets-scan.js +216 -0
package/src/agents/shared-tools/dispatch-core.js +320 -315
package/src/agents/shared-tools/file-edit.js +180 -180
package/src/agents/shared-tools/file-read.js +100 -100
package/src/agents/shared-tools/glob.js +168 -168
package/src/agents/shared-tools/grep.js +228 -228
package/src/agents/shared-tools/index.js +46 -46
package/src/agents/shared-tools/path-guards.js +161 -161
package/src/agents/shared-tools/shell.js +383 -383
package/src/agents/supply-chain/index.js +12 -0
package/src/agents/supply-chain/tools/attestation-check.js +42 -0
package/src/agents/supply-chain/tools/base.js +151 -0
package/src/agents/supply-chain/tools/index.js +52 -0
package/src/agents/supply-chain/tools/lockfile-integrity.js +73 -0
package/src/agents/supply-chain/tools/package-verify.js +56 -0
package/src/agents/supply-chain/tools/sbom-diff.js +34 -0
package/src/agents/testing/index.js +12 -0
package/src/agents/testing/tools/base.js +202 -0
package/src/agents/testing/tools/coverage-gap.js +144 -0
package/src/agents/testing/tools/flake-detect.js +125 -0
package/src/agents/testing/tools/index.js +85 -0
package/src/agents/testing/tools/mutation-test.js +143 -0
package/src/agents/testing/tools/snapshot-diff.js +103 -0
package/src/ai/aidenid.js +1021 -1009
package/src/ai/client.js +553 -553
package/src/ai/domain-target-store.js +268 -268
package/src/ai/identity-store.js +270 -270
package/src/ai/proxy.js +137 -137
package/src/ai/site-store.js +145 -145
package/src/audit/agents/architecture.js +180 -180
package/src/audit/agents/compliance.js +179 -179
package/src/audit/agents/documentation.js +165 -165
package/src/audit/agents/performance.js +145 -145
package/src/audit/agents/security.js +215 -215
package/src/audit/agents/testing.js +172 -172
package/src/audit/orchestrator.js +557 -557
package/src/audit/package.js +204 -204
package/src/audit/registry.js +284 -284
package/src/audit/replay.js +103 -103
package/src/auth/gate.js +428 -371
package/src/auth/http.js +681 -611
package/src/auth/service.js +1106 -1106
package/src/auth/session-store.js +813 -813
package/src/cli.js +257 -252
package/src/commands/ai/identity-lifecycle.js +1338 -1338
package/src/commands/ai/provision-governance.js +1272 -1272
package/src/commands/ai/shared.js +147 -147
package/src/commands/ai.js +11 -11
package/src/commands/apply.js +12 -12
package/src/commands/audit.js +1171 -1166
package/src/commands/auth.js +419 -419
package/src/commands/chat.js +184 -191
package/src/commands/config.js +184 -184
package/src/commands/cost.js +311 -311
package/src/commands/daemon/core.js +850 -850
package/src/commands/daemon/extended.js +1048 -1048
package/src/commands/daemon/shared.js +213 -213
package/src/commands/daemon.js +11 -11
package/src/commands/guide.js +174 -174
package/src/commands/ingest.js +58 -58
package/src/commands/init.js +55 -55
package/src/commands/legacy-args.js +20 -10
package/src/commands/mcp.js +461 -461
package/src/commands/omargate.js +63 -29
package/src/commands/persona.js +65 -20
package/src/commands/plugin.js +260 -260
package/src/commands/policy.js +132 -132
package/src/commands/prompt.js +238 -238
package/src/commands/review.js +704 -704
package/src/commands/scan.js +865 -872
package/src/commands/session.js +1238 -0
package/src/commands/spec.js +771 -716
package/src/commands/swarm.js +651 -651
package/src/commands/telemetry.js +202 -202
package/src/commands/watch.js +511 -511
package/src/config/agent-dictionary.js +182 -182
package/src/config/io.js +56 -56
package/src/config/paths.js +18 -18
package/src/config/schema.js +55 -55
package/src/config/service.js +184 -184
package/src/coord/events-log.js +141 -0
package/src/coord/handshake.js +719 -0
package/src/coord/index.js +35 -0
package/src/coord/paths.js +84 -0
package/src/coord/priority.js +62 -0
package/src/coord/tarjan.js +157 -0
package/src/cost/budget.js +235 -235
package/src/cost/history.js +188 -188
package/src/cost/tokenizer.js +160 -0
package/src/cost/tracker.js +232 -171
package/src/daemon/artifact-lineage.js +896 -534
package/src/daemon/assignment-ledger.js +1083 -770
package/src/daemon/ast-drift.js +496 -0
package/src/daemon/ast-parser-layer.js +258 -258
package/src/daemon/budget-governor.js +633 -633
package/src/daemon/callgraph-overlay.js +646 -646
package/src/daemon/error-worker.js +1209 -626
package/src/daemon/fix-cycle.js +384 -377
package/src/daemon/hybrid-mapper.js +929 -929
package/src/daemon/ingest-refresh.js +79 -11
package/src/daemon/jira-lifecycle.js +767 -632
package/src/daemon/operator-control.js +657 -657
package/src/daemon/pulse.js +327 -327
package/src/daemon/reliability-lane.js +471 -471
package/src/daemon/scope-engine.js +1068 -0
package/src/daemon/watchdog.js +971 -971
package/src/events/schema.js +190 -0
package/src/guide/generator.js +316 -316
package/src/ingest/engine.js +933 -918
package/src/ingest/ownership.js +380 -0
package/src/interactive/index.js +97 -97
package/src/legacy-cli.js +3228 -2994
package/src/mcp/registry.js +695 -695
package/src/memory/blackboard.js +301 -301
package/src/memory/retrieval.js +581 -581
package/src/orchestrator/kai-chen.js +126 -0
package/src/plugin/manifest.js +553 -553
package/src/policy/packs.js +144 -144
package/src/prompt/generator.js +136 -118
package/src/review/ai-review.js +672 -679
package/src/review/compliance-pack.js +389 -0
package/src/review/investor-dd-config.js +54 -0
package/src/review/investor-dd-file-loop.js +303 -0
package/src/review/investor-dd-file-router.js +406 -0
package/src/review/investor-dd-html-report.js +233 -0
package/src/review/investor-dd-notification.js +120 -0
package/src/review/investor-dd-orchestrator.js +405 -0
package/src/review/investor-dd-persona-runner.js +275 -0
package/src/review/live-validator.js +253 -0
package/src/review/local-review.js +1351 -1305
package/src/review/omargate-interactive.js +68 -68
package/src/review/omargate-orchestrator.js +492 -300
package/src/review/persona-prompts.js +484 -296
package/src/review/reconciliation-rules.js +329 -0
package/src/review/replay.js +235 -235
package/src/review/report.js +664 -664
package/src/review/reproducibility-chain.js +136 -0
package/src/review/scan-modes.js +147 -42
package/src/review/spec-binding.js +487 -487
package/src/scaffold/generator.js +67 -67
package/src/scaffold/templates.js +150 -150
package/src/scan/generator.js +418 -418
package/src/scan/gh-secrets.js +107 -107
package/src/session/agent-registry.js +359 -0
package/src/session/analytics.js +479 -0
package/src/session/daemon.js +1396 -0
package/src/session/file-locks.js +666 -0
package/src/session/paths.js +37 -0
package/src/session/recap.js +567 -0
package/src/session/redact.js +82 -0
package/src/session/runtime-bridge.js +762 -0
package/src/session/scoring.js +406 -0
package/src/session/setup-guides.js +304 -0
package/src/session/store.js +704 -0
package/src/session/stream.js +333 -0
package/src/session/sync.js +753 -0
package/src/session/tasks.js +1054 -0
package/src/session/templates.js +188 -0
package/src/spec/generator.js +619 -519
package/src/spec/regenerate.js +237 -237
package/src/spec/templates.js +91 -91
package/src/swarm/dashboard.js +247 -247
package/src/swarm/factory.js +363 -363
package/src/swarm/pentest.js +934 -934
package/src/swarm/registry.js +419 -419
package/src/swarm/report.js +158 -158
package/src/swarm/runtime.js +569 -576
package/src/swarm/scenario-dsl.js +272 -272
package/src/telemetry/ledger.js +302 -302
package/src/telemetry/session-tracker.js +234 -234
package/src/telemetry/sync.js +203 -203
package/src/ui/command-hints.js +13 -13
package/src/ui/markdown.js +220 -220

package/src/agents/testing/tools/coverage-gap.js ADDED Viewed

@@ -0,0 +1,144 @@
+// coverage-gap — find source files without a matching test file (#A15).
+//
+// Zero-dep static pass: we don't try to read c8 / istanbul coverage JSON
+// (that lives in a later PR). Instead we use filename-convention matching —
+// for every `src/foo/bar.ts`, check whether any of the standard test file
+// names exists. It misses some cases but catches the most valuable 80% of coverage gaps while
+// staying fast and self-contained.
+import path from "node:path";
+import { createFinding, isTestFile, toPosix, walkRepoFiles } from "./base.js";
+const SOURCE_EXTENSIONS = new Set([
+  ".js",
+  ".jsx",
+  ".ts",
+  ".tsx",
+  ".mjs",
+  ".cjs",
+  ".py",
+]);
+// Generate plausible test-file locations for a source file. For
+// src/foo/bar.ts, try tests/foo/bar.test.ts, src/foo/bar.test.ts,
+// __tests__/foo/bar.test.ts, tests/foo/test_bar.py (Python), …
+function candidateTestPaths(sourceRelativePath) {
+  const posix = toPosix(sourceRelativePath);
+  const ext = path.extname(posix).toLowerCase();
+  const base = posix.slice(0, posix.length - ext.length);
+  const fileName = path.posix.basename(base);
+  const dir = path.posix.dirname(base);
+  const candidates = new Set();
+  if (ext === ".py") {
+    candidates.add(`${dir}/${fileName}_test.py`);
+    candidates.add(`${dir}/test_${fileName}.py`);
+    candidates.add(`tests/${dir}/${fileName}_test.py`);
+    candidates.add(`tests/${dir}/test_${fileName}.py`);
+  } else {
+    const testExts = [ext, `.test${ext}`];
+    for (const testExt of testExts) {
+      candidates.add(`${base}.test${ext}`);
+      candidates.add(`${base}.spec${ext}`);
+      candidates.add(`${dir}/__tests__/${fileName}.test${ext}`);
+      candidates.add(`${dir}/__tests__/${fileName}${ext}`);
+      candidates.add(`tests/${base}.test${ext}`);
+      candidates.add(`tests/${dir}/${fileName}.test${ext}`);
+      candidates.add(`test/${dir}/${fileName}.test${ext}`);
+      candidates.add(`test/${dir}/${fileName}.spec${ext}`);
+      // mjs test convention: tests/unit.{name}.test.mjs
+      candidates.add(`tests/unit.${fileName}.test.mjs`);
+      candidates.add(`tests/unit.${fileName}.test.js`);
+    }
+  }
+  return candidates;
+}
+function isLikelyEntryFile(relativePath) {
+  const p = toPosix(relativePath);
+  return (
+    /(^|\/)(index|main)\.[jt]sx?$/.test(p) ||
+    /(^|\/)(bin|scripts)\//.test(p) ||
+    /(^|\/)cli\.[jt]s$/.test(p)
+  );
+}
+function isLikelyConfig(relativePath) {
+  const p = toPosix(relativePath);
+  return (
+    /(^|\/)(config|constants|types?|schema|\.d\.ts)(\.[jt]sx?)?$/.test(p) ||
+    /\.d\.ts$/.test(p)
+  );
+}
+export async function runCoverageGap({ rootPath, files = null } = {}) {
+  const resolvedRoot = path.resolve(String(rootPath || "."));
+  // Pass 1: walk the repo once, collect source + test file lists.
+  const sourceFiles = [];
+  const testFiles = new Set();
+  const iterator =
+    Array.isArray(files) && files.length > 0
+      ? iterateExplicitFiles(resolvedRoot, files)
+      : walkRepoFiles({ rootPath: resolvedRoot, extensions: SOURCE_EXTENSIONS });
+  for await (const { relativePath } of iterator) {
+    if (isTestFile(relativePath)) {
+      testFiles.add(toPosix(relativePath));
+      continue;
+    }
+    sourceFiles.push(toPosix(relativePath));
+  }
+  const findings = [];
+  for (const source of sourceFiles) {
+    if (isLikelyEntryFile(source) || isLikelyConfig(source)) {
+      continue;
+    }
+    const candidates = candidateTestPaths(source);
+    const covered = Array.from(testFiles).some((test) => {
+      for (const candidate of candidates) {
+        if (test === candidate || test.endsWith(`/${path.posix.basename(candidate)}`)) {
+          return true;
+        }
+      }
+      return false;
+    });
+    if (covered) {
+      continue;
+    }
+    findings.push(
+      createFinding({
+        tool: "coverage-gap",
+        kind: "testing.coverage-gap",
+        severity: "P2",
+        file: source,
+        line: 1,
+        evidence: `No test file found for source: ${source}`,
+        rootCause:
+          "Source file has no corresponding test under standard naming conventions (`*.test.*`, `*.spec.*`, `test_*.py`, `__tests__/…`).",
+        recommendedFix:
+          "Add a unit test covering the file's exports, or add an explicit `.notest` marker / coverage-ignore annotation if this file is intentionally untested.",
+        confidence: 0.6,
+      })
+    );
+  }
+  return findings;
+}
+async function* iterateExplicitFiles(resolvedRoot, files) {
+  for (const file of files) {
+    const trimmed = String(file || "").trim();
+    if (!trimmed) {
+      continue;
+    }
+    const fullPath = path.isAbsolute(trimmed)
+      ? trimmed
+      : path.join(resolvedRoot, trimmed);
+    const relativePath = path
+      .relative(resolvedRoot, fullPath)
+      .replace(/\\/g, "/");
+    yield { fullPath, relativePath };
+  }
+}

package/src/agents/testing/tools/flake-detect.js ADDED Viewed

@@ -0,0 +1,125 @@
+// flake-detect — flag flakiness smells in test files (#A15).
+//
+// The usual suspects: tests that sleep, rely on wall-clock arithmetic, hit
+// the real network, or seed randomness without a fixed seed. We scan test
+// files specifically (the coverage-gap heuristic for "is this a test") so
+// the tool doesn't flag production code that legitimately uses setTimeout.
+import fsp from "node:fs/promises";
+import path from "node:path";
+import { createFinding, findLineMatches, getLineContent, isTestFile, toPosix, walkRepoFiles } from "./base.js";
+const TEST_EXTENSIONS = new Set([
+  ".js",
+  ".jsx",
+  ".ts",
+  ".tsx",
+  ".mjs",
+  ".cjs",
+  ".py",
+]);
+const RULES = [
+  {
+    id: "flake.sleep-in-test",
+    // setTimeout(fn, 500) or sleep(2) in a test file — schedule-based flake
+    pattern: /\b(?:setTimeout|setInterval|sleep|time\.sleep|asyncio\.sleep)\s*\(\s*(?:\w+\s*,\s*)?\d{3,}\s*[,)]/,
+    severity: "P2",
+    rootCause:
+      "Test sleeps for a fixed wall-clock duration — slow on CI, flaky on loaded machines.",
+    recommendedFix:
+      "Use fake timers (jest.useFakeTimers, vi.useFakeTimers, freezegun) or event-based waits (await page.waitForSelector / waitForResponse).",
+    confidence: 0.7,
+  },
+  {
+    id: "flake.wall-clock-assertion",
+    pattern: /expect\s*\(\s*(?:Date\.now\(\)|new\s+Date\(\)\.getTime\(\))\s*\)/,
+    severity: "P1",
+    rootCause:
+      "Assertion compares against the live wall clock — value drifts between runs.",
+    recommendedFix:
+      "Freeze time (jest.setSystemTime, vi.setSystemTime, freezegun) or pass a Date supplier the SUT reads from.",
+    confidence: 0.8,
+  },
+  {
+    id: "flake.unstubbed-network",
+    // fetch / axios / requests in a test file — likely reaching out to real
+    // network. Real-network hits are the #1 flake source.
+    pattern: /\b(?:fetch|axios(?:\.[a-z]+)?|got(?:\.[a-z]+)?|requests\.(?:get|post|put|patch|delete|request))\s*\(/,
+    severity: "P1",
+    rootCause:
+      "Test makes a live network call. Real-network tests flake on DNS / TLS / rate limits and make CI unreliable.",
+    recommendedFix:
+      "Mock the client with msw / nock / vcr-py, or inject an HTTP transport and pass a fake in tests.",
+    confidence: 0.65,
+  },
+  {
+    id: "flake.unseeded-random",
+    pattern: /\b(?:Math\.random|random\.(?:random|uniform|shuffle|choice))\s*\(/,
+    severity: "P2",
+    rootCause:
+      "Test uses unseeded randomness — two runs can take different branches and produce different results.",
+    recommendedFix:
+      "Seed the generator or pass a stub random() into the SUT via DI. For Jest / Vitest you can mock Math.random.",
+    confidence: 0.55,
+  },
+];
+export async function runFlakeDetect({ rootPath, files = null } = {}) {
+  const resolvedRoot = path.resolve(String(rootPath || "."));
+  const iterator =
+    Array.isArray(files) && files.length > 0
+      ? iterateExplicitFiles(resolvedRoot, files)
+      : walkRepoFiles({ rootPath: resolvedRoot, extensions: TEST_EXTENSIONS });
+  const findings = [];
+  for await (const { fullPath, relativePath } of iterator) {
+    const relPos = toPosix(relativePath);
+    if (!isTestFile(relPos)) {
+      continue;
+    }
+    let content;
+    try {
+      content = await fsp.readFile(fullPath, "utf-8");
+    } catch {
+      continue;
+    }
+    for (const rule of RULES) {
+      for (const match of findLineMatches(content, rule.pattern)) {
+        findings.push(
+          createFinding({
+            tool: "flake-detect",
+            kind: rule.id,
+            severity: rule.severity,
+            file: relPos,
+            line: match.line,
+            evidence: getLineContent(content, match.line),
+            rootCause: rule.rootCause,
+            recommendedFix: rule.recommendedFix,
+            confidence: rule.confidence,
+          })
+        );
+      }
+    }
+  }
+  return findings;
+}
+async function* iterateExplicitFiles(resolvedRoot, files) {
+  for (const file of files) {
+    const trimmed = String(file || "").trim();
+    if (!trimmed) {
+      continue;
+    }
+    const fullPath = path.isAbsolute(trimmed)
+      ? trimmed
+      : path.join(resolvedRoot, trimmed);
+    const relativePath = path
+      .relative(resolvedRoot, fullPath)
+      .replace(/\\/g, "/");
+    yield { fullPath, relativePath };
+  }
+}
+export { RULES as FLAKE_RULES };

package/src/agents/testing/tools/index.js ADDED Viewed

@@ -0,0 +1,85 @@
+// Priya (testing persona) domain-tool registry (#A15).
+import { runCoverageGap } from "./coverage-gap.js";
+import { runFlakeDetect } from "./flake-detect.js";
+import { runMutationTest } from "./mutation-test.js";
+import { runSnapshotDiff } from "./snapshot-diff.js";
+export const TESTING_TOOLS = Object.freeze({
+  "coverage-gap": {
+    id: "coverage-gap",
+    description:
+      "Walk the repo and flag source files that have no matching test file under standard naming conventions (*.test.*, *.spec.*, test_*.py, __tests__/…).",
+    schema: {
+      type: "object",
+      properties: {
+        rootPath: { type: "string" },
+        files: { type: "array", items: { type: "string" } },
+      },
+    },
+    handler: runCoverageGap,
+  },
+  "flake-detect": {
+    id: "flake-detect",
+    description:
+      "Scan test files for flakiness smells: fixed-duration sleeps, wall-clock assertions, live network calls (fetch / axios / requests), unseeded randomness.",
+    schema: {
+      type: "object",
+      properties: {
+        rootPath: { type: "string" },
+        files: { type: "array", items: { type: "string" } },
+      },
+    },
+    handler: runFlakeDetect,
+  },
+  "snapshot-diff": {
+    id: "snapshot-diff",
+    description:
+      "Walk *.snap / *.ambr files and flag stale (> 90 days untouched) or oversized (> 64 KiB) snapshots.",
+    schema: {
+      type: "object",
+      properties: {
+        rootPath: { type: "string" },
+        staleDays: { type: "number" },
+        files: { type: "array", items: { type: "string" } },
+      },
+    },
+    handler: runSnapshotDiff,
+  },
+  "mutation-test": {
+    id: "mutation-test",
+    description:
+      "Configuration-check pass: verify Stryker / mutmut is wired up and the latest mutation report is fresh (< 30 days).",
+    schema: {
+      type: "object",
+      properties: { rootPath: { type: "string" } },
+    },
+    handler: runMutationTest,
+  },
+});
+export const TESTING_TOOL_IDS = Object.freeze(Object.keys(TESTING_TOOLS));
+export async function dispatchTestingTool(toolId, args = {}) {
+  const tool = TESTING_TOOLS[toolId];
+  if (!tool) {
+    throw new Error(`Unknown testing tool: ${toolId}`);
+  }
+  return tool.handler(args);
+}
+export async function runAllTestingTools({ rootPath, files = null } = {}) {
+  const findings = [];
+  for (const toolId of TESTING_TOOL_IDS) {
+    const out = await dispatchTestingTool(toolId, { rootPath, files });
+    findings.push(...out);
+  }
+  return findings;
+}
+export {
+  runCoverageGap,
+  runFlakeDetect,
+  runMutationTest,
+  runSnapshotDiff,
+};

package/src/agents/testing/tools/mutation-test.js ADDED Viewed

@@ -0,0 +1,143 @@
+// mutation-test — check for mutation-testing configuration (#A15).
+//
+// Priya wants mutation testing (Stryker / pitest / mutmut) as the ceiling
+// signal: do the tests actually assert anything, or is coverage a green
+// but empty number? True mutation runs are expensive — this tool ships as
+// a configuration check first (is Stryker wired up? is there an up-to-date
+// report?). The LLM / operator can dispatch a real run from the resulting
+// advisory.
+import fsp from "node:fs/promises";
+import path from "node:path";
+import { createFinding, toPosix } from "./base.js";
+const CONFIG_CANDIDATES = [
+  "stryker.conf.js",
+  "stryker.conf.cjs",
+  "stryker.conf.mjs",
+  "stryker.config.json",
+  ".stryker-tmp",
+  "setup.cfg", // Python mutmut section
+  "mutmut_config.py",
+  "pyproject.toml", // check for [tool.mutmut]
+];
+const REPORT_CANDIDATES = [
+  "reports/mutation/mutation.html",
+  "reports/mutation/mutation.json",
+  "mutmut_results.json",
+];
+const REPORT_FRESH_DAYS = 30;
+async function fileExists(fullPath) {
+  try {
+    const stat = await fsp.stat(fullPath);
+    return { exists: true, mtimeMs: Number(stat.mtimeMs || 0) };
+  } catch {
+    return { exists: false };
+  }
+}
+async function readTextIfExists(fullPath) {
+  try {
+    return await fsp.readFile(fullPath, "utf-8");
+  } catch {
+    return "";
+  }
+}
+export async function runMutationTest({ rootPath } = {}) {
+  const resolvedRoot = path.resolve(String(rootPath || "."));
+  const findings = [];
+  // Config presence check
+  let configFound = false;
+  for (const candidate of CONFIG_CANDIDATES) {
+    const fullPath = path.join(resolvedRoot, candidate);
+    const result = await fileExists(fullPath);
+    if (result.exists) {
+      if (candidate === "pyproject.toml" || candidate === "setup.cfg") {
+        const text = await readTextIfExists(fullPath);
+        if (!/\[tool\.mutmut\]|\[mutmut\]/.test(text)) {
+          continue;
+        }
+      }
+      configFound = true;
+      break;
+    }
+  }
+  if (!configFound) {
+    findings.push(
+      createFinding({
+        tool: "mutation-test",
+        kind: "testing.no-mutation-config",
+        severity: "P3",
+        file: toPosix("pyproject.toml"),
+        line: 0,
+        evidence: "No Stryker / mutmut / pitest configuration file found.",
+        rootCause:
+          "Without mutation testing, the test suite's assertions could be vacuous — 90% line coverage means nothing if the tests don't fail when the code changes.",
+        recommendedFix:
+          "Wire up @stryker-mutator/core (JS/TS) or mutmut (Python). Start with a single critical module and let the score guide new tests.",
+        confidence: 0.5,
+      })
+    );
+    return findings;
+  }
+  // Report freshness check
+  let reportFound = false;
+  let latestReport = 0;
+  for (const candidate of REPORT_CANDIDATES) {
+    const fullPath = path.join(resolvedRoot, candidate);
+    const result = await fileExists(fullPath);
+    if (result.exists) {
+      reportFound = true;
+      latestReport = Math.max(latestReport, result.mtimeMs);
+    }
+  }
+  if (!reportFound) {
+    findings.push(
+      createFinding({
+        tool: "mutation-test",
+        kind: "testing.no-mutation-report",
+        severity: "P3",
+        file: toPosix("reports/mutation/"),
+        line: 0,
+        evidence: "Stryker / mutmut config present but no mutation report on disk.",
+        rootCause:
+          "Config without a report suggests mutation testing is configured but not actually run.",
+        recommendedFix:
+          "Wire a mutation run into CI on a cadence (weekly is reasonable) so drift in assertion quality is visible.",
+        confidence: 0.55,
+      })
+    );
+    return findings;
+  }
+  const ageDays = Math.floor((Date.now() - latestReport) / (24 * 60 * 60 * 1000));
+  if (ageDays > REPORT_FRESH_DAYS) {
+    findings.push(
+      createFinding({
+        tool: "mutation-test",
+        kind: "testing.mutation-report-stale",
+        severity: "P3",
+        file: toPosix("reports/mutation/"),
+        line: 0,
+        evidence: `Latest mutation report is ${ageDays} days old (threshold ${REPORT_FRESH_DAYS})`,
+        rootCause:
+          "Stale mutation reports mean we're not actually watching assertion quality — drift goes undetected until it matters.",
+        recommendedFix:
+          "Schedule a recurring mutation job (weekly) and file an issue auto-generated from the diff vs. the prior run.",
+        confidence: 0.55,
+      })
+    );
+  }
+  return findings;
+}
+export { CONFIG_CANDIDATES, REPORT_CANDIDATES, REPORT_FRESH_DAYS };

package/src/agents/testing/tools/snapshot-diff.js ADDED Viewed

@@ -0,0 +1,103 @@
+// snapshot-diff — flag stale / oversized / obsolete snapshots (#A15).
+//
+// We walk *.snap files (Jest, including *.raw.snap) and *.ambr files (syrupy) and flag:
+//   1. Snapshots that haven't been touched in > STALE_DAYS days — stale
+//      values are a legitimate concern.
+//   2. Snapshots larger than LARGE_SIZE_BYTES — huge blobs are an anti-
+//      pattern (unreviewable diffs, hide regressions).
+//   3. Python doctest / pytest-snapshot *.ambr files that reference a
+//      stored block. Same staleness / size rules.
+//
+// We don't try to diff against the producing code — that's the job of the
+// test runner. We only flag maintenance smells.
+import path from "node:path";
+import { createFinding, toPosix, walkRepoFiles } from "./base.js";
+const SNAPSHOT_EXTENSIONS = new Set([
+  ".snap",
+  ".ambr",
+]);
+const STALE_DAYS = 90;
+const LARGE_SIZE_BYTES = 64 * 1024; // 64 KiB
+export async function runSnapshotDiff({ rootPath, files = null, staleDays = STALE_DAYS } = {}) {
+  const resolvedRoot = path.resolve(String(rootPath || "."));
+  const now = Date.now();
+  const staleThreshold = now - staleDays * 24 * 60 * 60 * 1000;
+  const iterator =
+    Array.isArray(files) && files.length > 0
+      ? iterateExplicitFiles(resolvedRoot, files)
+      : walkRepoFiles({ rootPath: resolvedRoot, extensions: SNAPSHOT_EXTENSIONS });
+  const findings = [];
+  for await (const { relativePath, stat } of iterator) {
+    const mtime = stat ? Number(stat.mtimeMs || 0) : 0;
+    const size = stat ? Number(stat.size || 0) : 0;
+    const rel = toPosix(relativePath);
+    if (mtime && mtime < staleThreshold) {
+      const days = Math.floor((now - mtime) / (24 * 60 * 60 * 1000));
+      findings.push(
+        createFinding({
+          tool: "snapshot-diff",
+          kind: "testing.snapshot-stale",
+          severity: "P3",
+          file: rel,
+          line: 0,
+          evidence: `Last modified ${days} days ago (threshold ${staleDays})`,
+          rootCause:
+            "Snapshot has been unchanged for longer than the staleness threshold — a stale snapshot can hide regressions silently.",
+          recommendedFix:
+            "Re-run the test suite with `--updateSnapshot` (or equivalent) after verifying the current output is actually correct. Delete if the underlying code has been removed.",
+          confidence: 0.5,
+        })
+      );
+    }
+    if (size > LARGE_SIZE_BYTES) {
+      findings.push(
+        createFinding({
+          tool: "snapshot-diff",
+          kind: "testing.snapshot-oversized",
+          severity: "P2",
+          file: rel,
+          line: 0,
+          evidence: `Snapshot is ${Math.round(size / 1024)} KiB (threshold ${Math.round(LARGE_SIZE_BYTES / 1024)} KiB)`,
+          rootCause:
+            "Oversized snapshots are unreviewable in PRs and hide meaningful regressions inside unrelated noise.",
+          recommendedFix:
+            "Split the snapshot into smaller focused tests, switch to a structural assertion, or mask non-essential fields (timestamps, IDs) before snapshotting.",
+          confidence: 0.7,
+        })
+      );
+    }
+  }
+  return findings;
+}
+async function* iterateExplicitFiles(resolvedRoot, files) {
+  const fsp = await import("node:fs/promises");
+  for (const file of files) {
+    const trimmed = String(file || "").trim();
+    if (!trimmed) {
+      continue;
+    }
+    const fullPath = path.isAbsolute(trimmed)
+      ? trimmed
+      : path.join(resolvedRoot, trimmed);
+    const relativePath = path
+      .relative(resolvedRoot, fullPath)
+      .replace(/\\/g, "/");
+    let stat = null;
+    try {
+      stat = await fsp.stat(fullPath);
+    } catch {
+      stat = null;
+    }
+    yield { fullPath, relativePath, stat };
+  }
+}
+export { LARGE_SIZE_BYTES, STALE_DAYS };