npm - supipowers - Versions diffs - 1.5.3 → 2.0.0 - Mend

supipowers 1.5.3 → 2.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (340)

package/README.md +14 -8
package/bin/install.mjs +20 -5
package/bin/install.ts +95 -0
package/package.json +8 -4
package/skills/context-mode/SKILL.md +17 -10
package/skills/harness/SKILL.md +94 -0
package/skills/ui-design/SKILL.md +63 -0
package/skills/ui-design/sub-agent-templates/component-builder.md +29 -0
package/skills/ui-design/sub-agent-templates/design-critic.md +46 -0
package/skills/ui-design/sub-agent-templates/pencil/component-builder.md +29 -0
package/skills/ui-design/sub-agent-templates/pencil/design-critic.md +42 -0
package/skills/ui-design/sub-agent-templates/pencil/section-assembler.md +27 -0
package/skills/ui-design/sub-agent-templates/section-assembler.md +27 -0
package/skills/ultraplan-discover/SKILL.md +96 -0
package/skills/ultraplan-intake/SKILL.md +89 -0
package/skills/ultraplan-research/SKILL.md +129 -0
package/skills/ultraplan-review/SKILL.md +86 -0
package/skills/ultraplan-review-scope/SKILL.md +111 -0
package/skills/ultraplan-review-structure/SKILL.md +120 -0
package/skills/ultraplan-review-tdd/SKILL.md +142 -0
package/skills/ultraplan-scout/SKILL.md +110 -0
package/skills/ultraplan-synthesize/SKILL.md +124 -0
package/src/{quality/ai-session.ts → ai/final-message.ts} +27 -0
package/src/ai/schema-text.ts +129 -0
package/src/ai/structured-output.ts +274 -0
package/src/ai/template.ts +27 -0
package/src/bootstrap.ts +63 -28
package/src/commands/agents.ts +131 -42
package/src/commands/ai-review.ts +251 -30
package/src/commands/clear.ts +434 -0
package/src/commands/commit.ts +1 -0
package/src/commands/config.ts +242 -44
package/src/commands/context.ts +55 -28
package/src/commands/doctor.ts +234 -6
package/src/commands/fix-pr.ts +306 -131
package/src/commands/generate.ts +111 -21
package/src/commands/memory.ts +192 -0
package/src/commands/model-picker.ts +28 -21
package/src/commands/model.ts +18 -8
package/src/commands/optimize-context.ts +408 -29
package/src/commands/plan.ts +2 -0
package/src/commands/qa.ts +312 -137
package/src/commands/release.ts +259 -76
package/src/commands/review.ts +293 -59
package/src/commands/status.ts +200 -13
package/src/commands/supi.ts +3 -35
package/src/commands/ui-design.ts +394 -0
package/src/commands/ultraplan.ts +1518 -0
package/src/commands/update.ts +86 -0
package/src/config/defaults.ts +62 -0
package/src/config/loader.ts +448 -60
package/src/config/schema.ts +108 -2
package/src/context/optimizer.ts +25 -33
package/src/context/rule-renderer.ts +223 -0
package/src/context/savings.ts +258 -0
package/src/context/startup-check.ts +380 -0
package/src/context/startup-optimizer.ts +355 -0
package/src/context/tokenignore.ts +146 -0
package/src/context-mode/cache-handle.ts +49 -0
package/src/context-mode/cache-preview.ts +71 -0
package/src/context-mode/cache-store.ts +738 -0
package/src/context-mode/compressor.ts +131 -26
package/src/context-mode/dedup.ts +108 -0
package/src/context-mode/detector.ts +35 -4
package/src/context-mode/event-extractor.ts +14 -12
package/src/context-mode/event-store.ts +91 -36
package/src/context-mode/hooks.ts +798 -56
package/src/context-mode/knowledge/store.ts +255 -11
package/src/context-mode/memory-store.ts +325 -0
package/src/context-mode/metrics-recorder.ts +158 -0
package/src/context-mode/metrics-store.ts +765 -0
package/src/context-mode/model.ts +24 -0
package/src/context-mode/processor-keys.ts +29 -0
package/src/context-mode/processors/build.ts +66 -0
package/src/context-mode/processors/docker.ts +57 -0
package/src/context-mode/processors/git.ts +111 -0
package/src/context-mode/processors/json.ts +112 -0
package/src/context-mode/processors/k8s.ts +67 -0
package/src/context-mode/processors/lint.ts +67 -0
package/src/context-mode/processors/log.ts +86 -0
package/src/context-mode/processors/registry.ts +116 -0
package/src/context-mode/processors/test-runner.ts +102 -0
package/src/context-mode/processors/types.ts +20 -0
package/src/context-mode/repomap.ts +400 -0
package/src/context-mode/routing.ts +97 -24
package/src/context-mode/sandbox/runners.ts +5 -1
package/src/context-mode/snapshot-builder.ts +106 -11
package/src/context-mode/source-hash.ts +173 -0
package/src/context-mode/tool-name.ts +11 -0
package/src/context-mode/tools.ts +654 -22
package/src/context-mode/web/fetcher.ts +31 -12
package/src/debug/logger.ts +2 -1
package/src/deps/registry.ts +1 -1
package/src/discipline/failure-summarizer.ts +170 -0
package/src/discipline/failure-taxonomy.ts +131 -0
package/src/discipline/workflow-invariants.ts +125 -0
package/src/discovery/index.ts +31 -0
package/src/discovery/lsp.ts +87 -0
package/src/discovery/rank.ts +144 -0
package/src/discovery/sources.ts +89 -0
package/src/discovery/workflow.ts +87 -0
package/src/docs/contracts.ts +39 -0
package/src/docs/drift.ts +117 -87
package/src/fix-pr/assessment.ts +200 -0
package/src/fix-pr/contracts.ts +47 -0
package/src/fix-pr/fetch-comments.ts +80 -0
package/src/fix-pr/prompt-builder.ts +58 -40
package/src/fix-pr/scripts/exec.ts +34 -0
package/src/fix-pr/scripts/trigger-review.ts +106 -0
package/src/fix-pr/scripts/wait-and-check.ts +108 -0
package/src/fix-pr/types.ts +4 -0
package/src/git/branch-finish.ts +5 -0
package/src/git/commit-contract.ts +83 -0
package/src/git/commit.ts +121 -184
package/src/git/status.ts +62 -8
package/src/harness/anti_slop/architecture-parser.ts +210 -0
package/src/harness/anti_slop/backend-factory.ts +30 -0
package/src/harness/anti_slop/backend.ts +140 -0
package/src/harness/anti_slop/desloppify-adapter.ts +319 -0
package/src/harness/anti_slop/fallow-adapter.ts +305 -0
package/src/harness/anti_slop/installer.ts +227 -0
package/src/harness/anti_slop/queue.ts +216 -0
package/src/harness/anti_slop/recommend.ts +84 -0
package/src/harness/anti_slop/score.ts +180 -0
package/src/harness/anti_slop/synthetic-edit-test.ts +128 -0
package/src/harness/artifacts/agents-md.ts +88 -0
package/src/harness/artifacts/checks-wiring.ts +57 -0
package/src/harness/artifacts/docs-tree.ts +79 -0
package/src/harness/artifacts/lint-configs.ts +136 -0
package/src/harness/artifacts/review-agents.ts +67 -0
package/src/harness/bare-entry.ts +108 -0
package/src/harness/command.ts +1010 -0
package/src/harness/default-agents/design.md +23 -0
package/src/harness/default-agents/discover.md +18 -0
package/src/harness/default-agents/implement.md +24 -0
package/src/harness/default-agents/plan.md +19 -0
package/src/harness/default-agents/research.md +21 -0
package/src/harness/default-agents/validate.md +22 -0
package/src/harness/gc/reporter.ts +28 -0
package/src/harness/gc/runner.ts +136 -0
package/src/harness/hooks/layer-context-inject.ts +155 -0
package/src/harness/hooks/post-session-sweep.ts +130 -0
package/src/harness/hooks/pre-edit-dupe-probe.ts +224 -0
package/src/harness/hooks/register.ts +118 -0
package/src/harness/model.ts +117 -0
package/src/harness/pipeline.ts +348 -0
package/src/harness/project-paths.ts +235 -0
package/src/harness/stage-runner.ts +107 -0
package/src/harness/stages/design.ts +386 -0
package/src/harness/stages/discover.ts +454 -0
package/src/harness/stages/implement.ts +162 -0
package/src/harness/stages/plan.ts +335 -0
package/src/harness/stages/research.ts +263 -0
package/src/harness/stages/validate.ts +684 -0
package/src/harness/storage.ts +467 -0
package/src/harness/tools.ts +426 -0
package/src/lsp/bridge.ts +56 -95
package/src/lsp/capabilities.ts +108 -0
package/src/lsp/contracts.ts +35 -0
package/src/lsp/detector.ts +8 -12
package/src/markdown-frontmatter.ts +68 -0
package/src/mempalace/bridge.ts +129 -0
package/src/mempalace/config.ts +75 -0
package/src/mempalace/format.ts +163 -0
package/src/mempalace/hooks.ts +370 -0
package/src/mempalace/installer-helper.ts +194 -0
package/src/mempalace/python/mempalace_bridge.py +440 -0
package/src/mempalace/runtime.ts +565 -0
package/src/mempalace/schema.ts +264 -0
package/src/mempalace/session-summary.ts +198 -0
package/src/mempalace/tool.ts +186 -0
package/src/mempalace/uv.ts +256 -0
package/src/migrate/runner.ts +354 -0
package/src/planning/approval-flow.ts +206 -9
package/src/planning/plan-writer-prompt.ts +4 -3
package/src/planning/planning-ask-tool.ts +39 -0
package/src/planning/render-markdown.ts +74 -0
package/src/planning/spec.ts +42 -0
package/src/planning/system-prompt.ts +11 -8
package/src/planning/validate.ts +84 -0
package/src/platform/omp.ts +15 -2
package/src/platform/system-prompt.ts +37 -0
package/src/platform/test-utils.ts +3 -0
package/src/platform/types.ts +6 -1
package/src/qa/config.ts +12 -6
package/src/qa/detect-app-type.ts +13 -6
package/src/qa/matrix.ts +12 -6
package/src/qa/prompt-builder.ts +28 -30
package/src/qa/scripts/dev-server-utils.ts +72 -0
package/src/qa/scripts/run-e2e-tests.ts +226 -0
package/src/qa/scripts/start-dev-server.ts +138 -0
package/src/qa/scripts/stop-dev-server.ts +77 -0
package/src/qa/session.ts +13 -7
package/src/quality/ai-setup.ts +27 -25
package/src/quality/contracts.ts +34 -0
package/src/quality/gates/ai-review.ts +20 -58
package/src/quality/gates/command.ts +249 -46
package/src/quality/review-gates.ts +18 -2
package/src/quality/runner.ts +63 -22
package/src/quality/schemas.ts +37 -2
package/src/quality/setup.ts +96 -16
package/src/release/changelog.ts +1 -1
package/src/release/channels/custom.ts +13 -3
package/src/release/channels/types.ts +5 -0
package/src/release/contracts.ts +90 -0
package/src/release/executor.ts +122 -45
package/src/release/prompt.ts +18 -2
package/src/release/targets.ts +86 -0
package/src/release/version.ts +96 -71
package/src/review/agent-loader.ts +221 -109
package/src/review/fixer.ts +10 -6
package/src/review/multi-agent-runner.ts +114 -13
package/src/review/output.ts +12 -139
package/src/review/runner.ts +12 -6
package/src/review/scope.ts +144 -24
package/src/review/types.ts +1 -20
package/src/review/validator.ts +12 -6
package/src/storage/fix-pr-sessions.ts +21 -14
package/src/storage/plans.ts +14 -5
package/src/storage/qa-sessions.ts +25 -19
package/src/storage/reliability-metrics.ts +180 -0
package/src/storage/reports.ts +8 -7
package/src/storage/review-sessions.ts +55 -20
package/src/tool-catalog/active-tool-controller.ts +164 -0
package/src/tool-catalog/active-tool-planner.ts +212 -0
package/src/tool-catalog/tool-groups.ts +102 -0
package/src/types.ts +1399 -5
package/src/ui-design/backend-adapter.ts +78 -0
package/src/ui-design/backends/local-html.ts +82 -0
package/src/ui-design/backends/pencil-mcp.ts +111 -0
package/src/ui-design/components-scanner.ts +124 -0
package/src/ui-design/config.ts +55 -0
package/src/ui-design/pen-scanner.ts +95 -0
package/src/ui-design/pen-selector.ts +72 -0
package/src/ui-design/prompt-builder.ts +73 -0
package/src/ui-design/scanner.ts +136 -0
package/src/ui-design/session.ts +974 -0
package/src/ui-design/system-prompt.ts +312 -0
package/src/ui-design/tokens-scanner.ts +181 -0
package/src/ui-design/types.ts +96 -0
package/src/ultraplan/agent-catalog.ts +522 -0
package/src/ultraplan/authoring/agent-catalog.ts +310 -0
package/src/ultraplan/authoring/authoring-tools.ts +552 -0
package/src/ultraplan/authoring/command-handlers.ts +339 -0
package/src/ultraplan/authoring/markdown.ts +510 -0
package/src/ultraplan/authoring/model.ts +162 -0
package/src/ultraplan/authoring/pipeline.ts +319 -0
package/src/ultraplan/authoring/stage-runner.ts +141 -0
package/src/ultraplan/authoring/stages/approve.ts +249 -0
package/src/ultraplan/authoring/stages/discover.ts +289 -0
package/src/ultraplan/authoring/stages/intake.ts +203 -0
package/src/ultraplan/authoring/stages/research.ts +399 -0
package/src/ultraplan/authoring/stages/review.ts +333 -0
package/src/ultraplan/authoring/stages/scout.ts +188 -0
package/src/ultraplan/authoring/stages/synthesize.ts +348 -0
package/src/ultraplan/authoring/storage.ts +594 -0
package/src/ultraplan/authoring/synth-gate.ts +165 -0
package/src/ultraplan/authoring-draft.ts +653 -0
package/src/ultraplan/authoring-persist.ts +180 -0
package/src/ultraplan/authoring-tool.ts +608 -0
package/src/ultraplan/authoring-wizard.ts +587 -0
package/src/ultraplan/batch/merge.ts +98 -0
package/src/ultraplan/batch/planner.ts +150 -0
package/src/ultraplan/batch/presenter.ts +97 -0
package/src/ultraplan/batch/storage.ts +420 -0
package/src/ultraplan/batch/supervisor.ts +317 -0
package/src/ultraplan/batch/worker.ts +26 -0
package/src/ultraplan/batch/worktree.ts +110 -0
package/src/ultraplan/contracts.ts +1593 -0
package/src/ultraplan/default-agents/authoring/discoverer.md +12 -0
package/src/ultraplan/default-agents/authoring/intake.md +12 -0
package/src/ultraplan/default-agents/authoring/planner.md +12 -0
package/src/ultraplan/default-agents/authoring/researcher.md +12 -0
package/src/ultraplan/default-agents/authoring/scope-checker.md +12 -0
package/src/ultraplan/default-agents/authoring/scout.md +12 -0
package/src/ultraplan/default-agents/authoring/structure-checker.md +12 -0
package/src/ultraplan/default-agents/authoring/tdd-checker.md +12 -0
package/src/ultraplan/default-agents/backend-domain-reviewer.md +10 -0
package/src/ultraplan/default-agents/backend-executor.md +10 -0
package/src/ultraplan/default-agents/backend-stack-reviewer.md +10 -0
package/src/ultraplan/default-agents/backend-tester.md +10 -0
package/src/ultraplan/default-agents/frontend-domain-reviewer.md +10 -0
package/src/ultraplan/default-agents/frontend-executor.md +10 -0
package/src/ultraplan/default-agents/frontend-stack-reviewer.md +10 -0
package/src/ultraplan/default-agents/frontend-tester.md +10 -0
package/src/ultraplan/default-agents/infrastructure-domain-reviewer.md +10 -0
package/src/ultraplan/default-agents/infrastructure-executor.md +10 -0
package/src/ultraplan/default-agents/infrastructure-stack-reviewer.md +10 -0
package/src/ultraplan/default-agents/infrastructure-tester.md +10 -0
package/src/ultraplan/execution/contract.ts +71 -0
package/src/ultraplan/execution/policy.ts +217 -0
package/src/ultraplan/execution/runtime-tools.ts +107 -0
package/src/ultraplan/execution/session-runner.ts +281 -0
package/src/ultraplan/next-router.ts +85 -0
package/src/ultraplan/presenter.ts +359 -0
package/src/ultraplan/project-paths.ts +342 -0
package/src/ultraplan/runtime/active-execution.ts +72 -0
package/src/ultraplan/runtime/apply-mutation.ts +416 -0
package/src/ultraplan/runtime/blockers.ts +243 -0
package/src/ultraplan/runtime/hook-bridge.ts +486 -0
package/src/ultraplan/runtime/launch-context.ts +207 -0
package/src/ultraplan/runtime/migration.ts +524 -0
package/src/ultraplan/runtime/normalize.ts +281 -0
package/src/ultraplan/runtime/proof.ts +260 -0
package/src/ultraplan/runtime/reducer.ts +416 -0
package/src/ultraplan/runtime/repair.ts +251 -0
package/src/ultraplan/runtime/tracker-storage.ts +368 -0
package/src/ultraplan/session-selection.ts +291 -0
package/src/ultraplan/storage.ts +374 -0
package/src/utils/editor.ts +38 -0
package/src/utils/executable.ts +80 -0
package/src/utils/paths.ts +1 -20
package/src/utils/shell.ts +31 -0
package/src/visual/companion.ts +2 -1
package/src/visual/scripts/frame-template.html +60 -0
package/src/visual/scripts/index.js +59 -13
package/src/visual/scripts/package.json +3 -0
package/src/visual/start-server.ts +2 -1
package/src/workspace/git-scope.ts +64 -0
package/src/workspace/locks.ts +23 -0
package/src/workspace/package-manager.ts +117 -0
package/src/workspace/path-mapping.ts +75 -0
package/src/workspace/project-slug.ts +92 -0
package/src/workspace/repo-root.ts +137 -0
package/src/workspace/selector.ts +115 -0
package/src/workspace/state-paths.ts +118 -0
package/src/workspace/targets.ts +313 -0
package/src/fix-pr/scripts/diff-comments.sh +0 -33
package/src/fix-pr/scripts/fetch-pr-comments.sh +0 -25
package/src/fix-pr/scripts/trigger-review.sh +0 -36
package/src/fix-pr/scripts/wait-and-check.sh +0 -37
package/src/qa/scripts/detect-app-type.sh +0 -68
package/src/qa/scripts/discover-routes.sh +0 -143
package/src/qa/scripts/run-e2e-tests.sh +0 -131
package/src/qa/scripts/start-dev-server.sh +0 -46
package/src/qa/scripts/stop-dev-server.sh +0 -36
package/src/review/prompts/fix-output-schema.md +0 -18
package/src/review/prompts/review-output-schema.md +0 -38
package/src/review/template.ts +0 -15
package/src/{review → ai}/prompts/invalid-output-retry.md +0 -0

package/src/context-mode/web/fetcher.ts CHANGED Viewed

@@ -1,3 +1,4 @@
+import type { KnowledgeOwner } from "../../types.js";
 import { type Chunk, chunkMarkdown } from "../knowledge/chunker.js";
 import type { KnowledgeStore } from "../knowledge/store.js";
 import { htmlToMarkdown } from "./html-to-md.js";
@@ -7,6 +8,8 @@ export interface FetchOptions {
   source?: string;
   /** Bypass 24h TTL cache. */
   force?: boolean;
+  /** Ownership scope for indexed/cached content. Defaults to project-owned when omitted. */
+  owner?: KnowledgeOwner;
 }
 export interface FetchResult {
@@ -28,15 +31,22 @@ export async function fetchAndIndex(
   options?: FetchOptions,
 ): Promise<FetchResult> {
   const source = options?.source ?? new URL(url).hostname;
+  const owner = options?.owner;
+  const resolvedOwner = resolveOwner(owner);
-  // Check cache unless forced
+  // Check cache unless forced. Explicit owners must be isolated exactly; the
+  // default project-owned path also accepts migrated legacy rows so upgraded
+  // stores do not refetch and duplicate visible search results.
   if (!options?.force) {
-    const cached = store.db
-      .prepare("SELECT fetched_at FROM url_cache WHERE url = ? AND source = ?")
-      .get(url, source) as { fetched_at: number } | null;
+    const cacheOwners = owner ? [resolvedOwner] : [resolvedOwner, { ownerScope: "legacy" as const, ownerId: "" }];
+    for (const cacheOwner of cacheOwners) {
+      const cached = store.db
+        .prepare("SELECT fetched_at FROM url_cache WHERE url = ? AND source = ? AND owner_scope = ? AND owner_id = ?")
+        .get(url, source, cacheOwner.ownerScope, cacheOwner.ownerId) as { fetched_at: number } | null;
-    if (cached && Date.now() - cached.fetched_at < TTL_MS) {
-      return buildCachedResult(store, source);
+      if (cached && Date.now() - cached.fetched_at < TTL_MS) {
+        return buildCachedResult(store, source, cacheOwner);
+      }
     }
   }
@@ -51,11 +61,11 @@ export async function fetchAndIndex(
   const markdown = toMarkdown(rawText, contentType);
   const chunks = chunkMarkdown(markdown, source);
-  store.index(chunks, source);
+  store.index(chunks, source, owner);
   store.db.run(
-    "INSERT OR REPLACE INTO url_cache (url, source, fetched_at) VALUES (?, ?, ?)",
-    [url, source, Date.now()],
+    "INSERT OR REPLACE INTO url_cache (url, source, owner_scope, owner_id, fetched_at) VALUES (?, ?, ?, ?, ?)",
+    [url, source, resolvedOwner.ownerScope, resolvedOwner.ownerId, Date.now()],
   );
   return {
@@ -102,11 +112,20 @@ function buildPreview(chunks: Chunk[]): string {
   return out;
 }
+function resolveOwner(owner: KnowledgeOwner | undefined): Required<KnowledgeOwner> {
+  return {
+    ownerScope: owner?.ownerScope ?? "project",
+    ownerId: owner?.ownerId ?? "",
+  };
+}
 /** Reconstruct a cached result by querying stored chunks. */
-function buildCachedResult(store: KnowledgeStore, source: string): FetchResult {
+function buildCachedResult(store: KnowledgeStore, source: string, owner: Required<KnowledgeOwner>): FetchResult {
   const rows = store.db
-    .prepare("SELECT title, body, content_type AS contentType FROM content_chunks WHERE source = ? ORDER BY id")
-    .all(source) as Chunk[];
+    .prepare(
+      "SELECT title, body, content_type AS contentType FROM content_chunks WHERE source = ? AND owner_scope = ? AND owner_id = ? ORDER BY id",
+    )
+    .all(source, owner.ownerScope, owner.ownerId) as Chunk[];
   return {
     preview: buildPreview(rows),

package/src/debug/logger.ts CHANGED Viewed

@@ -1,6 +1,7 @@
 import * as fs from "node:fs";
 import * as path from "node:path";
 import type { PlatformPaths } from "../platform/types.js";
+import { getProjectStatePath } from "../workspace/state-paths.js";
 export type DebugSessionContext = {
   cwd?: string;
@@ -74,7 +75,7 @@ export function createDebugLogger(
     };
   }
-  const filePath = paths.project(cwd, "debug", `tool-${sanitizedTool}__session-${sessionId}.jsonl`);
+  const filePath = getProjectStatePath(paths, cwd, "debug", `tool-${sanitizedTool}__session-${sessionId}.jsonl`);
   const logger: DebugLogger = {
     enabled: true,

package/src/deps/registry.ts CHANGED Viewed

@@ -148,7 +148,7 @@ export const DEPENDENCIES: Dependency[] = [
     binary: "playwright",
     required: false,
     category: "testing",
-    description: "Test runner for E2E tests (run-e2e-tests.sh)",
+    description: "Test runner used by the portable QA Bun entrypoints",
     checkFn: (exec) => checkBinary(exec, "playwright"),
     installCmd: null, // Compound command (&&) — not compatible with installDep's naive split
     url: "https://playwright.dev",

package/src/discipline/failure-summarizer.ts ADDED Viewed

@@ -0,0 +1,170 @@
+// src/discipline/failure-summarizer.ts
+//
+// Offline analyzer that walks stored reliability records and persisted
+// session artifacts, classifies each failure via the failure taxonomy,
+// and produces a compact deterministic report.
+//
+// The summarizer is pure: given the same input records it produces the
+// same report. Every data source is optional — callers pass what they
+// have, the summarizer copes with partial inputs.
+//
+// Phase 8 exit gate: recurring failures are aggregated so the next
+// hardening target is evidence-driven, not anecdotal.
+import type { PlatformPaths } from "../platform/types.js";
+import type { ReliabilityRecord } from "../types.js";
+import { readReliabilityRecords } from "../storage/reliability-metrics.js";
+import {
+  FAILURE_CLASSES,
+  classifyFailure,
+  describeFailureClass,
+  type FailureClass,
+} from "./failure-taxonomy.js";
+export interface FailureOccurrence {
+  /** Timestamp of the underlying event. */
+  ts: string;
+  /** Command that produced the failure. */
+  command: string;
+  /** Specific operation (e.g. "commit-plan"), when known. */
+  operation?: string;
+  /** All classes that fired for this occurrence. */
+  classes: FailureClass[];
+  /** Truthful reason from the record. */
+  reason?: string;
+}
+export interface FailureClassAggregate {
+  class: FailureClass;
+  description: string;
+  /** Total occurrences of this class in the input. */
+  count: number;
+  /** Count per command, sorted alphabetically. */
+  byCommand: Array<{ command: string; count: number }>;
+  /** Up to `exampleCount` representative records for review. */
+  examples: FailureOccurrence[];
+}
+export interface FailureSummary {
+  /** Total non-ok records considered. */
+  totalFailures: number;
+  /** Failure classes that fired at least once, sorted by taxonomy order. */
+  aggregates: FailureClassAggregate[];
+  /** Non-ok records that did NOT match any taxonomy class. */
+  unclassified: FailureOccurrence[];
+}
+export interface SummarizeOptions {
+  /** Number of example occurrences per class. Default 3. */
+  exampleCount?: number;
+}
+function isFailureRecord(record: ReliabilityRecord): boolean {
+  return record.outcome !== "ok";
+}
+function classifyRecord(record: ReliabilityRecord): FailureOccurrence {
+  const classes = classifyFailure({
+    outcome: record.outcome,
+    reason: record.reason,
+    // attempts used by unproductive-retry rule
+    attempts: record.attempts,
+  } as any);
+  return {
+    ts: record.ts,
+    command: record.command,
+    operation: record.operation,
+    classes,
+    reason: record.reason,
+  };
+}
+function aggregate(
+  occurrences: FailureOccurrence[],
+  exampleCount: number,
+): FailureClassAggregate[] {
+  const map = new Map<FailureClass, FailureOccurrence[]>();
+  for (const occ of occurrences) {
+    for (const cls of occ.classes) {
+      const list = map.get(cls) ?? [];
+      list.push(occ);
+      map.set(cls, list);
+    }
+  }
+  const aggregates: FailureClassAggregate[] = [];
+  for (const cls of FAILURE_CLASSES) {
+    const list = map.get(cls);
+    if (!list || list.length === 0) continue;
+    const byCommandMap = new Map<string, number>();
+    for (const occ of list) {
+      byCommandMap.set(occ.command, (byCommandMap.get(occ.command) ?? 0) + 1);
+    }
+    const byCommand = [...byCommandMap.entries()]
+      .map(([command, count]) => ({ command, count }))
+      .sort((a, b) => a.command.localeCompare(b.command));
+    aggregates.push({
+      class: cls,
+      description: describeFailureClass(cls),
+      count: list.length,
+      byCommand,
+      examples: list.slice(0, Math.max(0, exampleCount)),
+    });
+  }
+  return aggregates;
+}
+/**
+ * Summarize an arbitrary list of reliability records. Pure — no filesystem.
+ * Callers can combine records from multiple sources before summarizing.
+ */
+export function summarizeFailures(
+  records: ReliabilityRecord[],
+  options: SummarizeOptions = {},
+): FailureSummary {
+  const exampleCount = options.exampleCount ?? 3;
+  const failures = records.filter(isFailureRecord).map(classifyRecord);
+  const classified = failures.filter((f) => f.classes.length > 0);
+  const unclassified = failures.filter((f) => f.classes.length === 0);
+  return {
+    totalFailures: failures.length,
+    aggregates: aggregate(classified, exampleCount),
+    unclassified,
+  };
+}
+/**
+ * Convenience: load records from the per-cwd reliability store and
+ * summarize. Empty store produces an empty summary (no crashes).
+ */
+export function summarizeLocalFailures(
+  paths: PlatformPaths,
+  cwd: string,
+  options: SummarizeOptions = {},
+): FailureSummary {
+  return summarizeFailures(readReliabilityRecords(paths, cwd), options);
+}
+/**
+ * Format a summary as readable lines. `[]` when there are no failures so
+ * callers can branch on length without a special case.
+ */
+export function formatFailureSummary(summary: FailureSummary): string[] {
+  if (summary.totalFailures === 0) return [];
+  const lines: string[] = [`Failure summary: ${summary.totalFailures} non-ok record(s)`];
+  for (const agg of summary.aggregates) {
+    lines.push(`  [${agg.class}] ${agg.description} \u2014 ${agg.count} occurrence(s)`);
+    for (const per of agg.byCommand) {
+      lines.push(`    \u00b7 ${per.command}: ${per.count}`);
+    }
+  }
+  if (summary.unclassified.length > 0) {
+    lines.push(`  [unclassified] ${summary.unclassified.length} record(s) did not match any taxonomy class`);
+  }
+  return lines;
+}

package/src/discipline/failure-taxonomy.ts ADDED Viewed

@@ -0,0 +1,131 @@
+/**
+ * Workflow failure taxonomy.
+ *
+ * Small, explicit set of failure classes used by summarizer and eval-promotion
+ * to turn raw reliability records + session notes into actionable categories.
+ *
+ * Classification is pure: regex / string checks only, no dynamic evaluation,
+ * deterministic for the same input, never throws.
+ */
+export const FAILURE_CLASSES = [
+	"premature-completion",
+	"wrong-tool-path",
+	"missing-artifact",
+	"verification-skipped",
+	"discovery-miss",
+	"unproductive-retry",
+] as const;
+export type FailureClass = (typeof FAILURE_CLASSES)[number];
+export interface FailureSignals {
+	/** Stored reliability record, optional. */
+	outcome?: "ok" | "blocked" | "retry-exhausted" | "fallback" | "agent-error";
+	/** Reason string from the reliability record or log, optional. */
+	reason?: string;
+	/** Tool call name if the failure involves a blocked/rerouted tool. */
+	toolName?: string;
+	/** Path of an artifact that was expected but not found. */
+	missingArtifactPath?: string;
+	/** Free-text description from debug traces or session notes. */
+	note?: string;
+	/** Attempt count from the reliability record, optional. */
+	attempts?: number;
+}
+// Tool names blocked by `routeToolCall` when context-mode is active.
+// Keep in lock-step with `src/context-mode/routing.ts` — every native tool
+// that the router redirects must classify as `wrong-tool-path` here.
+const BLOCKED_TOOLS = new Set<string>([
+	"search",
+	"find",
+	"bash-grep",
+	"bash-find",
+	"curl",
+	"wget",
+	"fetch",
+	"web_fetch",
+	"WebFetch",
+]);
+const DESCRIPTIONS: Record<FailureClass, string> = {
+	"premature-completion":
+		"Workflow claimed done before required artifact existed.",
+	"wrong-tool-path":
+		"Workflow reached for a blocked tool instead of the preferred ctx_* tool.",
+	"missing-artifact":
+		"Required output (plan file, session, findings.md) was never written.",
+	"verification-skipped":
+		"Agent skipped a mandatory verification step (test, typecheck, eval).",
+	"discovery-miss":
+		"Workflow wandered before finding the right entry point.",
+	"unproductive-retry":
+		"Retry loop spent attempts without making progress.",
+};
+/**
+ * Classify a failure based on signals. Returns one or more matching classes in
+ * priority order (matching `FAILURE_CLASSES` order); empty array when no class
+ * fires. Deterministic — never throws.
+ */
+export function classifyFailure(signals: FailureSignals): FailureClass[] {
+	const reason = signals.reason ?? "";
+	const note = signals.note ?? "";
+	const matches: FailureClass[] = [];
+	// premature-completion
+	if (
+		(signals.outcome === "ok" &&
+			/incomplete|partial|unresolved/i.test(reason)) ||
+		(signals.outcome === "fallback" &&
+			/never produced valid artifact/i.test(reason))
+	) {
+		matches.push("premature-completion");
+	}
+	// wrong-tool-path
+	if (
+		(signals.toolName && BLOCKED_TOOLS.has(signals.toolName)) ||
+		/ctx_/.test(reason)
+	) {
+		matches.push("wrong-tool-path");
+	}
+	// missing-artifact
+	if (
+		signals.missingArtifactPath !== undefined ||
+		(/missing/i.test(reason) && /plan|findings|session/i.test(reason))
+	) {
+		matches.push("missing-artifact");
+	}
+	// verification-skipped
+	if (
+		/without running (validator|tests|typecheck)/i.test(reason) ||
+		/skipped (verification|validation|test)/i.test(reason)
+	) {
+		matches.push("verification-skipped");
+	}
+	// discovery-miss
+	if (
+		/wandered/i.test(reason) ||
+		/wrong file/i.test(reason) ||
+		/searched broadly/i.test(note)
+	) {
+		matches.push("discovery-miss");
+	}
+	// unproductive-retry
+	if (signals.outcome === "retry-exhausted" && (signals.attempts ?? 0) >= 3) {
+		matches.push("unproductive-retry");
+	}
+	return matches;
+}
+/** Canonical human-friendly description per class. */
+export function describeFailureClass(cls: FailureClass): string {
+	return DESCRIPTIONS[cls];
+}

package/src/discipline/workflow-invariants.ts ADDED Viewed

@@ -0,0 +1,125 @@
+// src/discipline/workflow-invariants.ts
+//
+// Runtime invariants that AI-heavy workflows must satisfy before reporting
+// completion. When an invariant fails, the workflow yields a truthful
+// blocker instead of silently claiming success. Used by plan/review/qa/fix-pr
+// completion paths and by Phase 0 evals that test workflow boundaries.
+//
+// Design notes:
+//   - Invariants are pure functions over a workflow-specific context object.
+//   - Invariants return either `{ state: "satisfied" }` or a blocker with a
+//     human-readable `reason`. Keep reasons short and actionable.
+//   - `checkInvariants` returns the FIRST blocker, not a list. Workflows
+//     surface one blocker at a time so the user (or the model) can fix it
+//     and proceed, rather than being handed a noisy report.
+//   - This module owns only the generic abstraction. Workflow-specific
+//     invariant builders live next to their workflow (e.g. plan's PlanSpec
+//     validation in src/planning/approval-flow.ts).
+/**
+ * Outcome of evaluating a single invariant: either it holds (`satisfied`)
+ * or it fails (`blocked`) with a `reason` explaining the failure.
+ */
+export type InvariantState =
+  | { state: "satisfied" }
+  | { state: "blocked"; reason: string };
+/**
+ * A named check over a workflow-specific context object of type `TContext`.
+ * The check may answer synchronously or via a promise.
+ */
+export interface WorkflowInvariant<TContext> {
+  /** Stable identifier. Used for logging and test assertions. */
+  name: string;
+  /**
+   * Evaluate this invariant against the workflow context. Return a blocker
+   * with a truthful reason if the invariant fails.
+   */
+  check: (ctx: TContext) => InvariantState | Promise<InvariantState>;
+}
+/**
+ * Aggregate outcome of running a list of invariants. The `blocked` variant
+ * carries the failing invariant's `name` (as `invariant`) alongside its
+ * `reason`.
+ */
+export type InvariantCheckResult =
+  | { state: "satisfied" }
+  | { state: "blocked"; invariant: string; reason: string };
+/**
+ * Evaluate `invariants` one after another, in list order, against `ctx`.
+ *
+ * Evaluation is sequential and short-circuits: the first invariant that
+ * reports `blocked` ends the run, and later invariants are not evaluated.
+ *
+ * @param invariants - Invariants to evaluate, in priority order.
+ * @param ctx - Workflow context handed to every invariant's `check`.
+ * @returns The first blocker (tagged with the failing invariant's name), or
+ *   `{ state: "satisfied" }` when every invariant is satisfied, which
+ *   includes the case of an empty list.
+ */
+export async function checkInvariants<TContext>(
+  invariants: readonly WorkflowInvariant<TContext>[],
+  ctx: TContext,
+): Promise<InvariantCheckResult> {
+  for (const current of invariants) {
+    // `await` accepts both synchronous and promise-returning checks.
+    const outcome = await current.check(ctx);
+    if (outcome.state === "satisfied") {
+      continue;
+    }
+    return {
+      state: "blocked",
+      invariant: current.name,
+      reason: outcome.reason,
+    };
+  }
+  return { state: "satisfied" };
+}
+// ---------------------------------------------------------------------------
+// Invariant builders — the common shapes workflows compose from
+// ---------------------------------------------------------------------------
+/**
+ * Create an invariant backed by a boolean predicate.
+ *
+ * @param name - Identifier reported for the invariant.
+ * @param predicate - Sync or async test over the context; a truthy result
+ *   means the invariant holds.
+ * @param reason - Blocker text returned whenever the predicate is not
+ *   truthy.
+ * @returns An invariant whose `check` resolves to `satisfied` or to a
+ *   blocker carrying `reason`.
+ */
+export function requireCondition<TContext>(
+  name: string,
+  predicate: (ctx: TContext) => boolean | Promise<boolean>,
+  reason: string,
+): WorkflowInvariant<TContext> {
+  const check = async (ctx: TContext): Promise<InvariantState> => {
+    const holds = await predicate(ctx);
+    if (holds) {
+      return { state: "satisfied" };
+    }
+    return { state: "blocked", reason };
+  };
+  return { name, check };
+}
+/**
+ * Create an invariant that holds only while a required artifact exists.
+ *
+ * @param name - Identifier reported for the invariant.
+ * @param exists - Sync or async existence probe supplied by the caller.
+ * @param artifactLabel - Artifact identifier interpolated into the blocker
+ *   reason.
+ * @returns A condition-based invariant whose blocker reason names the
+ *   missing artifact.
+ */
+export function requireArtifact<TContext>(
+  name: string,
+  exists: (ctx: TContext) => boolean | Promise<boolean>,
+  artifactLabel: string,
+): WorkflowInvariant<TContext> {
+  const missingReason = `Required artifact is missing: ${artifactLabel}.`;
+  return requireCondition(name, exists, missingReason);
+}
+/**
+ * Create an invariant that blocks while work items remain outstanding
+ * (for example open todos, unresolved review comments, or follow-up steps
+ * that have not been dispatched).
+ *
+ * @param name - Identifier reported for the invariant.
+ * @param pending - Sync or async counter of outstanding items.
+ * @param workLabel - Noun inserted after the count in the blocker reason.
+ * @returns An invariant that is satisfied only when the count is exactly 0;
+ *   any other count yields a blocker quoting that count.
+ */
+export function requireNoPendingWork<TContext>(
+  name: string,
+  pending: (ctx: TContext) => number | Promise<number>,
+  workLabel: string,
+): WorkflowInvariant<TContext> {
+  const check = async (ctx: TContext): Promise<InvariantState> => {
+    const outstanding = await pending(ctx);
+    if (outstanding === 0) {
+      return { state: "satisfied" };
+    }
+    return {
+      state: "blocked",
+      reason: `${outstanding} ${workLabel} still pending \u2014 workflow cannot complete.`,
+    };
+  };
+  return { name, check };
+}
+/**
+ * Turn an invariant check result into one line of text suitable for
+ * notifications, logs, or prompts.
+ *
+ * @param result - Result to render.
+ * @returns `"[<invariant>] <reason>"` for a blocker. A satisfied result
+ *   renders as the empty string, so callers can join several rendered
+ *   results without branching on state.
+ */
+export function formatInvariantResult(result: InvariantCheckResult): string {
+  return result.state === "satisfied"
+    ? ""
+    : `[${result.invariant}] ${result.reason}`;
+}

package/src/discovery/index.ts ADDED Viewed

@@ -0,0 +1,31 @@
+// src/discovery/index.ts
+//
+// Deterministic repo-entry-point discovery. Given a workflow query (e.g.
+// "fix the login bug", "review the latest commit") and context signals
+// (changed files, workspace targets), rank likely-relevant files with a
+// short rationale for each candidate.
+//
+// Used by /supi:review, /supi:plan, /supi:qa, and /supi:fix-pr to start
+// from strong candidates rather than broad wandering.
+//
+// Non-goals:
+//   - Hosted search / vector database
+//   - Replacing native tools (grep/lsp). This layer *orchestrates* them.
+//
+// Phase 6 exit gate: fixture workspaces rank expected files first, every
+// candidate carries rationale, behavior stays stable when inputs are empty.
+export type {
+  DiscoveryCandidate,
+  DiscoveryInput,
+  DiscoveryResult,
+  DiscoverySource,
+} from "./rank.js";
+export { rankDiscoveryCandidates } from "./rank.js";
+export { discoverFromSources } from "./sources.js";
+export { rankWithLspAugmentation } from "./lsp.js";
+export type { LspSymbolLocation, LspAugmentedResult } from "./lsp.js";
+export { suggestCandidatesForWorkflow } from "./workflow.js";
+export type { WorkflowDiscoveryInput, WorkflowDiscoveryResult } from "./workflow.js";

package/src/discovery/lsp.ts ADDED Viewed

@@ -0,0 +1,87 @@
+// src/discovery/lsp.ts
+//
+// LSP-assisted discovery: convert symbol search results into external
+// signals the ranker consumes. When LSP is unavailable or the symbol
+// lookup returns nothing, falls through cleanly — callers should never
+// require LSP for discovery to work.
+//
+// This module deliberately does not talk to LSP directly. Callers pass in
+// a `querySymbols` callback so the same function can be driven by:
+//   - the live platform LSP bridge in production
+//   - a deterministic fixture in tests
+import type { DiscoveryCandidate } from "./rank.js";
+import { rankDiscoveryCandidates, type DiscoveryInput } from "./rank.js";
+/**
+ * One symbol hit returned by the `querySymbols` callback. Each hit is folded
+ * into the external signals under its `path`.
+ */
+export interface LspSymbolLocation {
+  /** Repo-relative path where the symbol is defined or referenced. */
+  path: string;
+  /** Short reason string attached to the candidate. */
+  reason: string;
+  /** Extra score beyond the baseline LSP boost. Optional. */
+  bonus?: number;
+}
+/**
+ * Input for LSP-augmented ranking: the regular discovery input plus a
+ * caller-supplied symbol lookup callback.
+ */
+export interface LspDiscoveryInput extends DiscoveryInput {
+  /**
+   * Called with the workflow `query`. Must return a (possibly empty) list
+   * of symbol locations. Any thrown error is caught and treated as
+   * "LSP unavailable" — discovery still returns a ranked list from the
+   * remaining sources.
+   */
+  querySymbols: (query: string) => LspSymbolLocation[] | Promise<LspSymbolLocation[]>;
+}
+/** Result of `rankWithLspAugmentation`. */
+export interface LspAugmentedResult {
+  /** Ranked candidates produced by the ranker from the combined signals. */
+  candidates: DiscoveryCandidate[];
+  /** `false` only when the `querySymbols` callback threw. */
+  lspAvailable: boolean;
+  /** Number of hits the callback returned (0 if it threw or was not called). */
+  lspHitCount: number;
+}
+/** Baseline score added for every LSP hit, before the hit's optional `bonus`. */
+const WEIGHT_LSP = 6;
+/**
+ * Run LSP symbol discovery against the query, fold the hits into external
+ * signals, and rank the combined candidate pool. When `querySymbols` throws
+ * or returns [], the result is still valid — discovery degrades, not fails.
+ *
+ * The callback is only invoked when `input.query` contains non-whitespace
+ * text. Each hit contributes `WEIGHT_LSP + (bonus ?? 0)` to its path; when a
+ * path already has a signal (from the caller or an earlier hit), scores are
+ * summed and rationales are joined with "; ".
+ *
+ * @param input - Discovery input plus the `querySymbols` callback.
+ * @returns The ranked candidates, whether the LSP lookup succeeded
+ *   (`lspAvailable` is `false` only when the callback threw), and the number
+ *   of hits the callback returned.
+ */
+export async function rankWithLspAugmentation(
+  input: LspDiscoveryInput,
+): Promise<LspAugmentedResult> {
+  let lspAvailable = true;
+  let lspHits: LspSymbolLocation[] = [];
+  if (input.query && input.query.trim().length > 0) {
+    try {
+      lspHits = await input.querySymbols(input.query);
+    } catch {
+      // Deliberate best-effort: a failing lookup means "LSP unavailable".
+      lspAvailable = false;
+      lspHits = [];
+    }
+  }
+  // Copy so the caller's signal map is never mutated.
+  const externalSignals: Record<string, { score: number; rationale: string }> = {
+    ...(input.externalSignals ?? {}),
+  };
+  for (const hit of lspHits) {
+    // Own-property lookup only: a path such as "constructor" or "toString"
+    // would otherwise resolve to an inherited Object.prototype member, be
+    // mistaken for a prior signal, and yield a NaN score.
+    const prior = Object.prototype.hasOwnProperty.call(externalSignals, hit.path)
+      ? externalSignals[hit.path]
+      : undefined;
+    const score = WEIGHT_LSP + (hit.bonus ?? 0);
+    externalSignals[hit.path] = prior
+      ? {
+          score: prior.score + score,
+          rationale: `${prior.rationale}; ${hit.reason}`,
+        }
+      : { score, rationale: hit.reason };
+  }
+  const ranked = rankDiscoveryCandidates({
+    ...input,
+    externalSignals,
+  });
+  return {
+    candidates: ranked.candidates,
+    lspAvailable,
+    lspHitCount: lspHits.length,
+  };
+}