npm - @vigolium/piolium - Versions diffs - 0.0.1 - Mend

@vigolium/piolium 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (271) hide show

package/LICENSE +21 -0
package/README.md +117 -0
package/agents/access-auditor.md +300 -0
package/agents/assumption-breaker.md +154 -0
package/agents/attack-designer.md +116 -0
package/agents/code-scanner.md +139 -0
package/agents/concurrency-auditor.md +238 -0
package/agents/confirm-writer.md +257 -0
package/agents/context-reviewer.md +274 -0
package/agents/cross-verifier.md +165 -0
package/agents/cve-scout.md +381 -0
package/agents/env-builder.md +282 -0
package/agents/env-profiler.md +205 -0
package/agents/evidence-collector.md +140 -0
package/agents/finding-grader.md +142 -0
package/agents/finding-writer.md +148 -0
package/agents/flow-tracer.md +106 -0
package/agents/goal-backtracer.md +146 -0
package/agents/history-miner.md +467 -0
package/agents/independent-verifier.md +118 -0
package/agents/intent-mapper.md +183 -0
package/agents/longshot-collector.md +128 -0
package/agents/longshot-prober.md +126 -0
package/agents/patch-auditor.md +73 -0
package/agents/poc-author.md +124 -0
package/agents/poc-runner.md +194 -0
package/agents/probe-lead.md +269 -0
package/agents/red-challenger.md +101 -0
package/agents/report-composer.md +208 -0
package/agents/review-adjudicator.md +216 -0
package/agents/spec-auditor.md +155 -0
package/agents/taint-tracer.md +265 -0
package/agents/test-locator.md +209 -0
package/agents/threat-modeler.md +132 -0
package/agents/variant-scanner.md +108 -0
package/agents/variant-spotter.md +110 -0
package/bin/piolium.mjs +376 -0
package/extensions/piolium/_vendor/yaml.bundle.d.mts +6 -0
package/extensions/piolium/_vendor/yaml.bundle.mjs +139 -0
package/extensions/piolium/agent-runner.ts +322 -0
package/extensions/piolium/agents.ts +266 -0
package/extensions/piolium/audit-state.ts +522 -0
package/extensions/piolium/bundled-resources.ts +97 -0
package/extensions/piolium/candidate-scan.ts +966 -0
package/extensions/piolium/command-target.ts +177 -0
package/extensions/piolium/console-stream.ts +57 -0
package/extensions/piolium/export-results.ts +380 -0
package/extensions/piolium/findings.ts +448 -0
package/extensions/piolium/heartbeat.ts +182 -0
package/extensions/piolium/help.ts +234 -0
package/extensions/piolium/index.ts +1865 -0
package/extensions/piolium/longshot.ts +530 -0
package/extensions/piolium/matcher-suggestions.ts +196 -0
package/extensions/piolium/matcher-utils.ts +83 -0
package/extensions/piolium/modes/balanced.ts +750 -0
package/extensions/piolium/modes/confirm-bootstrap.ts +186 -0
package/extensions/piolium/modes/confirm.ts +697 -0
package/extensions/piolium/modes/deep.ts +917 -0
package/extensions/piolium/modes/diff.ts +177 -0
package/extensions/piolium/modes/lite.ts +540 -0
package/extensions/piolium/modes/longshot.ts +595 -0
package/extensions/piolium/modes/merge.ts +204 -0
package/extensions/piolium/modes/phase-runner.ts +267 -0
package/extensions/piolium/modes/reinvest.ts +546 -0
package/extensions/piolium/modes/revisit.ts +279 -0
package/extensions/piolium/modes.ts +48 -0
package/extensions/piolium/phase-labels.ts +123 -0
package/extensions/piolium/phase-status-strip.ts +92 -0
package/extensions/piolium/prompt-prefix-editor.ts +39 -0
package/extensions/piolium/providers/anthropic-vertex.ts +836 -0
package/extensions/piolium/recon.ts +409 -0
package/extensions/piolium/result-stats.ts +105 -0
package/extensions/piolium/retry.ts +120 -0
package/extensions/piolium/scheduler.ts +212 -0
package/extensions/piolium/secrets.ts +368 -0
package/extensions/piolium/tools/web-tools.ts +148 -0
package/package.json +77 -0
package/skills/agentic-actions-auditor/SKILL.md +327 -0
package/skills/agentic-actions-auditor/references/action-profiles.md +186 -0
package/skills/agentic-actions-auditor/references/cross-file-resolution.md +209 -0
package/skills/agentic-actions-auditor/references/foundations.md +94 -0
package/skills/agentic-actions-auditor/references/vector-a-env-var-intermediary.md +77 -0
package/skills/agentic-actions-auditor/references/vector-b-direct-expression-injection.md +83 -0
package/skills/agentic-actions-auditor/references/vector-c-cli-data-fetch.md +83 -0
package/skills/agentic-actions-auditor/references/vector-d-pr-target-checkout.md +88 -0
package/skills/agentic-actions-auditor/references/vector-e-error-log-injection.md +88 -0
package/skills/agentic-actions-auditor/references/vector-f-subshell-expansion.md +82 -0
package/skills/agentic-actions-auditor/references/vector-g-eval-of-ai-output.md +91 -0
package/skills/agentic-actions-auditor/references/vector-h-dangerous-sandbox-configs.md +102 -0
package/skills/agentic-actions-auditor/references/vector-i-wildcard-allowlists.md +88 -0
package/skills/audit/SKILL.md +562 -0
package/skills/audit/assets/icon.svg +7 -0
package/skills/audit/hooks/scripts/validate_phase_output.py +550 -0
package/skills/audit/references/adversarial-review.md +148 -0
package/skills/audit/references/architecture-aware-sast.md +306 -0
package/skills/audit/references/audit-workflow.md +737 -0
package/skills/audit/references/chamber-protocol.md +384 -0
package/skills/audit/references/creative-attack-modes.md +221 -0
package/skills/audit/references/deep-analysis.md +273 -0
package/skills/audit/references/domain-attack-playbooks.md +1129 -0
package/skills/audit/references/knowledge-base-template.md +513 -0
package/skills/audit/references/real-env-validation.md +191 -0
package/skills/audit/references/report-templates.md +417 -0
package/skills/audit/references/triage-and-prereqs.md +134 -0
package/skills/audit/scripts/consolidate_drafts.py +554 -0
package/skills/audit/scripts/partition_findings.py +152 -0
package/skills/audit/scripts/rg-hotspots.sh +121 -0
package/skills/audit/scripts/stamp_file_state.py +349 -0
package/skills/code-reviewer/SKILL.md +65 -0
package/skills/codeql/SKILL.md +281 -0
package/skills/codeql/references/build-fixes.md +90 -0
package/skills/codeql/references/diagnostic-query-templates.md +339 -0
package/skills/codeql/references/extension-yaml-format.md +209 -0
package/skills/codeql/references/important-only-suite.md +153 -0
package/skills/codeql/references/language-details.md +207 -0
package/skills/codeql/references/macos-arm64e-workaround.md +179 -0
package/skills/codeql/references/performance-tuning.md +111 -0
package/skills/codeql/references/quality-assessment.md +172 -0
package/skills/codeql/references/ruleset-catalog.md +63 -0
package/skills/codeql/references/run-all-suite.md +92 -0
package/skills/codeql/references/sarif-processing.md +79 -0
package/skills/codeql/references/threat-models.md +51 -0
package/skills/codeql/workflows/build-database.md +280 -0
package/skills/codeql/workflows/create-data-extensions.md +261 -0
package/skills/codeql/workflows/run-analysis.md +301 -0
package/skills/differential-review/SKILL.md +220 -0
package/skills/differential-review/adversarial.md +203 -0
package/skills/differential-review/methodology.md +234 -0
package/skills/differential-review/patterns.md +300 -0
package/skills/differential-review/reporting.md +369 -0
package/skills/fp-check/SKILL.md +125 -0
package/skills/fp-check/references/bug-class-verification.md +114 -0
package/skills/fp-check/references/deep-verification.md +143 -0
package/skills/fp-check/references/evidence-templates.md +91 -0
package/skills/fp-check/references/false-positive-patterns.md +115 -0
package/skills/fp-check/references/gate-reviews.md +27 -0
package/skills/fp-check/references/standard-verification.md +78 -0
package/skills/insecure-defaults/SKILL.md +117 -0
package/skills/insecure-defaults/references/examples.md +409 -0
package/skills/last30days/SKILL.md +444 -0
package/skills/sarif-parsing/SKILL.md +483 -0
package/skills/sarif-parsing/resources/jq-queries.md +162 -0
package/skills/sarif-parsing/resources/sarif_helpers.py +331 -0
package/skills/security-threat-model/LICENSE.txt +201 -0
package/skills/security-threat-model/SKILL.md +81 -0
package/skills/security-threat-model/agents/openai.yaml +4 -0
package/skills/security-threat-model/references/prompt-template.md +255 -0
package/skills/security-threat-model/references/security-controls-and-assets.md +32 -0
package/skills/semgrep/SKILL.md +212 -0
package/skills/semgrep/references/rulesets.md +162 -0
package/skills/semgrep/references/scan-modes.md +110 -0
package/skills/semgrep/references/scanner-task-prompt.md +140 -0
package/skills/semgrep/scripts/merge_sarif.py +203 -0
package/skills/semgrep/workflows/scan-workflow.md +311 -0
package/skills/semgrep-rule-creator/SKILL.md +168 -0
package/skills/semgrep-rule-creator/references/quick-reference.md +202 -0
package/skills/semgrep-rule-creator/references/workflow.md +240 -0
package/skills/semgrep-rule-variant-creator/SKILL.md +205 -0
package/skills/semgrep-rule-variant-creator/references/applicability-analysis.md +250 -0
package/skills/semgrep-rule-variant-creator/references/language-syntax-guide.md +324 -0
package/skills/semgrep-rule-variant-creator/references/workflow.md +518 -0
package/skills/sharp-edges/SKILL.md +292 -0
package/skills/sharp-edges/references/auth-patterns.md +252 -0
package/skills/sharp-edges/references/case-studies.md +274 -0
package/skills/sharp-edges/references/config-patterns.md +333 -0
package/skills/sharp-edges/references/crypto-apis.md +190 -0
package/skills/sharp-edges/references/lang-c.md +205 -0
package/skills/sharp-edges/references/lang-csharp.md +285 -0
package/skills/sharp-edges/references/lang-go.md +270 -0
package/skills/sharp-edges/references/lang-java.md +263 -0
package/skills/sharp-edges/references/lang-javascript.md +269 -0
package/skills/sharp-edges/references/lang-kotlin.md +265 -0
package/skills/sharp-edges/references/lang-php.md +245 -0
package/skills/sharp-edges/references/lang-python.md +274 -0
package/skills/sharp-edges/references/lang-ruby.md +273 -0
package/skills/sharp-edges/references/lang-rust.md +272 -0
package/skills/sharp-edges/references/lang-swift.md +287 -0
package/skills/sharp-edges/references/language-specific.md +588 -0
package/skills/spec-to-code-compliance/SKILL.md +357 -0
package/skills/spec-to-code-compliance/resources/COMPLETENESS_CHECKLIST.md +69 -0
package/skills/spec-to-code-compliance/resources/IR_EXAMPLES.md +417 -0
package/skills/spec-to-code-compliance/resources/OUTPUT_REQUIREMENTS.md +105 -0
package/skills/supply-chain-risk-auditor/SKILL.md +67 -0
package/skills/supply-chain-risk-auditor/resources/results-template.md +41 -0
package/skills/variant-analysis/METHODOLOGY.md +327 -0
package/skills/variant-analysis/SKILL.md +142 -0
package/skills/variant-analysis/resources/codeql/cpp.ql +119 -0
package/skills/variant-analysis/resources/codeql/go.ql +69 -0
package/skills/variant-analysis/resources/codeql/java.ql +71 -0
package/skills/variant-analysis/resources/codeql/javascript.ql +63 -0
package/skills/variant-analysis/resources/codeql/python.ql +80 -0
package/skills/variant-analysis/resources/semgrep/cpp.yaml +98 -0
package/skills/variant-analysis/resources/semgrep/go.yaml +63 -0
package/skills/variant-analysis/resources/semgrep/java.yaml +61 -0
package/skills/variant-analysis/resources/semgrep/javascript.yaml +60 -0
package/skills/variant-analysis/resources/semgrep/python.yaml +72 -0
package/skills/variant-analysis/resources/variant-report-template.md +75 -0
package/skills/vuln-report/SKILL.md +137 -0
package/skills/vuln-report/agents/openai.yaml +4 -0
package/skills/vuln-report/references/report-template.md +135 -0
package/skills/wooyun-legacy/SKILL.md +367 -0
package/skills/wooyun-legacy/references/bank-penetration.md +222 -0
package/skills/wooyun-legacy/references/checklists/command-execution-checklist.md +119 -0
package/skills/wooyun-legacy/references/checklists/csrf-checklist.md +74 -0
package/skills/wooyun-legacy/references/checklists/file-upload-checklist.md +108 -0
package/skills/wooyun-legacy/references/checklists/info-disclosure-checklist.md +114 -0
package/skills/wooyun-legacy/references/checklists/logic-flaws-checklist.md +95 -0
package/skills/wooyun-legacy/references/checklists/misconfig-checklist.md +124 -0
package/skills/wooyun-legacy/references/checklists/path-traversal-checklist.md +87 -0
package/skills/wooyun-legacy/references/checklists/rce-checklist.md +93 -0
package/skills/wooyun-legacy/references/checklists/sql-injection-checklist.md +97 -0
package/skills/wooyun-legacy/references/checklists/ssrf-checklist.md +99 -0
package/skills/wooyun-legacy/references/checklists/unauthorized-access-checklist.md +89 -0
package/skills/wooyun-legacy/references/checklists/weak-password-checklist.md +115 -0
package/skills/wooyun-legacy/references/checklists/xss-checklist.md +103 -0
package/skills/wooyun-legacy/references/checklists/xxe-checklist.md +130 -0
package/skills/wooyun-legacy/references/info-disclosure.md +975 -0
package/skills/wooyun-legacy/references/logic-flaws.md +721 -0
package/skills/wooyun-legacy/references/path-traversal.md +1191 -0
package/skills/wooyun-legacy/references/telecom-penetration.md +156 -0
package/skills/wooyun-legacy/references/unauthorized-access.md +980 -0
package/skills/wooyun-legacy/references/xss.md +746 -0
package/skills/zeroize-audit/SKILL.md +371 -0
package/skills/zeroize-audit/configs/c.yaml +21 -0
package/skills/zeroize-audit/configs/default.yaml +128 -0
package/skills/zeroize-audit/configs/rust.yaml +83 -0
package/skills/zeroize-audit/prompts/report_template.md +238 -0
package/skills/zeroize-audit/prompts/system.md +163 -0
package/skills/zeroize-audit/prompts/task.md +97 -0
package/skills/zeroize-audit/references/compile-commands.md +231 -0
package/skills/zeroize-audit/references/detection-strategy.md +191 -0
package/skills/zeroize-audit/references/ir-analysis.md +252 -0
package/skills/zeroize-audit/references/mcp-analysis.md +221 -0
package/skills/zeroize-audit/references/poc-generation.md +470 -0
package/skills/zeroize-audit/references/rust-zeroization-patterns.md +867 -0
package/skills/zeroize-audit/schemas/input.json +83 -0
package/skills/zeroize-audit/schemas/output.json +140 -0
package/skills/zeroize-audit/tools/analyze_asm.sh +202 -0
package/skills/zeroize-audit/tools/analyze_cfg.py +381 -0
package/skills/zeroize-audit/tools/analyze_heap.sh +211 -0
package/skills/zeroize-audit/tools/analyze_ir_semantic.py +429 -0
package/skills/zeroize-audit/tools/diff_ir.sh +135 -0
package/skills/zeroize-audit/tools/diff_rust_mir.sh +189 -0
package/skills/zeroize-audit/tools/emit_asm.sh +67 -0
package/skills/zeroize-audit/tools/emit_ir.sh +77 -0
package/skills/zeroize-audit/tools/emit_rust_asm.sh +178 -0
package/skills/zeroize-audit/tools/emit_rust_ir.sh +150 -0
package/skills/zeroize-audit/tools/emit_rust_mir.sh +158 -0
package/skills/zeroize-audit/tools/extract_compile_flags.py +284 -0
package/skills/zeroize-audit/tools/generate_poc.py +1329 -0
package/skills/zeroize-audit/tools/mcp/apply_confidence_gates.py +113 -0
package/skills/zeroize-audit/tools/mcp/check_mcp.sh +68 -0
package/skills/zeroize-audit/tools/mcp/normalize_mcp_evidence.py +125 -0
package/skills/zeroize-audit/tools/scripts/check_llvm_patterns.py +481 -0
package/skills/zeroize-audit/tools/scripts/check_mir_patterns.py +554 -0
package/skills/zeroize-audit/tools/scripts/check_rust_asm.py +424 -0
package/skills/zeroize-audit/tools/scripts/check_rust_asm_aarch64.py +300 -0
package/skills/zeroize-audit/tools/scripts/check_rust_asm_x86.py +283 -0
package/skills/zeroize-audit/tools/scripts/find_dangerous_apis.py +375 -0
package/skills/zeroize-audit/tools/scripts/semantic_audit.py +923 -0
package/skills/zeroize-audit/tools/track_dataflow.sh +196 -0
package/skills/zeroize-audit/tools/validate_rust_toolchain.sh +298 -0
package/skills/zeroize-audit/workflows/phase-0-preflight.md +150 -0
package/skills/zeroize-audit/workflows/phase-1-source-analysis.md +144 -0
package/skills/zeroize-audit/workflows/phase-2-compiler-analysis.md +139 -0
package/skills/zeroize-audit/workflows/phase-3-interim-report.md +46 -0
package/skills/zeroize-audit/workflows/phase-4-poc-generation.md +46 -0
package/skills/zeroize-audit/workflows/phase-5-poc-validation.md +136 -0
package/skills/zeroize-audit/workflows/phase-6-final-report.md +44 -0
package/skills/zeroize-audit/workflows/phase-7-test-generation.md +42 -0
package/themes/piolium-srcery.json +94 -0

package/extensions/piolium/modes/merge.ts ADDED Viewed

@@ -0,0 +1,204 @@
+/**
+ * Merge mode (`/piolium-merge`).
+ *
+ * Combines multiple `piolium/` result trees into one. Two stages:
+ *
+ *   M1-M3 (deterministic): copy + collision-rename + per-finding validation.
+ *   M4-M7 (agent-driven):  semantic dedup + quarantine + renumber + final report.
+ *
+ * MVP scope:
+ *   - Only the M1 part of the deterministic stage (copying each source under
+ *     an alias prefix and writing the index files) is implemented in
+ *     TypeScript here.
+ *   - Everything after that runs as a single report-composer pass with
+ *     a long task prompt covering all of M2-M7.
+ *
+ * Each input directory is identified by an alias (`a`, `b`, ...) that gets
+ * prepended to colliding finding ids so the dedup agent has clean inputs.
+ */
+import {
+	cpSync,
+	existsSync,
+	mkdirSync,
+	readdirSync,
+	renameSync,
+	statSync,
+	writeFileSync,
+} from "node:fs";
+import { basename, join } from "node:path";
+import type { AgentRuntimeModel } from "../agent-runner.ts";
+import { loadAgents } from "../agents.ts";
+import { applyPhaseStatus, initAudit, markAuditStatus } from "../audit-state.ts";
+import { runReconAsync } from "../recon.ts";
+import { type PhaseUiHooks, runAgentPhase } from "./phase-runner.ts";
+/** Inputs accepted by `runMergeAudit`. */
+export interface RunMergeOptions {
+	/** Working directory; the merge workspace is created under `<cwd>/piolium/merge-workspace`. */
+	cwd: string;
+	/** Source `piolium/` trees to merge. Must be ≥2. */
+	sources: string[];
+	/** Optional abort signal, forwarded to recon and to the agent phase. */
+	signal?: AbortSignal;
+	/** Optional UI hooks used for status text and the final notification. */
+	ui?: PhaseUiHooks;
+	/** Optional runtime model settings, passed through to the agent phase unchanged. */
+	agentRuntime?: AgentRuntimeModel;
+}
+/** Outcome reported by `runMergeAudit`. */
+export interface RunMergeResult {
+	/** Identifier of the audit record created for this merge run. */
+	auditId: string;
+	/** `"failed"` when the agent phase threw, `"complete"` otherwise. */
+	status: "complete" | "failed";
+	/** Paths of the alias-prefixed finding directories staged in the merge workspace. */
+	mergedFindings: string[];
+}
+// Directory (relative to the audit cwd) created before the merge agent runs.
+const ATTACK_SURFACE_DIR = "piolium/attack-surface";
+// Relative path of the merge summary; the merge phase gate requires this file to exist.
+export const MERGE_ATTACK_SURFACE_SUMMARY = `${ATTACK_SURFACE_DIR}/merge-summary.md`;
+/**
+ * Maps a zero-based source index to a lowercase alphabetic alias.
+ *
+ * Indexes 0..25 map to `a`..`z`. Larger indexes continue spreadsheet-style
+ * (`aa`, `ab`, ..., `az`, `ba`, ...) so an alias never contains characters
+ * outside `a-z`, which keeps it safe to use as a directory-name prefix.
+ *
+ * @param index - Zero-based position of the source tree.
+ * @returns The alias for that position.
+ * @throws RangeError when `index` is negative or not an integer.
+ */
+function aliasFor(index: number): string {
+	if (!Number.isInteger(index) || index < 0) {
+		throw new RangeError(`Alias index must be a non-negative integer, got ${index}.`);
+	}
+	const firstLetter = "a".charCodeAt(0);
+	let alias = "";
+	let remaining = index;
+	// Bijective base-26: emit the least significant letter first, then shift down.
+	do {
+		alias = String.fromCharCode(firstLetter + (remaining % 26)) + alias;
+		remaining = Math.floor(remaining / 26) - 1;
+	} while (remaining >= 0);
+	return alias;
+}
+/** Recursively copies the file or directory at `src` to `dest`. */
+function copyTree(src: string, dest: string): void {
+	const copyOptions = { recursive: true };
+	cpSync(src, dest, copyOptions);
+}
+/**
+ * Copies every finding directory from `<src>/findings` into `<dest>/findings`,
+ * prefixing each directory name with `<alias>-`.
+ *
+ * Entries that are not directories are ignored, and a destination directory
+ * that already exists is left untouched.
+ *
+ * @returns The destination paths of the directories copied by this call
+ *          (empty when the source has no `findings` directory).
+ */
+function copyFindings(src: string, dest: string, alias: string): string[] {
+	const copied: string[] = [];
+	const sourceRoot = join(src, "findings");
+	if (existsSync(sourceRoot)) {
+		const targetRoot = join(dest, "findings");
+		mkdirSync(targetRoot, { recursive: true });
+		readdirSync(sourceRoot).forEach((name) => {
+			const from = join(sourceRoot, name);
+			const to = join(targetRoot, `${alias}-${name}`);
+			// The alias prefix should already make `to` unique; the existence check is a safety net.
+			if (statSync(from).isDirectory() && !existsSync(to)) {
+				mkdirSync(to, { recursive: true });
+				copyTree(from, to);
+				copied.push(to);
+			}
+		});
+	}
+	return copied;
+}
+/**
+ * Snapshots `<src>/attack-surface` into `<dest>/attack-surface/<alias>`.
+ *
+ * @returns The snapshot path, or `undefined` when the source has no
+ *          `attack-surface` directory. An existing snapshot is reused as-is.
+ */
+function copyAttackSurface(src: string, dest: string, alias: string): string | undefined {
+	const origin = join(src, "attack-surface");
+	if (!existsSync(origin)) {
+		return undefined;
+	}
+	const snapshotRoot = join(dest, "attack-surface");
+	mkdirSync(snapshotRoot, { recursive: true });
+	const snapshot = join(snapshotRoot, alias);
+	if (!existsSync(snapshot)) {
+		copyTree(origin, snapshot);
+	}
+	return snapshot;
+}
+/**
+ * Runs merge mode: stages every source tree in a merge workspace under an
+ * alias, then hands semantic dedup, renumbering and report generation to the
+ * `report-composer` agent in a single phase.
+ *
+ * A failure of the agent phase is not rethrown. It is reported through the
+ * returned `status`, the audit state, and an error notification that carries
+ * the failure reason. Errors raised before the agent phase (argument check,
+ * recon, audit initialisation, filesystem copies) propagate to the caller.
+ *
+ * @param opts - Merge inputs; `opts.sources` must list at least two trees.
+ * @returns The audit id, the final status, and the staged finding directories.
+ * @throws Error when fewer than two sources are supplied.
+ */
+export async function runMergeAudit(opts: RunMergeOptions): Promise<RunMergeResult> {
+	const { cwd, signal, ui } = opts;
+	if (opts.sources.length < 2) {
+		throw new Error("Merge requires at least two source piolium/ trees.");
+	}
+	ui?.setStatus?.("piolium-merge", "● preparing recon");
+	const recon = await runReconAsync(cwd, { signal });
+	const audit = await initAudit(cwd, {
+		mode: "merge",
+		...(recon.commit ? { commit: recon.commit } : { commit: null }),
+		...(recon.branch ? { branch: recon.branch } : { branch: "nogit" }),
+		...(recon.repository ? { repository: recon.repository } : {}),
+		history_available: recon.historyAvailable,
+		agent_sdk: "pi",
+	});
+	const workspace = join(cwd, "piolium", "merge-workspace");
+	mkdirSync(workspace, { recursive: true });
+	mkdirSync(join(cwd, ATTACK_SURFACE_DIR), { recursive: true });
+	// M1: copy each source's findings/ and attack-surface/ into the workspace under aliases.
+	const merged: string[] = [];
+	const attackSurfaceSnapshots: Record<string, string> = {};
+	const aliasMap: Record<string, string> = {};
+	for (let i = 0; i < opts.sources.length; i++) {
+		const src = opts.sources[i];
+		// Empty entries are skipped but still consume their alias letter.
+		if (!src) continue;
+		const alias = aliasFor(i);
+		aliasMap[alias] = src;
+		const written = copyFindings(src, workspace, alias);
+		merged.push(...written);
+		const attackSurface = copyAttackSurface(src, workspace, alias);
+		if (attackSurface) attackSurfaceSnapshots[alias] = attackSurface;
+	}
+	// Index files give the agent a machine-readable view of what was staged.
+	writeFileSync(
+		join(workspace, "findings-index.json"),
+		`${JSON.stringify({ aliasMap, merged: merged.map((p) => basename(p)) }, null, "\t")}\n`,
+	);
+	writeFileSync(
+		join(workspace, "attack-surface-index.json"),
+		`${JSON.stringify(
+			{
+				aliasMap,
+				attackSurfaceSnapshots: Object.fromEntries(
+					Object.entries(attackSurfaceSnapshots).map(([alias, path]) => [alias, basename(path)]),
+				),
+			},
+			null,
+			"\t",
+		)}\n`,
+	);
+	// M2-M7: agent-driven semantic dedup + renumber + final report.
+	// Upstream assigns finding-writer to M3 (auto-fix) and report-composer to
+	// M6 (regenerate summaries); the rest are deterministic. piolium runs the
+	// whole M2-M7 tail as one report-composer pass.
+	const { agents } = loadAgents({ cwd });
+	const synth = agents.get("report-composer");
+	const task = [
+		"You are running /piolium-merge: combining multiple archon-audit result trees into one canonical piolium/ output.",
+		"",
+		`Workspace: ${workspace}`,
+		"Each finding directory there is named `<alias>-<original-id>-<slug>` (alias = a/b/c... per source).",
+		"Each source attack-surface corpus, when present, is copied under `merge-workspace/attack-surface/<alias>/`.",
+		`Source map (alias → path):\n${Object.entries(aliasMap)
+			.map(([k, v]) => `  ${k}: ${v}`)
+			.join("\n")}`,
+		"",
+		"Steps:",
+		"  M2 — semantic dedup: identify findings that describe the same root cause across aliases. Decide canonical winner. Record decisions in `merge-workspace/dedup-decisions.json`.",
+		"  M3 — auto-fix: repair frontmatter, malformed PoC JSON, naming violations.",
+		"  M4 — quarantine: move unfixable findings to `piolium/quarantine/<orig-id>-<slug>/QUARANTINE.md` with reason.",
+		"  M5 — renumber: assign deterministic IDs by severity (M-001 critical … M-NNN info). Write `merge-workspace/rename-map.json`.",
+		"  M6 — apply rename: rename surviving finding directories under `piolium/findings/` and rewrite per-report internal links.",
+		`  M7 — merge durable source context into \`${MERGE_ATTACK_SURFACE_SUMMARY}\`, then regenerate \`piolium/final-audit-report.md\` from the merged findings with an Attack Surface Summary linking \`${ATTACK_SURFACE_DIR}/\`.`,
+		"",
+		"Cap surviving findings at 60. Quality > quantity.",
+	].join("\n");
+	let failed = false;
+	let failureReason: string | undefined;
+	try {
+		await runAgentPhase({
+			cwd,
+			audit,
+			phaseName: "M1",
+			statusKey: "piolium-merge",
+			statusLabel: "● merge dedup",
+			agent: synth,
+			missingAgentMessage: "report-composer missing",
+			task,
+			gate: () =>
+				existsSync(join(cwd, "piolium/final-audit-report.md")) &&
+				existsSync(join(cwd, MERGE_ATTACK_SURFACE_SUMMARY)),
+			mode: "merge",
+			ui,
+			agentRuntime: opts.agentRuntime,
+			...(signal ? { signal } : {}),
+		});
+	} catch (err) {
+		// Merge reports failure through its result instead of rethrowing, but the
+		// reason is kept so the user is told why the run failed.
+		failed = true;
+		failureReason = err instanceof Error ? err.message : String(err);
+	}
+	// The single agent phase is tracked as M1 but stands in for M1-M7; mirror
+	// its outcome across the tracked phase set so the status strip isn't stuck
+	// showing M2-M7 pending.
+	for (const p of ["M1", "M2", "M3", "M4", "M5", "M6", "M7"]) {
+		await applyPhaseStatus(cwd, audit, p, { status: failed ? "failed" : "complete" });
+	}
+	await markAuditStatus(cwd, audit.audit_id, failed ? "failed" : "complete");
+	void renameSync; // placeholder for future deterministic rename pass
+	const failureText = failureReason ? `Merge failed: ${failureReason}` : "Merge failed.";
+	ui?.notify?.(failed ? failureText : "Merge complete.", failed ? "error" : "info");
+	return { auditId: audit.audit_id, status: failed ? "failed" : "complete", mergedFindings: merged };
+}

package/extensions/piolium/modes/phase-runner.ts ADDED Viewed

@@ -0,0 +1,267 @@
+/**
+ * Shared helper for orchestrators (lite/balanced/deep/etc.) — wraps a single
+ * phase invocation with audit-state transitions, gate verification, and
+ * structured logging via UI hooks.
+ */
+import { randomUUID } from "node:crypto";
+import type { AgentSessionEvent } from "@earendil-works/pi-coding-agent";
+import { type AgentRunError, type AgentRuntimeModel, runAgent } from "../agent-runner.ts";
+import type { RuntimeContext } from "../agent-runner.ts";
+import type { AgentDefinition } from "../agents.ts";
+import { type AuditRunState, applyPhaseStatus } from "../audit-state.ts";
+import {
+	DEFAULT_HEARTBEAT_INTERVAL_MS,
+	type PhaseHeartbeat,
+	createPhaseHeartbeatTracker,
+	heartbeatStateFields,
+} from "../heartbeat.ts";
+import {
+	errorMessage,
+	readNonNegativeIntEnv,
+	readPositiveIntEnv,
+	retryBackoffMs,
+	sleep,
+} from "../retry.ts";
+/** Optional callbacks an orchestrator uses to report phase progress to the UI. */
+export interface PhaseUiHooks {
+	/** Shows a one-off message at the given severity level. */
+	notify?: (text: string, level: "info" | "warning" | "error") => void;
+	/**
+	 * Sets the status text stored under `key`. `runAgentPhase` passes
+	 * `undefined` as `text` when a phase ends — presumably to clear the entry.
+	 */
+	setStatus?: (key: string, text?: string) => void;
+	/**
+	 * Forwarded copy of every child agent event. Wire this from the command
+	 * handler to surface tool calls + assistant text in the parent chat;
+	 * otherwise the subagent runs silently and the user only sees a footer
+	 * status indicator.
+	 */
+	onAgentEvent?: (phase: string, event: AgentSessionEvent) => void;
+	/**
+	 * Periodic parent-side health signal while a child agent is running.
+	 * This fires even when the child model is quiet, so the UI can prove the
+	 * phase has not been forgotten. Called with `undefined` once an attempt
+	 * has finished.
+	 */
+	onPhaseHeartbeat?: (phase: string, heartbeat?: PhaseHeartbeat) => void;
+}
+/** Everything `runAgentPhase` needs to run and track a single phase. */
+export interface RunAgentPhaseOptions {
+	/** Working directory passed to the agent runtime and to audit-state updates. */
+	cwd: string;
+	/** Audit record whose phase entry is updated as the phase progresses. */
+	audit: AuditRunState;
+	/** Phase identifier used in audit state, run ids and messages. */
+	phaseName: string;
+	/** Key under which the phase's status text is published via `ui.setStatus`. */
+	statusKey: string;
+	/** Human-readable status text; an attempt counter is appended when retries are enabled. */
+	statusLabel: string;
+	/** Agent to run; when `undefined` the phase is marked failed and an error is thrown. */
+	agent: AgentDefinition | undefined;
+	/** Error text used when `agent` is `undefined`. */
+	missingAgentMessage: string;
+	/** Task prompt handed to the agent. */
+	task: string;
+	/** Extra runtime context fields merged after `cwd`, `mode` and `phase`. */
+	runtimeExtras?: Partial<Omit<RuntimeContext, "cwd" | "mode">>;
+	/**
+	 * Returns `true` when the phase's required artifact exists. Checked after a
+	 * successful run (a `false` result fails the attempt) and after an error
+	 * (a `true` result still marks the phase complete).
+	 */
+	gate: () => boolean;
+	/** Caller's abort signal; once aborted, a failing attempt is not retried. */
+	signal?: AbortSignal;
+	/** Optional UI callbacks. */
+	ui?: PhaseUiHooks;
+	/** Audit mode forwarded to the agent runtime context. */
+	mode: AuditRunState["mode"];
+	/** Optional runtime model settings spread into the agent run options. */
+	agentRuntime?: AgentRuntimeModel;
+	/** Per-attempt timeout in milliseconds; no timeout is applied when unset or not positive. */
+	timeoutMs?: number;
+	/** Number of retries after the first attempt. Defaults to PIOLIUM_PHASE_MAX_RETRIES or 5. */
+	maxRetries?: number;
+	/** Base delay for retry backoff. Defaults to PIOLIUM_PHASE_BACKOFF_BASE_MS or 5000. */
+	retryBackoffBaseMs?: number;
+	/** Upper bound for retry backoff. Defaults to PIOLIUM_PHASE_BACKOFF_MAX_MS or 120000. */
+	retryBackoffMaxMs?: number;
+}
+// Interval between heartbeat emissions while an agent attempt is running.
+// Resolved once at module load from PIOLIUM_HEARTBEAT_INTERVAL_MS, with
+// DEFAULT_HEARTBEAT_INTERVAL_MS passed as the fallback.
+const HEARTBEAT_INTERVAL_MS = readPositiveIntEnv(
+	"PIOLIUM_HEARTBEAT_INTERVAL_MS",
+	DEFAULT_HEARTBEAT_INTERVAL_MS,
+);
+/** Retry count used when the caller sets none: PIOLIUM_PHASE_MAX_RETRIES, with 5 as the fallback. */
+function defaultPhaseMaxRetries(): number {
+	const fallbackRetries = 5;
+	return readNonNegativeIntEnv("PIOLIUM_PHASE_MAX_RETRIES", fallbackRetries);
+}
+/** Backoff base delay used when the caller sets none: PIOLIUM_PHASE_BACKOFF_BASE_MS, with 5000 ms as the fallback. */
+function defaultPhaseBackoffBaseMs(): number {
+	const fallbackBaseMs = 5000;
+	return readPositiveIntEnv("PIOLIUM_PHASE_BACKOFF_BASE_MS", fallbackBaseMs);
+}
+/** Backoff ceiling used when the caller sets none: PIOLIUM_PHASE_BACKOFF_MAX_MS, with 120000 ms as the fallback. */
+function defaultPhaseBackoffMaxMs(): number {
+	const fallbackMaxMs = 120_000;
+	return readPositiveIntEnv("PIOLIUM_PHASE_BACKOFF_MAX_MS", fallbackMaxMs);
+}
+/**
+ * Builds the abort signal for one phase attempt.
+ *
+ * Without a positive `timeoutMs` the parent signal (if any) is passed through
+ * untouched. Otherwise a new signal is returned that aborts when the timeout
+ * elapses or when the parent aborts, whichever happens first.
+ *
+ * @returns The signal to hand to the agent plus a `cleanup` callback that
+ *          cancels the timer and detaches the parent listener.
+ */
+function makePhaseSignal(
+	parent: AbortSignal | undefined,
+	timeoutMs: number | undefined,
+	phaseName: string,
+): { signal?: AbortSignal; cleanup: () => void } {
+	if (timeoutMs === undefined || !(timeoutMs > 0)) {
+		const noop = () => {};
+		return parent ? { signal: parent, cleanup: noop } : { cleanup: noop };
+	}
+	const controller = new AbortController();
+	let timer: ReturnType<typeof setTimeout> | undefined = setTimeout(() => {
+		controller.abort(new Error(`Phase ${phaseName} timed out after ${timeoutMs}ms`));
+	}, timeoutMs);
+	// Propagate the parent's abort, keeping its reason when it has one.
+	const forwardParentAbort = () => {
+		controller.abort(parent?.reason ?? new Error(`Phase ${phaseName} aborted`));
+	};
+	if (parent?.aborted) {
+		forwardParentAbort();
+	} else {
+		parent?.addEventListener("abort", forwardParentAbort, { once: true });
+	}
+	const cleanup = () => {
+		if (timer) clearTimeout(timer);
+		timer = undefined;
+		parent?.removeEventListener("abort", forwardParentAbort);
+	};
+	return { signal: controller.signal, cleanup };
+}
+/**
+ * Runs one audit phase with retries, keeping the audit state and UI in sync.
+ *
+ * Resolves when the phase ends up complete: either the agent ran and the gate
+ * passed, or an attempt errored but the gate passes anyway. Returns
+ * immediately when the phase is already recorded as complete and the gate
+ * passes. Throws when the agent is missing, when the caller's signal is
+ * aborted after a failed attempt, or when the last attempt fails.
+ */
+export async function runAgentPhase(opts: RunAgentPhaseOptions): Promise<void> {
+	const { cwd, audit, phaseName, statusKey, statusLabel, agent, ui, gate, mode } = opts;
+	// Already done on a previous run and the artifact is still there: nothing to do.
+	if (audit.phases[phaseName]?.status === "complete" && gate()) return;
+	const maxRetries = Math.max(0, opts.maxRetries ?? defaultPhaseMaxRetries());
+	// Total attempts = the first try plus the configured retries.
+	const maxAttempts = maxRetries + 1;
+	const backoffBaseMs = opts.retryBackoffBaseMs ?? defaultPhaseBackoffBaseMs();
+	const backoffMaxMs = opts.retryBackoffMaxMs ?? defaultPhaseBackoffMaxMs();
+	const onAgentEvent = ui?.onAgentEvent;
+	const onPhaseHeartbeat = ui?.onPhaseHeartbeat;
+	try {
+		if (!agent) {
+			// Record the failure before throwing so the audit state explains why.
+			await applyPhaseStatus(cwd, audit, phaseName, {
+				status: "failed",
+				error: opts.missingAgentMessage,
+			});
+			throw new Error(opts.missingAgentMessage);
+		}
+		for (let attempt = 1; attempt <= maxAttempts; attempt++) {
+			const attemptLabel =
+				maxAttempts > 1 ? `${statusLabel} (${attempt}/${maxAttempts})` : statusLabel;
+			ui?.setStatus?.(statusKey, attemptLabel);
+			await applyPhaseStatus(cwd, audit, phaseName, {
+				status: "in_progress",
+				attempt,
+				max_attempts: maxAttempts,
+				retry_backoff_ms: null,
+				next_retry_at: null,
+				...(attempt > 1 ? { error: `Retry attempt ${attempt}/${maxAttempts} running.` } : {}),
+			});
+			// Run id: phase name, audit id with ':' and '.' replaced, attempt number, random suffix.
+			const runId = `${phaseName.toLowerCase()}-${audit.audit_id.replace(/[:.]/g, "-")}-a${attempt}-${randomUUID().slice(0, 8)}`;
+			const phaseSignal = makePhaseSignal(opts.signal, opts.timeoutMs, phaseName);
+			const heartbeat = createPhaseHeartbeatTracker({
+				phase: phaseName,
+				label: attemptLabel,
+				runId,
+			});
+			let heartbeatTimer: ReturnType<typeof setInterval> | undefined;
+			const emitHeartbeat = () => {
+				const snapshot = heartbeat.snapshot();
+				onPhaseHeartbeat?.(phaseName, snapshot);
+				// Fire-and-forget: the state write is not awaited and its errors are ignored.
+				void applyPhaseStatus(cwd, audit, phaseName, {
+					status: "in_progress",
+					...heartbeatStateFields(snapshot),
+				}).catch(() => {});
+			};
+			try {
+				// Emit once immediately, then on every interval tick while the agent runs.
+				emitHeartbeat();
+				heartbeatTimer = setInterval(emitHeartbeat, HEARTBEAT_INTERVAL_MS);
+				await runAgent({
+					agent,
+					task: opts.task,
+					runId,
+					runtime: { cwd, mode, phase: phaseName, ...opts.runtimeExtras },
+					...(opts.agentRuntime ? opts.agentRuntime : {}),
+					...(phaseSignal.signal ? { signal: phaseSignal.signal } : {}),
+					onEvent: (event) => {
+						heartbeat.recordEvent(event);
+						// Tool start/end events push an extra heartbeat to the UI right away.
+						if (event.type === "tool_execution_start" || event.type === "tool_execution_end") {
+							onPhaseHeartbeat?.(phaseName, heartbeat.snapshot());
+						}
+						onAgentEvent?.(phaseName, event);
+					},
+				});
+				// A clean agent run still fails the attempt when the artifact is missing.
+				if (!gate()) {
+					throw new Error(`Phase ${phaseName} gate failed — expected artifact missing.`);
+				}
+				await applyPhaseStatus(cwd, audit, phaseName, {
+					status: "complete",
+					attempt,
+					max_attempts: maxAttempts,
+					retry_backoff_ms: null,
+					next_retry_at: null,
+					last_error: null,
+				});
+				return;
+			} catch (err) {
+				const message = errorMessage(err);
+				const failure = err as Partial<AgentRunError>;
+				// Keep the transcript path, when the error carries one, as a phase artifact.
+				const artifacts = failure.result?.transcriptPath ? [failure.result.transcriptPath] : undefined;
+				// The attempt errored but the artifact exists: accept the phase as complete.
+				if (gate()) {
+					await applyPhaseStatus(cwd, audit, phaseName, {
+						status: "complete",
+						attempt,
+						max_attempts: maxAttempts,
+						retry_backoff_ms: null,
+						next_retry_at: null,
+						last_error: null,
+						...(artifacts ? { artifacts } : {}),
+					});
+					ui?.notify?.(
+						`Phase ${phaseName} errored but its required artifact exists; treating it as complete.`,
+						"warning",
+					);
+					return;
+				}
+				// Caller aborted or no attempts left: record the failure and rethrow the original error.
+				if (opts.signal?.aborted || attempt >= maxAttempts) {
+					await applyPhaseStatus(cwd, audit, phaseName, {
+						status: "failed",
+						error:
+							attempt >= maxAttempts && maxRetries > 0
+								? `Failed after ${maxRetries} retries: ${message}`
+								: message,
+						attempt,
+						max_attempts: maxAttempts,
+						retry_backoff_ms: null,
+						next_retry_at: null,
+						last_error: message,
+						...(artifacts ? { artifacts } : {}),
+					});
+					throw err;
+				}
+				// Otherwise record when the next attempt is due and wait out the backoff.
+				const backoffMs = retryBackoffMs(attempt, backoffBaseMs, backoffMaxMs);
+				const nextRetryAt = new Date(Date.now() + backoffMs).toISOString();
+				await applyPhaseStatus(cwd, audit, phaseName, {
+					status: "in_progress",
+					error: `Attempt ${attempt}/${maxAttempts} failed: ${message}. Retrying at ${nextRetryAt}.`,
+					attempt,
+					max_attempts: maxAttempts,
+					retry_backoff_ms: backoffMs,
+					next_retry_at: nextRetryAt,
+					last_error: message,
+					...(artifacts ? { artifacts } : {}),
+				});
+				ui?.notify?.(
+					`Phase ${phaseName} attempt ${attempt}/${maxAttempts} failed; retrying in ${Math.ceil(backoffMs / 1000)}s.`,
+					"warning",
+				);
+				ui?.setStatus?.(statusKey, `${statusLabel} retrying in ${Math.ceil(backoffMs / 1000)}s`);
+				await sleep(backoffMs, opts.signal);
+			} finally {
+				// Per-attempt teardown: stop the heartbeat timer, send a final
+				// `undefined` heartbeat, and release the timeout and abort listener.
+				if (heartbeatTimer) clearInterval(heartbeatTimer);
+				onPhaseHeartbeat?.(phaseName, undefined);
+				phaseSignal.cleanup();
+			}
+		}
+	} finally {
+		// Runs on every exit path, success or failure.
+		ui?.setStatus?.(statusKey, undefined);
+	}
+	// Defensive fallback: reached only if the loop ends without returning or throwing.
+	await applyPhaseStatus(cwd, audit, phaseName, {
+		status: "failed",
+		error: `Phase ${phaseName} failed unexpectedly without throwing.`,
+	});
+	throw new Error(`Phase ${phaseName} failed`);
+}