npm - substrate-ai - Versions diffs - 0.20.5 → 0.20.7 - Mend

substrate-ai 0.20.5 → 0.20.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (7)

package/dist/cli/index.js +23 -6
package/dist/{health-CQTK6ltK.js → health-3-qy8XEI.js} +1 -1
package/dist/{health-DHLR9Iz1.js → health-BIS34IYK.js} +57 -2
package/dist/{run-ofO9AWFc.js → run-BAc1zfMQ.js} +2 -2
package/dist/{run-s6bRK0LF.js → run-Dif8PJRd.js} +2 -2
package/package.json +1 -1
package/packs/bmad/prompts/create-story.md +90 -0

package/dist/cli/index.js CHANGED Viewed

@@ -1,10 +1,10 @@
 #!/usr/bin/env node
-import { FileStateStore, RunManifest, SUBSTRATE_OWNED_SETTINGS_KEYS, SupervisorLock, VALID_PHASES, WorkGraphRepository, buildPipelineStatusOutput, createDatabaseAdapter, createStateStore, findPackageRoot, formatOutput, formatPipelineStatusHuman, formatPipelineSummary, formatTokenTelemetry, getAllDescendantPids, getAutoHealthData, getSubstrateDefaultSettings, inspectProcessTree, parseDbTimestampAsUtc, registerHealthCommand, resolveBmadMethodSrcPath, resolveBmadMethodVersion, resolveMainRepoRoot, resolveRunManifest } from "../health-DHLR9Iz1.js";
+import { FileStateStore, RunManifest, SUBSTRATE_OWNED_SETTINGS_KEYS, SupervisorLock, VALID_PHASES, WorkGraphRepository, ZERO_FINDING_COUNTS, buildPipelineStatusOutput, createDatabaseAdapter, createStateStore, findPackageRoot, formatOutput, formatPipelineStatusHuman, formatPipelineSummary, formatTokenTelemetry, getAllDescendantPids, getAutoHealthData, getSubstrateDefaultSettings, inspectProcessTree, parseDbTimestampAsUtc, registerHealthCommand, resolveBmadMethodSrcPath, resolveBmadMethodVersion, resolveMainRepoRoot, resolveRunManifest, rollupFindingCounts } from "../health-BIS34IYK.js";
 import { createLogger } from "../logger-KeHncl-f.js";
 import { createEventBus } from "../helpers-CElYrONe.js";
 import { AdapterRegistry, BudgetConfigSchema, CURRENT_CONFIG_FORMAT_VERSION, CURRENT_TASK_GRAPH_VERSION, ConfigError, CostTrackerConfigSchema, DEFAULT_CONFIG, DoltClient, DoltNotInstalled, GlobalSettingsSchema, IngestionServer, MonitorDatabaseImpl, OPERATIONAL_FINDING, PartialGlobalSettingsSchema, PartialProviderConfigSchema, ProvidersSchema, RoutingRecommender, STORY_METRICS, TelemetryConfigSchema, addTokenUsage, aggregateTokenUsageForRun, checkDoltInstalled, compareRunMetrics, createAmendmentRun, createConfigSystem, createDecision, createDoltClient, createPipelineRun, getActiveDecisions, getAllCostEntriesFiltered, getBaselineRunMetrics, getDecisionsByCategory, getDecisionsByPhaseForRun, getLatestCompletedRun, getLatestRun, getPipelineRunById, getPlanningCostTotal, getRetryableEscalations, getRunMetrics, getRunningPipelineRuns, getSessionCostSummary, getSessionCostSummaryFiltered, getStoryMetricsForRun, getTokenUsageSummary, incrementRunRestarts, initSchema, initializeDolt, listRunMetrics, loadParentRunDecisions, supersedeDecision, tagRunAsBaseline, updatePipelineRun } from "../dist-srr3BfCc.js";
 import "../adapter-registry-DXLMTmfD.js";
-import { AdapterTelemetryPersistence, AppError, DoltRepoMapMetaRepository, DoltSymbolRepository, ERR_REPO_MAP_STORAGE_WRITE, EpicIngester, GitClient, GrammarLoader, RepoMapInjector, RepoMapModule, RepoMapQueryEngine, RepoMapStorage, SymbolParser, createContextCompiler, createDispatcher, createEventEmitter, createImplementationOrchestrator, createPackLoader, createPhaseOrchestrator, createStopAfterGate, createTelemetryAdvisor, formatPhaseCompletionSummary, getFactoryRunSummaries, getScenarioResultsForRun, getTwinRunsForRun, listGraphRuns, registerExportCommand, registerFactoryCommand, registerRunCommand, registerScenariosCommand, resolveStoryKeys, runAnalysisPhase, runPlanningPhase, runSolutioningPhase, validateStopAfterFromConflict } from "../run-ofO9AWFc.js";
+import { AdapterTelemetryPersistence, AppError, DoltRepoMapMetaRepository, DoltSymbolRepository, ERR_REPO_MAP_STORAGE_WRITE, EpicIngester, GitClient, GrammarLoader, RepoMapInjector, RepoMapModule, RepoMapQueryEngine, RepoMapStorage, SymbolParser, createContextCompiler, createDispatcher, createEventEmitter, createImplementationOrchestrator, createPackLoader, createPhaseOrchestrator, createStopAfterGate, createTelemetryAdvisor, formatPhaseCompletionSummary, getFactoryRunSummaries, getScenarioResultsForRun, getTwinRunsForRun, listGraphRuns, registerExportCommand, registerFactoryCommand, registerRunCommand, registerScenariosCommand, resolveStoryKeys, runAnalysisPhase, runPlanningPhase, runSolutioningPhase, validateStopAfterFromConflict } from "../run-BAc1zfMQ.js";
 import "../errors-CSTQNabo.js";
 import "../routing-CcBOCuC9.js";
 import "../decisions-C0pz9Clx.js";
@@ -3619,9 +3619,11 @@ async function runStatusAction(options) {
 			if (run === void 0) run = await getLatestRun(adapter);
 		}
 		let workGraph;
+		let manifestPerStoryState;
 		const { manifest: resolvedManifest } = await resolveRunManifest(dbRoot, run?.id);
 		if (resolvedManifest !== null) try {
 			const manifestData = await resolvedManifest.read();
+			manifestPerStoryState = manifestData.per_story_state;
 			workGraph = buildWorkGraphFromManifest(manifestData.per_story_state);
 			logger$12.debug({ runId: run?.id }, "status: workGraph built from manifest per_story_state");
 		} catch {
@@ -3665,7 +3667,7 @@ async function runStatusAction(options) {
 			logger$12.debug({ err }, "Work graph query failed, continuing without work graph data");
 		}
 		if (run === void 0) {
-			const { inspectProcessTree: inspectProcessTree$1 } = await import("../health-CQTK6ltK.js");
+			const { inspectProcessTree: inspectProcessTree$1 } = await import("../health-3-qy8XEI.js");
 			const substrateDirPath = join(projectRoot, ".substrate");
 			const processInfo = inspectProcessTree$1({
 				projectRoot,
@@ -3708,6 +3710,8 @@ async function runStatusAction(options) {
 						for (const [phase, secs] of Object.entries(parsed)) phaseBreakdown[phase] = Math.round(secs * 1e3);
 					}
 				} catch {}
+				const verificationResult = manifestPerStoryState?.[row.story_key]?.verification_result;
+				const verificationFindings = rollupFindingCounts(verificationResult);
 				return {
 					story_key: row.story_key,
 					result: row.result,
@@ -3718,7 +3722,8 @@ async function runStatusAction(options) {
 						output: row.output_tokens ?? 0
 					},
 					review_cycles: row.review_cycles ?? 0,
-					dispatches: row.dispatches ?? 0
+					dispatches: row.dispatches ?? 0,
+					verification_findings: verificationFindings
 				};
 			});
 			let pipelineWallClockMs = 0;
@@ -5191,7 +5196,7 @@ async function runSupervisorAction(options, deps = {}) {
 								await initSchema(expAdapter);
 								const { runRunAction: runPipeline } = await import(
 									/* @vite-ignore */
-									"../run-s6bRK0LF.js"
+									"../run-Dif8PJRd.js"
 );
 								const runStoryFn = async (opts) => {
 									const exitCode = await runPipeline({
@@ -5953,6 +5958,14 @@ async function runMetricsAction(options) {
 				phaseBreakdownMap[run$1.run_id] = raw !== void 0 ? raw : null;
 			}
 		} catch {}
+		const findingCountsByStoryRun = new Map();
+		const uniqueRunIds = Array.from(new Set(storyMetrics.map((sm) => sm.run_id).filter((id) => id !== "")));
+		for (const uniqueRunId of uniqueRunIds) try {
+			const { manifest } = await resolveRunManifest(dbRoot, uniqueRunId);
+			if (manifest === null) continue;
+			const data = await manifest.read();
+			for (const [storyKey, entry] of Object.entries(data.per_story_state)) findingCountsByStoryRun.set(`${storyKey}:${uniqueRunId}`, rollupFindingCounts(entry.verification_result));
+		} catch {}
 		let factoryRuns = [];
 		try {
 			factoryRuns = await getFactoryRunSummaries(adapter, limit);
@@ -5965,10 +5978,14 @@ async function runMetricsAction(options) {
 				type: "sdlc",
 				phase_token_breakdown: phaseBreakdownMap[run$1.run_id] ?? null
 			}));
+			const storyMetricsWithFindings = storyMetrics.map((sm) => ({
+				...sm,
+				verification_findings: findingCountsByStoryRun.get(`${sm.story_key}:${sm.run_id}`) ?? { ...ZERO_FINDING_COUNTS }
+			}));
 			const jsonPayload = {
 				runs: runsWithBreakdown,
 				graph_runs: factoryRuns,
-				story_metrics: storyMetrics
+				story_metrics: storyMetricsWithFindings
 			};
 			if (doltMetrics !== void 0) if (aggregate) {
 				const aggregateResults = doltMetrics.map((m) => ({

package/dist/{health-CQTK6ltK.js → health-3-qy8XEI.js} RENAMED Viewed

@@ -1,4 +1,4 @@
-import { DEFAULT_STALL_THRESHOLD_SECONDS, getAllDescendantPids, getAutoHealthData, inspectProcessTree, isOrchestratorProcessLine, registerHealthCommand, runHealthAction } from "./health-DHLR9Iz1.js";
+import { DEFAULT_STALL_THRESHOLD_SECONDS, getAllDescendantPids, getAutoHealthData, inspectProcessTree, isOrchestratorProcessLine, registerHealthCommand, runHealthAction } from "./health-BIS34IYK.js";
 import "./logger-KeHncl-f.js";
 import "./dist-srr3BfCc.js";
 import "./decisions-C0pz9Clx.js";

package/dist/{health-DHLR9Iz1.js → health-BIS34IYK.js} RENAMED Viewed

@@ -4486,6 +4486,61 @@ var RunManifest = class RunManifest {
 	}
 };
+//#endregion
+//#region packages/sdlc/dist/run-model/verification-findings-counts.js
+/**
+* Verification finding count roll-up — Story 55-3b.
+*
+* Collapses every finding across every check in a StoredVerificationSummary
+* into a `{error, warn, info}` triple, suitable for per-story surfacing in
+* the status/metrics CLI JSON payloads.
+*
+* Intentionally pure: no I/O, no logger. Does not throw for `undefined`,
+* `null`, or a well-formed summary (a malformed `checks` value is not guarded).
+* Lives in the run-model package so the status and metrics commands (and any future consumer) can share a single implementation and one set of tests.
+*/
+/** Zero-counts object used as the default return value and as the identity
+*  element in consumer-side accumulations. */
+const ZERO_FINDING_COUNTS = Object.freeze({
+	error: 0,
+	warn: 0,
+	info: 0
+});
+/**
+* Sum findings across every check in the summary, grouped by severity.
+*
+* Backward-compatible — when the summary is `undefined` or `null`, or a check
+* has no `findings` field (legacy manifests written before Story 55-2 migrated
+* the checks), the absent arrays contribute 0 to every severity. No severity
+* ever reports `undefined`.
+*/
+function rollupFindingCounts(summary) {
+	if (summary === void 0 || summary === null) return { ...ZERO_FINDING_COUNTS };
+	let error = 0;
+	let warn = 0;
+	let info = 0;
+	for (const check of summary.checks) {
+		const findings = check.findings;
+		if (findings === void 0) continue;
+		for (const finding of findings) switch (finding.severity) {
+			case "error":
+				error += 1;
+				break;
+			case "warn":
+				warn += 1;
+				break;
+			case "info":
+				info += 1;
+				break;
+		}
+	}
+	return {
+		error,
+		warn,
+		info
+	};
+}
 //#endregion
 //#region packages/sdlc/dist/run-model/supervisor-lock.js
 const defaultLogger = console;
@@ -5230,5 +5285,5 @@ function registerHealthCommand(program, _version = "0.0.0", projectRoot = proces
 }
 //#endregion
-export { BMAD_BASELINE_TOKENS_FULL, DEFAULT_STALL_THRESHOLD_SECONDS, DoltMergeConflict, FileStateStore, FindingsInjector, RunManifest, STOP_AFTER_VALID_PHASES, STORY_KEY_PATTERN$1 as STORY_KEY_PATTERN, SUBSTRATE_OWNED_SETTINGS_KEYS, SupervisorLock, VALID_PHASES, WorkGraphRepository, __commonJS, __require, __toESM, applyConfigToGraph, buildPipelineStatusOutput, createDatabaseAdapter$1 as createDatabaseAdapter, createDefaultVerificationPipeline, createGraphOrchestrator, createSdlcCodeReviewHandler, createSdlcCreateStoryHandler, createSdlcDevStoryHandler, createSdlcPhaseHandler, createStateStore, detectCycles, extractTargetFilesFromStoryContent, findPackageRoot, formatOutput, formatPipelineStatusHuman, formatPipelineSummary, formatTokenTelemetry, getAllDescendantPids, getAutoHealthData, getSubstrateDefaultSettings, inspectProcessTree, isOrchestratorProcessLine, parseDbTimestampAsUtc, registerHealthCommand, renderFindings, resolveBmadMethodSrcPath, resolveBmadMethodVersion, resolveGraphPath, resolveMainRepoRoot, resolveRunManifest, runHealthAction, validateStoryKey };
-//# sourceMappingURL=health-DHLR9Iz1.js.map
+export { BMAD_BASELINE_TOKENS_FULL, DEFAULT_STALL_THRESHOLD_SECONDS, DoltMergeConflict, FileStateStore, FindingsInjector, RunManifest, STOP_AFTER_VALID_PHASES, STORY_KEY_PATTERN$1 as STORY_KEY_PATTERN, SUBSTRATE_OWNED_SETTINGS_KEYS, SupervisorLock, VALID_PHASES, WorkGraphRepository, ZERO_FINDING_COUNTS, __commonJS, __require, __toESM, applyConfigToGraph, buildPipelineStatusOutput, createDatabaseAdapter$1 as createDatabaseAdapter, createDefaultVerificationPipeline, createGraphOrchestrator, createSdlcCodeReviewHandler, createSdlcCreateStoryHandler, createSdlcDevStoryHandler, createSdlcPhaseHandler, createStateStore, detectCycles, extractTargetFilesFromStoryContent, findPackageRoot, formatOutput, formatPipelineStatusHuman, formatPipelineSummary, formatTokenTelemetry, getAllDescendantPids, getAutoHealthData, getSubstrateDefaultSettings, inspectProcessTree, isOrchestratorProcessLine, parseDbTimestampAsUtc, registerHealthCommand, renderFindings, resolveBmadMethodSrcPath, resolveBmadMethodVersion, resolveGraphPath, resolveMainRepoRoot, resolveRunManifest, rollupFindingCounts, runHealthAction, validateStoryKey };
+//# sourceMappingURL=health-BIS34IYK.js.map

package/dist/{run-ofO9AWFc.js → run-BAc1zfMQ.js} RENAMED Viewed

@@ -1,4 +1,4 @@
-import { BMAD_BASELINE_TOKENS_FULL, DoltMergeConflict, FileStateStore, FindingsInjector, RunManifest, STOP_AFTER_VALID_PHASES, STORY_KEY_PATTERN, VALID_PHASES, WorkGraphRepository, __commonJS, __require, __toESM, applyConfigToGraph, buildPipelineStatusOutput, createDatabaseAdapter, createDefaultVerificationPipeline, createGraphOrchestrator, createSdlcCodeReviewHandler, createSdlcCreateStoryHandler, createSdlcDevStoryHandler, createSdlcPhaseHandler, detectCycles, extractTargetFilesFromStoryContent, formatOutput, formatPipelineSummary, formatTokenTelemetry, inspectProcessTree, parseDbTimestampAsUtc, renderFindings, resolveGraphPath, resolveMainRepoRoot, validateStoryKey } from "./health-DHLR9Iz1.js";
+import { BMAD_BASELINE_TOKENS_FULL, DoltMergeConflict, FileStateStore, FindingsInjector, RunManifest, STOP_AFTER_VALID_PHASES, STORY_KEY_PATTERN, VALID_PHASES, WorkGraphRepository, __commonJS, __require, __toESM, applyConfigToGraph, buildPipelineStatusOutput, createDatabaseAdapter, createDefaultVerificationPipeline, createGraphOrchestrator, createSdlcCodeReviewHandler, createSdlcCreateStoryHandler, createSdlcDevStoryHandler, createSdlcPhaseHandler, detectCycles, extractTargetFilesFromStoryContent, formatOutput, formatPipelineSummary, formatTokenTelemetry, inspectProcessTree, parseDbTimestampAsUtc, renderFindings, resolveGraphPath, resolveMainRepoRoot, validateStoryKey } from "./health-BIS34IYK.js";
 import { createLogger } from "./logger-KeHncl-f.js";
 import { TypedEventBusImpl, createEventBus, createTuiApp, isTuiCapable, printNonTtyWarning, sleep } from "./helpers-CElYrONe.js";
 import { ADVISORY_NOTES, Categorizer, ConsumerAnalyzer, DEFAULT_GLOBAL_SETTINGS, DispatcherImpl, DoltClient, ESCALATION_DIAGNOSIS, EXPERIMENT_RESULT, EfficiencyScorer, IngestionServer, LogTurnAnalyzer, OPERATIONAL_FINDING, Recommender, RoutingRecommender, RoutingResolver, RoutingTelemetry, RoutingTokenAccumulator, RoutingTuner, STORY_METRICS, STORY_OUTCOME, SubstrateConfigSchema, TEST_EXPANSION_FINDING, TEST_PLAN, TelemetryNormalizer, TelemetryPipeline, TurnAnalyzer, addTokenUsage, aggregateTokenUsageForRun, aggregateTokenUsageForStory, callLLM, createConfigSystem, createDatabaseAdapter$1, createDecision, createPipelineRun, createRequirement, detectInterfaceChanges, getArtifactByTypeForRun, getArtifactsByRun, getDecisionsByCategory, getDecisionsByPhase, getDecisionsByPhaseForRun, getLatestRun, getPipelineRunById, getRunMetrics, getRunningPipelineRuns, getStoryMetricsForRun, getTokenUsageSummary, initSchema, listRequirements, loadModelRoutingConfig, registerArtifact, updatePipelineRun, updatePipelineRunConfig, upsertDecision, writeRunMetrics, writeStoryMetrics } from "./dist-srr3BfCc.js";
@@ -43840,4 +43840,4 @@ function registerRunCommand(program, _version = "0.0.0", projectRoot = process.c
 //#endregion
 export { AdapterTelemetryPersistence, AppError, DoltRepoMapMetaRepository, DoltSymbolRepository, ERR_REPO_MAP_STORAGE_WRITE, EpicIngester, GitClient, GrammarLoader, RepoMapInjector, RepoMapModule, RepoMapQueryEngine, RepoMapStorage, SymbolParser, createContextCompiler, createDispatcher, createEventEmitter, createImplementationOrchestrator, createPackLoader, createPhaseOrchestrator, createStopAfterGate, createTelemetryAdvisor, formatPhaseCompletionSummary, getFactoryRunSummaries, getScenarioResultsForRun, getTwinRunsForRun, listGraphRuns, normalizeGraphSummaryToStatus, registerExportCommand, registerFactoryCommand, registerRunCommand, registerScenariosCommand, resolveMaxReviewCycles, resolveStoryKeys, runAnalysisPhase, runPlanningPhase, runRunAction, runSolutioningPhase, validateStopAfterFromConflict, wireNdjsonEmitter };
-//# sourceMappingURL=run-ofO9AWFc.js.map
+//# sourceMappingURL=run-BAc1zfMQ.js.map

package/dist/{run-s6bRK0LF.js → run-Dif8PJRd.js} RENAMED Viewed

@@ -1,8 +1,8 @@
-import "./health-DHLR9Iz1.js";
+import "./health-BIS34IYK.js";
 import "./logger-KeHncl-f.js";
 import "./helpers-CElYrONe.js";
 import "./dist-srr3BfCc.js";
-import { normalizeGraphSummaryToStatus, registerRunCommand, resolveMaxReviewCycles, runRunAction, wireNdjsonEmitter } from "./run-ofO9AWFc.js";
+import { normalizeGraphSummaryToStatus, registerRunCommand, resolveMaxReviewCycles, runRunAction, wireNdjsonEmitter } from "./run-BAc1zfMQ.js";
 import "./routing-CcBOCuC9.js";
 import "./decisions-C0pz9Clx.js";

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "substrate-ai",
-  "version": "0.20.5",
+  "version": "0.20.7",
   "description": "Substrate — multi-agent orchestration daemon for AI coding agents",
   "type": "module",
   "license": "MIT",

package/packs/bmad/prompts/create-story.md CHANGED Viewed

@@ -64,6 +64,96 @@ Use this exact format for each item:
 - The transport annotation `(queue: ...)` or `(api: ...)` or `(from story X-Y)` is optional but recommended when applicable
 - **The `## Interface Contracts` section is optional** — omit it entirely if the story has no cross-story schema dependencies
+## Runtime Verification Guidance
+**Decide whether this story's artifact is runtime-dependent.** An artifact is runtime-dependent if correctness depends on execution — systemd units, container definitions (Podman Quadlet, Docker Compose), install scripts, migration runners, anything whose behavior is only observable by running it against a real host or ephemeral sandbox.
+If the artifact is runtime-dependent, add a `## Runtime Probes` section to the story file. Each probe is a short shell command whose exit status answers "does this artifact actually work?".
+**If the artifact is NOT runtime-dependent — TypeScript/JavaScript code + tests, type-only refactors, documentation, build or tsconfig edits — omit the `## Runtime Probes` section entirely.** Adding one for a static-output story produces a `pass` (skip) with no benefit. The default substrate self-development case (source code + tests) has no probes.
+### Probe YAML shape
+Declare probes as a YAML list inside a single fenced `yaml` block directly under the `## Runtime Probes` heading. Each entry has this shape:
+```text
+- name: <hyphen-separated-identifier>    # required; unique within story
+  sandbox: host | twin                    # required; one of host | twin
+  command: <shell command line(s)>        # required
+  timeout_ms: 60000                       # optional; defaults to 60000
+  description: <optional context>         # optional
+```
+Required fields: `name`, `sandbox`, `command`. `timeout_ms` and `description` are optional. Probe names must be unique within one story.
+### Sandbox choice
+- **`sandbox: twin`** — default for probes that mutate host state: starting services, binding ports, writing outside the project working directory, running privileged commands. Safer; ephemeral.
+- **`sandbox: host`** — only when the probe is strictly read-only from the host's perspective (linting a file, parsing config, asserting a command exists, pulling an image into a local cache) OR when the host context itself is what the story needs to verify.
+- **When in doubt, pick `twin`.**
+### Probe granularity
+For stories with multiple runtime concerns (install + start + connect), declare **separate named probes per concern** rather than one monolithic probe. Finding messages reference probe names; granular probes produce actionable failures and let retries focus on the specific failure.
+Probe names are hyphen-separated identifiers, not sentences: `dolt-image-pullable`, not `verify that the dolt image can be pulled`.
+### Examples by artifact class
+**Systemd unit:**
+```yaml
+- name: unit-is-active
+  sandbox: twin
+  command: systemctl is-active my-service.service
+  description: unit started and has not crashed
+```
+**Container / Podman Quadlet** (catches the wrong-image-path class — strata Story 1-4):
+```yaml
+- name: dolt-image-pullable
+  sandbox: host
+  command: podman pull ghcr.io/dolthub/dolt-sql-server:latest
+  description: image reference resolves and is pullable
+```
+**Install script:**
+```yaml
+- name: installer-exits-clean
+  sandbox: twin
+  command: bash ./install.sh --dry-run
+- name: installed-binary-reports-version
+  sandbox: twin
+  command: /usr/local/bin/my-tool --version
+```
+**Database migration:**
+```yaml
+- name: migration-applies-cleanly
+  sandbox: twin
+  command: npm run migrate:up && npm run migrate:status
+  description: migration applies and schema_migrations reports the new version
+```
+**Docker Compose:**
+```yaml
+- name: compose-parses
+  sandbox: host
+  command: docker compose -f ./compose.yaml config --quiet
+  description: compose file is syntactically valid
+- name: compose-service-starts
+  sandbox: twin
+  command: docker compose -f ./compose.yaml up -d api && docker compose -f ./compose.yaml ps api | grep -q running
+```
+### Framing
+Treat the probes you draft as a **first pass** the human author will refine. Probes execute on a real host (or — for `sandbox: twin` — a real ephemeral sandbox), so command correctness matters. Prefer conservative commands that exit 0 only on true success and non-zero on any real failure.
 ## Scope Cap Guidance
 **Aim for 6-7 acceptance criteria and 7-8 tasks per story.**