npm - al-sem - Versions diffs - 0.0.1 - Mend

al-sem 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (231) hide show

package/LICENSE +21 -0
package/README.md +361 -0
package/package.json +64 -0
package/scripts/d40-diff.ts +44 -0
package/scripts/fetch-native-parser.ts +179 -0
package/scripts/precision-sample.ts +99 -0
package/scripts/precision-study.ts +42 -0
package/scripts/precision-tabulate.ts +52 -0
package/src/cli/baseline.ts +31 -0
package/src/cli/diff.ts +199 -0
package/src/cli/events-chains.ts +56 -0
package/src/cli/events-fanout.ts +87 -0
package/src/cli/exit-code.ts +30 -0
package/src/cli/fingerprint-indexes.ts +130 -0
package/src/cli/fingerprint-query.ts +543 -0
package/src/cli/fingerprint-witness.ts +493 -0
package/src/cli/fingerprint.ts +292 -0
package/src/cli/format-compact-json.ts +45 -0
package/src/cli/format-events.ts +77 -0
package/src/cli/format-fingerprint.ts +295 -0
package/src/cli/format-html.ts +503 -0
package/src/cli/format-json.ts +13 -0
package/src/cli/format-policy.ts +95 -0
package/src/cli/format-sarif.ts +186 -0
package/src/cli/format-terminal.ts +153 -0
package/src/cli/index.ts +566 -0
package/src/cli/policy.ts +204 -0
package/src/config/roots-config.ts +302 -0
package/src/deps/cache-versions.ts +74 -0
package/src/deps/canonical-json.ts +27 -0
package/src/deps/dependency-artifact.ts +144 -0
package/src/deps/dependency-cache.ts +262 -0
package/src/deps/dependency-dag.ts +128 -0
package/src/deps/dependency-package-discovery.ts +85 -0
package/src/deps/dependency-pipeline.ts +483 -0
package/src/deps/dependency-projection.ts +211 -0
package/src/deps/dependency-resolver.ts +154 -0
package/src/deps/workspace-dependencies.ts +114 -0
package/src/detectors/capability-query.ts +145 -0
package/src/detectors/confidence.ts +52 -0
package/src/detectors/d1-db-op-in-loop.ts +457 -0
package/src/detectors/d10-self-modifying-loop.ts +114 -0
package/src/detectors/d11-modify-without-get.ts +129 -0
package/src/detectors/d12-dead-integration-event.ts +81 -0
package/src/detectors/d13-cross-app-internal-call.ts +105 -0
package/src/detectors/d14-dead-routine.ts +151 -0
package/src/detectors/d16-obsolete-routine-call.ts +94 -0
package/src/detectors/d17-min-version-drift.ts +157 -0
package/src/detectors/d18-constant-filter-in-loop.ts +151 -0
package/src/detectors/d19-unused-parameter.ts +116 -0
package/src/detectors/d2-event-fanout-in-loop.ts +240 -0
package/src/detectors/d20-unreachable-after-exit.ts +92 -0
package/src/detectors/d21-read-without-load.ts +128 -0
package/src/detectors/d22-flowfield-without-calcfields.ts +168 -0
package/src/detectors/d29-subscriber-modify-on-event-record.ts +163 -0
package/src/detectors/d3-load-state.ts +72 -0
package/src/detectors/d3-missing-setloadfields.ts +234 -0
package/src/detectors/d32-constant-boolean-parameter.ts +185 -0
package/src/detectors/d33-unfiltered-bulk-write.ts +173 -0
package/src/detectors/d34-commit-in-loop.ts +206 -0
package/src/detectors/d35-commit-in-event-subscriber.ts +138 -0
package/src/detectors/d36-late-setloadfields.ts +162 -0
package/src/detectors/d37-validate-without-persist.ts +271 -0
package/src/detectors/d38-subscriber-to-obsolete-event.ts +140 -0
package/src/detectors/d39-record-left-dirty-across-chain.ts +165 -0
package/src/detectors/d4-repeated-lookup-in-loop.ts +128 -0
package/src/detectors/d40-transitive-load-missing.ts +217 -0
package/src/detectors/d41-transitive-filter-loss.ts +200 -0
package/src/detectors/d42-cross-call-wrong-setloadfields.ts +243 -0
package/src/detectors/d43-event-ishandled-skip.ts +257 -0
package/src/detectors/d44-event-multi-subscriber-overlap.ts +223 -0
package/src/detectors/d45-event-transitive-table-exposure.ts +159 -0
package/src/detectors/d5-set-based-opportunity.ts +162 -0
package/src/detectors/d7-recursive-event-expansion.ts +151 -0
package/src/detectors/d8-commit-in-transaction.ts +132 -0
package/src/detectors/d9-transaction-span-summary.ts +107 -0
package/src/detectors/detector-context.ts +121 -0
package/src/detectors/finding-grouping.ts +61 -0
package/src/detectors/path-merge.ts +174 -0
package/src/detectors/registry.ts +176 -0
package/src/detectors/table-display.ts +42 -0
package/src/diff/diff-abi.ts +195 -0
package/src/diff/diff-capabilities.ts +179 -0
package/src/diff/diff-engine.ts +146 -0
package/src/diff/diff-events.ts +323 -0
package/src/diff/diff-identity.ts +73 -0
package/src/diff/diff-indexes.ts +199 -0
package/src/diff/diff-permissions.ts +260 -0
package/src/diff/diff-policy.ts +101 -0
package/src/diff/diff-preflight.ts +66 -0
package/src/diff/diff-renames.ts +104 -0
package/src/diff/diff-schema.ts +232 -0
package/src/diff/format-diff.ts +148 -0
package/src/engine/attribute-parser.ts +50 -0
package/src/engine/capability-cone.ts +531 -0
package/src/engine/combined-graph.ts +357 -0
package/src/engine/control-flow-walker.ts +1317 -0
package/src/engine/dispatch-sites.ts +199 -0
package/src/engine/effect-lattice.ts +81 -0
package/src/engine/entry-points.ts +57 -0
package/src/engine/event-flow.ts +524 -0
package/src/engine/event-relay.ts +92 -0
package/src/engine/op-classification.ts +92 -0
package/src/engine/path-walker.ts +189 -0
package/src/engine/reverse-call-graph.ts +23 -0
package/src/engine/root-classifier-overlay.ts +194 -0
package/src/engine/root-classifier.ts +135 -0
package/src/engine/scc.ts +110 -0
package/src/engine/source-anchor.ts +25 -0
package/src/engine/summary-context.ts +104 -0
package/src/engine/summary-engine.ts +296 -0
package/src/engine/summary-runner.ts +560 -0
package/src/engine/transaction-spans.ts +112 -0
package/src/engine/uncertainty-util.ts +54 -0
package/src/hash.ts +31 -0
package/src/index/attribute-from-node.ts +141 -0
package/src/index/callee-from-node.ts +181 -0
package/src/index/capability/background.ts +90 -0
package/src/index/capability/commit.ts +44 -0
package/src/index/capability/dispatch.ts +164 -0
package/src/index/capability/events.ts +65 -0
package/src/index/capability/extractor.ts +124 -0
package/src/index/capability/file-blob.ts +137 -0
package/src/index/capability/http.ts +159 -0
package/src/index/capability/hyperlink.ts +60 -0
package/src/index/capability/isolated-storage.ts +179 -0
package/src/index/capability/table.ts +113 -0
package/src/index/capability/telemetry.ts +84 -0
package/src/index/capability/ui.ts +55 -0
package/src/index/capability/value-source.ts +202 -0
package/src/index/expression-from-node.ts +117 -0
package/src/index/indexer.ts +102 -0
package/src/index/intraprocedural-body.ts +1467 -0
package/src/index/intraprocedural-ops.ts +253 -0
package/src/index/intraprocedural-refs.ts +188 -0
package/src/index/object-indexer.ts +279 -0
package/src/index/routine-indexer.ts +282 -0
package/src/index/routine-signature.ts +46 -0
package/src/index/variable-indexer.ts +134 -0
package/src/index/variable-initializer-extractor.ts +155 -0
package/src/index/variable-type-normalizer.ts +83 -0
package/src/index.ts +267 -0
package/src/mcp/server.ts +72 -0
package/src/mcp/session.ts +49 -0
package/src/mcp/tools/explain-path.ts +75 -0
package/src/mcp/tools/get-analysis-health.ts +62 -0
package/src/mcp/tools/get-finding.ts +47 -0
package/src/mcp/tools/get-routine-summary.ts +126 -0
package/src/mcp/tools/list-findings.ts +85 -0
package/src/mcp/tools/list-hotspots.ts +78 -0
package/src/mcp/tools/list-rollups.ts +103 -0
package/src/mcp/tools/validators.ts +25 -0
package/src/model/attributes.ts +120 -0
package/src/model/callee.ts +45 -0
package/src/model/capability.ts +187 -0
package/src/model/coverage.ts +85 -0
package/src/model/entities.ts +628 -0
package/src/model/expression.ts +98 -0
package/src/model/finding.ts +110 -0
package/src/model/graph-edge.ts +93 -0
package/src/model/graph.ts +62 -0
package/src/model/identity.ts +81 -0
package/src/model/ids.ts +90 -0
package/src/model/index.ts +13 -0
package/src/model/model.ts +51 -0
package/src/model/permission.ts +76 -0
package/src/model/root-classification.ts +116 -0
package/src/model/stable-identity.ts +102 -0
package/src/model/summary.ts +96 -0
package/src/parser/ast.ts +82 -0
package/src/parser/native/ffi.ts +145 -0
package/src/parser/native/parse-index-pool.ts +148 -0
package/src/parser/native/parse-index-worker.ts +94 -0
package/src/parser/native/wrapper.ts +353 -0
package/src/parser/parser-init.ts +43 -0
package/src/perf/profiler.ts +66 -0
package/src/policy/policy-default.yaml +83 -0
package/src/policy/policy-engine.ts +339 -0
package/src/policy/policy-loader.ts +257 -0
package/src/policy/policy-schema.json +379 -0
package/src/policy/policy-types.ts +81 -0
package/src/policy/predicate-compiler.ts +151 -0
package/src/policy/predicate-evaluator.ts +267 -0
package/src/policy/predicate-fields.ts +439 -0
package/src/projection/actionable-anchor.ts +48 -0
package/src/projection/finding-filters.ts +44 -0
package/src/projection/finding-fingerprint.ts +54 -0
package/src/projection/finding-groups.ts +41 -0
package/src/projection/finding-summary.ts +110 -0
package/src/projection/rollup-findings.ts +105 -0
package/src/providers/discover.ts +88 -0
package/src/providers/external.ts +46 -0
package/src/providers/types.ts +36 -0
package/src/providers/workspace.ts +117 -0
package/src/resolve/call-resolver.ts +117 -0
package/src/resolve/coverage.ts +61 -0
package/src/resolve/event-graph.ts +166 -0
package/src/resolve/implicit-edges.ts +53 -0
package/src/resolve/record-types.ts +36 -0
package/src/resolve/resolver.ts +23 -0
package/src/resolve/semantic-graph.ts +29 -0
package/src/resolve/symbol-table.ts +69 -0
package/src/snapshot/app-snapshot.ts +74 -0
package/src/snapshot/compose.ts +100 -0
package/src/snapshot/derive/callsite-evidence.ts +76 -0
package/src/snapshot/derive/capability-facts.ts +70 -0
package/src/snapshot/derive/contracts.ts +131 -0
package/src/snapshot/derive/coverage.ts +35 -0
package/src/snapshot/derive/event-declarations.ts +140 -0
package/src/snapshot/derive/identity-table.ts +58 -0
package/src/snapshot/derive/inputs.ts +91 -0
package/src/snapshot/derive/operation-evidence.ts +70 -0
package/src/snapshot/derive/permissions.ts +186 -0
package/src/snapshot/derive/root-classifications.ts +56 -0
package/src/snapshot/derive/schema.ts +130 -0
package/src/snapshot/derive/typed-edges.ts +60 -0
package/src/snapshot/derive/workspace-fingerprint.ts +19 -0
package/src/snapshot/deserialize.ts +40 -0
package/src/snapshot/serialize-cbor-gz.ts +12 -0
package/src/snapshot/serialize-cbor.ts +19 -0
package/src/snapshot/serialize-json.ts +22 -0
package/src/snapshot/shard.ts +134 -0
package/src/snapshot/types.ts +181 -0
package/src/symbols/app-manifest.ts +96 -0
package/src/symbols/app-package-zip.ts +50 -0
package/src/symbols/embedded-source-reader.ts +41 -0
package/src/symbols/package-hash.ts +81 -0
package/src/symbols/symbol-reader.ts +101 -0
package/src/symbols/symbol-reference-parser.ts +378 -0
package/src/symbols/symbol-reference-reader.ts +27 -0
package/tsconfig.json +18 -0

package/src/engine/summary-runner.ts ADDED Viewed

@@ -0,0 +1,560 @@
+import { extractCapabilities } from "../index/capability/extractor.ts";
+import type { CapabilityFact, EventExtra } from "../model/capability.ts";
+import type { CoverageReason } from "../model/coverage.ts";
+import type { Routine, VariableSymbol } from "../model/entities.ts";
+import type { Diagnostic } from "../model/finding.ts";
+import type { EventId, RoutineId } from "../model/ids.ts";
+import type { SemanticModel } from "../model/model.ts";
+import type { DbEffect, RecordRoleSummary, RoutineSummary, Uncertainty } from "../model/summary.ts";
+import { makeLap } from "../perf/profiler.ts";
+import { composeInheritedCones } from "./capability-cone.ts";
+import type { CombinedEdge, CombinedGraph } from "./combined-graph.ts";
+import { walkRoutine } from "./control-flow-walker.ts";
+import { effectKeyOf, joinPresence, mergeVia } from "./effect-lattice.ts";
+import { tarjanScc } from "./scc.ts";
+import { type SummaryContext, buildSummaryContext } from "./summary-context.ts";
+import { baseIntraproceduralSummaryCtx } from "./summary-engine.ts";
+import { compareStrings, uncertaintyKey } from "./uncertainty-util.ts";
+const MAX_FIXED_POINT_ITERATIONS = 1000; // cap on fixed-point passes per recursive SCC in `runSummaries`; reaching it pushes a "did not converge" warning diagnostic
+/**
+ * Optional SCC instrumentation, gated on `AL_SEM_SCC_STATS=1`. Cheap counters useful
+ * for deciding whether further fixed-point optimizations (fingerprint caching, worklist
+ * propagation) are worth the complexity. Prints once to stderr at the end of `runSummaries`.
+ *
+ * The environment variable is read once, when this module is evaluated; any value other
+ * than the exact string "1" leaves the instrumentation disabled.
+ */
+const SCC_STATS_ENABLED = process.env.AL_SEM_SCC_STATS === "1";
+export interface SummaryRunOptions { // optional knobs accepted by `runSummaries`
+	/**
+	 * A fixed leaf: a routine whose `summary` is authoritative and must NOT be recomputed.
+	 * Default: any routine that already carries a summary. This covers both pipelines —
+	 * workspace routines and a cold run's current-app routines start with `summary ===
+	 * undefined`, so they are computed; merged-in artifact routines arrive with `summary`
+	 * set, so they are fixed leaves.
+	 *
+	 * When omitted, `runSummaries` falls back to `defaultIsLeaf`. Note that a routine for
+	 * which a custom predicate returns true but whose `summary` is undefined is neither
+	 * recomputed nor pre-seeded, so callers that reach it see it as an unresolved callee.
+	 */
+	isLeaf?: (r: Routine) => boolean;
+}
+/** Default leaf policy: a routine is a fixed leaf exactly when it already carries a summary. */
+function defaultIsLeaf(r: Routine): boolean {
+	const alreadySummarized = r.summary !== undefined;
+	return alreadySummarized;
+}
+/**
+ * Pick the `via` tag that effects inherited across a combined edge of the given kind carry.
+ * Three edge kinds have a dedicated tag; every other kind is reported as plain "inherited".
+ */
+function viaForEdge(
+	kind: CombinedEdge["kind"],
+): "inherited" | "implicit-trigger" | "event-subscriber" | "dynamic" {
+	switch (kind) {
+		case "implicit-trigger":
+			return "implicit-trigger";
+		case "event-dispatch":
+			return "event-subscriber";
+		case "dynamic":
+			return "dynamic";
+		default:
+			return "inherited";
+	}
+}
+/**
+ * Translate an EventSymbol.eventKind into the EventExtra.eventClass discriminant.
+ * "business", "internal" and "trigger" map to their capitalised class; the remaining
+ * kinds ("integration" and "unknown") both map to "Integration".
+ * Phase 1a Family B publisher fix — used by the publish-fact injector in runSummaries.
+ */
+function mapEventKindToClass(
+	k: "integration" | "business" | "trigger" | "internal" | "unknown",
+): EventExtra["eventClass"] {
+	switch (k) {
+		case "business":
+			return "Business";
+		case "internal":
+			return "Internal";
+		case "trigger":
+			return "Trigger";
+		default:
+			return "Integration";
+	}
+}
+/**
+ * Serialize the parts of a summary that the fixed-point loop compares between passes.
+ *
+ * The result is a JSON array of four entries, in this order: the `effectKey:via` tag of
+ * every db effect, the unresolved-calls flag, the key of every uncertainty, and one tuple
+ * per parameter role. The role tuple already carries the may-fact fields (so c1b changes
+ * are detected), the entry-requirement fields (Phase 4 walker) and the exit-state fields
+ * `dirtyAtExit` / `currentLoadedFieldsAtExit` (Phase 6), so later phases cannot silently
+ * regress convergence by forgetting to extend the fingerprint.
+ */
+function summaryFingerprint(s: RoutineSummary): string {
+	const effectTags = s.dbEffects.map((effect) => `${effect.effectKey}:${effect.via}`);
+	const unresolved = s.hasUnresolvedCalls;
+	const uncertaintyKeys = s.uncertainties.map(uncertaintyKey);
+	const roleTuples = s.parameterRoles.map((role) => {
+		// Field lists are flattened to comma-joined strings; non-list values pass through as-is.
+		const requiredAtEntry = role.requiredLoadedFieldsAtEntry;
+		const requiredAtEntryPart = !Array.isArray(requiredAtEntry)
+			? requiredAtEntry
+			: requiredAtEntry.join(",");
+		const loadedAtExit = role.currentLoadedFieldsAtExit;
+		const loadedAtExitPart =
+			typeof loadedAtExit !== "string" ? loadedAtExit.join(",") : loadedAtExit;
+		return [
+			role.parameterIndex,
+			role.loadsFromDbParam,
+			role.initialisesParam,
+			role.persistsCurrentRecord,
+			role.setBasedDbWrites,
+			role.validatesParam,
+			role.copiesIntoParam,
+			role.resetsFiltersOnParam,
+			role.mutatesParam,
+			role.requiresLoadedAtEntry,
+			role.mutatesBeforeLoad,
+			requiredAtEntryPart,
+			role.dirtyAtExit,
+			loadedAtExitPart,
+		];
+	});
+	return JSON.stringify([effectTags, unresolved, uncertaintyKeys, roleTuples]);
+}
+/**
+ * Compose a routine's full summary: start from its base intraprocedural summary, then fold
+ * in every outgoing combined edge's callee summary.
+ *
+ * O(1)-lookup + mutable-accumulator variant — the hot path inside `runSummaries`.
+ *
+ * Old hot-loop shape was:
+ *   acc.dbEffects = mergeDbEffects(acc.dbEffects, calleeEffects);     // new Map + sort
+ *   acc.publishesEvents = [...new Set([...acc, ...callee])].sort();   // new Set + array + sort
+ *   acc.uncertainties = dedupeUncertainties([...acc, ...callee]);     // new Map + sort
+ * — once PER outgoing edge. On large dependency graphs that's a lot of GC pressure.
+ *
+ * New shape: seed local Maps/Sets from the base summary once, fold every callee into them
+ * in place, then materialize sorted/canonical arrays exactly once at the end.
+ *
+ * `baseLookup` optionally returns a precomputed base summary. When set, this function
+ * reuses the precomputed summary's data (skipping a fresh `baseIntraproceduralSummaryCtx`
+ * call). Required for the fixed-point loop on recursive SCCs.
+ *
+ * The function proceeds in four steps:
+ *   1. fold callee dbEffects / uncertainties / unresolved flags over `graph.edgesByFrom`;
+ *   2. add this routine's own to-less uncertainty edges from `ctx.uncertaintyEdgesByFrom`;
+ *   3. join callee exit-effect presence into shallow copies of the base parameter roles,
+ *      for resolved var-to-var argument bindings only;
+ *   4. when the routine has a fully parsed body, overwrite the entry-requirement and
+ *      exit-state role fields with the facts returned by `walkRoutine`.
+ *
+ * @param routine The routine being summarized.
+ * @param lookup Returns the current summary of a callee, or `undefined` when none is
+ *   available; an `undefined` result for an outgoing edge marks the caller as having
+ *   unresolved calls and contributes nothing else.
+ * @param graph Combined graph; only `edgesByFrom` is read here.
+ * @param ctx Precomputed indexes (`routineById`, `uncertaintyEdgesByFrom`,
+ *   `resolvedCallEdgeByCallsite`), also forwarded to the base summary and the walker.
+ * @param baseLookup Optional source of a precomputed base summary; when it is absent or
+ *   returns `undefined`, the base is computed with `baseIntraproceduralSummaryCtx`.
+ * @returns A new summary object holding `routineId`, `dbEffects`, `inRecursiveCycle`,
+ *   `hasUnresolvedCalls`, `uncertainties` and `parameterRoles`. The base summary's arrays
+ *   and role objects are not mutated (roles are shallow-copied before being updated).
+ */
+export function composeRoutineCtx(
+	routine: Routine,
+	lookup: (id: RoutineId) => RoutineSummary | undefined,
+	graph: CombinedGraph,
+	ctx: SummaryContext,
+	baseLookup?: (id: RoutineId) => RoutineSummary | undefined,
+): RoutineSummary {
+	const base = baseLookup?.(routine.id) ?? baseIntraproceduralSummaryCtx(routine, ctx);
+	const calleeOpaque = (id: RoutineId): boolean => ctx.routineById.get(id)?.bodyAvailable === false;
+	// Scalar/lattice accumulators — copied because the base is shared and must not mutate.
+	let hasUnresolvedCalls = base.hasUnresolvedCalls;
+	// Set/Map accumulators seeded from the base. dbEffects key on effectKey so duplicate
+	// inherited entries merge by `via` precedence (matches the old mergeDbEffects).
+	const dbEffectsByKey = new Map<string, DbEffect>();
+	for (const e of base.dbEffects) dbEffectsByKey.set(e.effectKey, e);
+	const uncertaintiesByKey = new Map<string, Uncertainty>();
+	for (const u of base.uncertainties) uncertaintiesByKey.set(uncertaintyKey(u), u);
+	for (const edge of graph.edgesByFrom.get(routine.id) ?? []) {
+		const calleeSummary = lookup(edge.to);
+		if (calleeSummary === undefined) { // no summary for this callee: only flag the caller as unresolved
+			hasUnresolvedCalls = true;
+			continue;
+		}
+		const via = viaForEdge(edge.kind);
+		for (const e of calleeSummary.dbEffects) {
+			// Tag the inherited effect with the edge's via; recompute the key (effectKeyOf
+			// excludes via, so it's stable). Merge into the local map by precedence.
+			const key = effectKeyOf(e);
+			const existing = dbEffectsByKey.get(key);
+			if (existing) {
+				dbEffectsByKey.set(key, { ...existing, via: mergeVia(existing.via, via) }); // keep the first-seen effect, merge only its via tag
+			} else {
+				dbEffectsByKey.set(key, { ...e, effectKey: key, via });
+			}
+		}
+		for (const u of calleeSummary.uncertainties) {
+			const k = uncertaintyKey(u);
+			if (!uncertaintiesByKey.has(k)) uncertaintiesByKey.set(k, u);
+		}
+		if (calleeSummary.hasUnresolvedCalls) hasUnresolvedCalls = true;
+		// interface / dynamic edges, and opaque callees, are confidence-lowering — the CALLER
+		// holds the callsiteId, so the opaque-callee uncertainty is attached here, not on the
+		// callee's own summary.
+		if (edge.kind === "interface" || edge.kind === "dynamic" || calleeOpaque(edge.to)) {
+			if (edge.callsiteId !== undefined) {
+				const u: Uncertainty = { kind: "opaque-callee", callsiteId: edge.callsiteId };
+				const k = uncertaintyKey(u);
+				if (!uncertaintiesByKey.has(k)) uncertaintiesByKey.set(k, u);
+			}
+			hasUnresolvedCalls = true; // set even when the edge carries no callsiteId
+		}
+	}
+	// Uncertainty edges (to-less call sites) on this routine — looked up by `from`
+	// instead of scanned globally, which on big graphs was O(R × U) per iteration.
+	for (const ue of ctx.uncertaintyEdgesByFrom.get(routine.id) ?? []) {
+		const k = uncertaintyKey(ue.uncertainty);
+		if (!uncertaintiesByKey.has(k)) uncertaintiesByKey.set(k, ue.uncertainty);
+		hasUnresolvedCalls = true;
+	}
+	// Materialize deterministic arrays once. dbEffects sort key matches the old
+	// mergeDbEffects: (effectKey, operationId).
+	const dbEffects = [...dbEffectsByKey.values()].sort((a, b) => {
+		if (a.effectKey !== b.effectKey) return compareStrings(a.effectKey, b.effectKey);
+		return compareStrings(a.operationId, b.operationId);
+	});
+	const uncertainties = [...uncertaintiesByKey.values()].sort((a, b) =>
+		compareStrings(uncertaintyKey(a), uncertaintyKey(b)),
+	);
+	// Cross-call exit-effect composition (spec §(c1b)) — compose only when BOTH the
+	// caller-side source and the callee-side parameter are var.
+	// Deep-copy the base parameterRoles so we can mutate them independently each iteration.
+	// NOTE: entry-requirement fields (requiresLoadedAtEntry, mutatesBeforeLoad,
+	// requiredLoadedFieldsAtEntry) are overwritten by the walker below; base values
+	// computed in baseIntraproceduralSummaryCtx are intentionally superseded.
+	const parameterRoles: RecordRoleSummary[] = base.parameterRoles.map((r) => ({ ...r })); // one-level spread copy of each role object
+	for (const cs of routine.features.callSites) {
+		for (const binding of cs.argumentBindings) {
+			if (binding.bindingResolution !== "resolved") continue;
+			if (binding.sourceParameterIndex === undefined) continue;
+			if (!binding.callerSourceParameterIsVar) continue;
+			if (!binding.calleeParameterIsVar) continue;
+			const edge = ctx.resolvedCallEdgeByCallsite.get(cs.id);
+			if (edge?.to === undefined) continue;
+			const calleeRoutine = ctx.routineById.get(edge.to);
+			const calleeRoleSummary = lookup(edge.to);
+			const calleeRole = calleeRoleSummary?.parameterRoles.find(
+				(r) => r.parameterIndex === binding.parameterIndex,
+			);
+			const p = parameterRoles.find((r) => r.parameterIndex === binding.sourceParameterIndex);
+			if (p === undefined) continue;
+			// Opaque guard: any of the three reasons we cannot trust callee facts
+			// (no role, routine missing, body unavailable) takes the unknown branch.
+			// Phase 6's symbol-only projections may produce a callee role with
+			// bodyAvailable=false; this guard keeps such cases on the opaque path.
+			const opaque =
+				calleeRole === undefined ||
+				calleeRoutine === undefined ||
+				calleeRoutine.bodyAvailable === false;
+			if (opaque) {
+				p.persistsCurrentRecord = joinPresence(p.persistsCurrentRecord, "unknown");
+				p.setBasedDbWrites = joinPresence(p.setBasedDbWrites, "unknown");
+				p.validatesParam = joinPresence(p.validatesParam, "unknown");
+				p.copiesIntoParam = joinPresence(p.copiesIntoParam, "unknown");
+				p.resetsFiltersOnParam = joinPresence(p.resetsFiltersOnParam, "unknown");
+			} else {
+				p.persistsCurrentRecord = joinPresence(
+					p.persistsCurrentRecord,
+					calleeRole.persistsCurrentRecord,
+				);
+				p.setBasedDbWrites = joinPresence(p.setBasedDbWrites, calleeRole.setBasedDbWrites);
+				p.validatesParam = joinPresence(p.validatesParam, calleeRole.validatesParam);
+				p.copiesIntoParam = joinPresence(p.copiesIntoParam, calleeRole.copiesIntoParam);
+				p.resetsFiltersOnParam = joinPresence(
+					p.resetsFiltersOnParam,
+					calleeRole.resetsFiltersOnParam,
+				);
+			}
+			p.mutatesParam = joinPresence( // NOTE(review): replaces the copied base value; setBasedDbWrites / resetsFiltersOnParam are not part of this join — confirm intended
+				joinPresence(p.persistsCurrentRecord, p.validatesParam),
+				p.copiesIntoParam,
+			);
+		}
+	}
+	// Path-aware entry-requirement composition (spec §(c1a)).
+	// Run the walker with the current fixed-point `lookup` so callee summaries
+	// are from the current iteration (not the stale routine.summary).
+	// Only run on routines with a body — opaque/parse-incomplete cases stay "unknown"
+	// as set by baseIntraproceduralSummaryCtx.
+	//
+	// Memoization note (I7, deferred — see review): the walker is re-run every
+	// fixed-point iteration for routines in recursive SCCs. Measurement on DC/Cloud
+	// (AL_SEM_SCC_STATS=1: 35 recursive SCCs, maxSize=4, totalIters=65, maxIters=5)
+	// shows redundant walks are bounded at ~30 across the whole workspace — well
+	// below 1% of total walker cost. Phase 6's full statement-tree walker should
+	// re-measure; if cost grows materially, cache walkRoutine output keyed by
+	// (routineId × fingerprint of callee summaries' requires/mutates fields).
+	if (routine.bodyAvailable && !routine.parseIncomplete) {
+		const pathFacts = walkRoutine(routine, ctx, lookup);
+		const pathByIndex = new Map(pathFacts.map((p) => [p.parameterIndex, p]));
+		for (const role of parameterRoles) {
+			const pf = pathByIndex.get(role.parameterIndex);
+			if (pf === undefined) continue; // walker returned no facts for this parameter: keep the values already on the role
+			role.requiresLoadedAtEntry = pf.requiresLoadedAtEntry;
+			role.requiredLoadedFieldsAtEntry = pf.requiredLoadedFieldsAtEntry;
+			role.mutatesBeforeLoad = pf.mutatesBeforeLoad;
+			// Phase 6: walker now emits path-proven dirtyAtExit and
+			// currentLoadedFieldsAtExit. These override the base "unknown"
+			// placeholders set by baseIntraproceduralSummaryCtx.
+			role.dirtyAtExit = pf.dirtyAtExit;
+			role.currentLoadedFieldsAtExit = pf.currentLoadedFieldsAtExit;
+		}
+	}
+	return {
+		routineId: routine.id,
+		dbEffects,
+		inRecursiveCycle: base.inRecursiveCycle, // copied from the base unchanged; runSummaries forces it to true for recursive-SCC members
+		hasUnresolvedCalls,
+		uncertainties,
+		parameterRoles,
+	};
+}
+/**
+ * Model-based convenience wrapper around `composeRoutineCtx`, retained for callers outside
+ * the runner (and for the older spec text referenced in docs).
+ *
+ * A fresh summary context is built from `model` and `graph` on every call, which is fine
+ * for one-off use but NOT for hot loops — the runner calls `composeRoutineCtx` directly
+ * with a shared context instead. No precomputed base lookup is supplied, so the base
+ * intraprocedural summary is computed inside the call.
+ */
+export function composeRoutine(
+	routine: Routine,
+	lookup: (id: RoutineId) => RoutineSummary | undefined,
+	graph: CombinedGraph,
+	model: SemanticModel,
+): RoutineSummary {
+	const oneShotCtx = buildSummaryContext(model, graph);
+	return composeRoutineCtx(routine, lookup, graph, oneShotCtx);
+}
+/**
+ * Compute a RoutineSummary for every NON-leaf routine and mutate `routine.summary` in place.
+ * Fixed-leaf routines (see `SummaryRunOptions.isLeaf`) keep their existing `summary` and are
+ * pre-seeded into the lookup map so callers compose against them. Walks the SCC condensation
+ * bottom-up; recursive SCCs get a finite monotone fixed-point.
+ *
+ * Stages, in order:
+ *   1. build the shared summary context and precompute base summaries for non-leaf routines;
+ *   2. compose summaries per SCC (single pass for non-recursive SCCs, snapshot-based
+ *      fixed-point for recursive ones, capped at `MAX_FIXED_POINT_ITERATIONS` passes);
+ *   3. attach direct capability facts (including injected publish facts) and baseline coverage;
+ *   4. attach inherited capability cones from `composeInheritedCones`;
+ *   5. write the results back onto the non-leaf routines.
+ *
+ * @param model Semantic model; `model.routines` is iterated and each non-leaf routine's
+ *   `summary` is overwritten (with `undefined` when no summary was produced for it).
+ * @param graph Combined graph used for the context, the SCC decomposition and composition.
+ * @param diagnostics Receives a warning when a recursive SCC is still changing after the
+ *   iteration cap; it is also forwarded to `composeInheritedCones`.
+ * @param options Optional leaf policy; defaults to `defaultIsLeaf`.
+ */
+export function runSummaries(
+	model: SemanticModel,
+	graph: CombinedGraph,
+	diagnostics: Diagnostic[],
+	options?: SummaryRunOptions,
+): void {
+	const isLeaf = options?.isLeaf ?? defaultIsLeaf;
+	const lap = makeLap("summary:");
+	// Build O(1) lookup indexes once. This replaces ~50G+ linear scans on Base App-sized
+	// dependencies — the cold-run dominant cost before the refactor.
+	const ctx = buildSummaryContext(model, graph);
+	lap("buildSummaryContext");
+	// Precompute base intraprocedural summaries ONCE per non-leaf routine. For non-recursive
+	// SCCs this is the same as before; for recursive SCCs it eliminates recomputing the base
+	// every fixed-point iteration (was a significant cost — base touches every record op,
+	// every call site, and computes parameterRoles, all of which never change between iters).
+	const baseSummaries = new Map<RoutineId, RoutineSummary>();
+	for (const r of model.routines) {
+		if (isLeaf(r)) continue;
+		baseSummaries.set(r.id, baseIntraproceduralSummaryCtx(r, ctx));
+	}
+	const baseLookup = (id: RoutineId): RoutineSummary | undefined => baseSummaries.get(id);
+	lap(`base-precompute (${baseSummaries.size} routines)`);
+	const final = new Map<RoutineId, RoutineSummary>();
+	// Pre-seed fixed leaves so composition can look them up; they are never recomputed.
+	for (const r of model.routines) {
+		if (isLeaf(r) && r.summary !== undefined) final.set(r.id, r.summary);
+	}
+	const { sccs } = tarjanScc(graph);
+	lap(`tarjanScc (${sccs.length} sccs)`);
+	// Instrumentation counters; only updated and reported when SCC_STATS_ENABLED is set.
+	let nonRecursiveSccs = 0;
+	let recursiveSccs = 0;
+	let maxSccSize = 0;
+	let totalSccMembers = 0;
+	let totalIterations = 0;
+	let maxIterations = 0;
+	let fingerprintCalls = 0;
+	for (const scc of sccs) {
+		if (SCC_STATS_ENABLED) {
+			if (scc.recursive) recursiveSccs++;
+			else nonRecursiveSccs++;
+			if (scc.members.length > maxSccSize) maxSccSize = scc.members.length;
+			totalSccMembers += scc.members.length;
+		}
+		if (!scc.recursive) {
+			// Only the first member is composed for a non-recursive SCC.
+			const id = scc.members[0];
+			const routine = id !== undefined ? ctx.routineById.get(id) : undefined;
+			if (id === undefined || routine === undefined) continue;
+			if (isLeaf(routine)) continue; // fixed leaf — already in `final`
+			final.set(
+				id,
+				composeRoutineCtx(routine, (x) => final.get(x), graph, ctx, baseLookup),
+			);
+			continue;
+		}
+		// Recursive SCC — finite monotone fixed-point with snapshot iteration.
+		const inProgress = new Map<RoutineId, RoutineSummary>();
+		for (const id of scc.members) {
+			const routine = ctx.routineById.get(id);
+			if (routine === undefined) continue;
+			if (isLeaf(routine)) continue;
+			const base = baseSummaries.get(id);
+			if (base !== undefined) inProgress.set(id, base);
+		}
+		let iterations = 0;
+		let changed = true;
+		while (changed) {
+			changed = false;
+			iterations++;
+			// Every member composes against the PREVIOUS pass's summaries (the snapshot),
+			// falling back to already-finalized summaries for callees outside this SCC.
+			const snapshot = new Map(inProgress);
+			for (const id of scc.members) {
+				const routine = ctx.routineById.get(id);
+				if (routine === undefined || isLeaf(routine)) continue;
+				const next = composeRoutineCtx(
+					routine,
+					(x) => snapshot.get(x) ?? final.get(x),
+					graph,
+					ctx,
+					baseLookup,
+				);
+				const prev = inProgress.get(id);
+				if (prev === undefined || summaryFingerprint(prev) !== summaryFingerprint(next)) {
+					changed = true;
+				}
+				if (SCC_STATS_ENABLED) fingerprintCalls += prev === undefined ? 1 : 2;
+				inProgress.set(id, next);
+			}
+			// Warn only when the cap is reached while summaries are STILL changing. A pass that
+			// converges exactly on the capped iteration is a successful convergence and must
+			// not be reported as a failure.
+			if (changed && iterations >= MAX_FIXED_POINT_ITERATIONS) {
+				diagnostics.push({
+					severity: "warning",
+					stage: "summarize",
+					message: `Summary fixed-point did not converge for SCC [${scc.members.join(", ")}]`,
+				});
+				break;
+			}
+		}
+		if (SCC_STATS_ENABLED) {
+			totalIterations += iterations;
+			if (iterations > maxIterations) maxIterations = iterations;
+		}
+		// Publish the SCC's results, flagging every member as part of a recursive cycle.
+		for (const id of scc.members) {
+			const summary = inProgress.get(id);
+			if (summary !== undefined) final.set(id, { ...summary, inRecursiveCycle: true });
+		}
+	}
+	lap("scc-compose");
+	// Phase 0b-β: attach direct capability facts and baseline coverage to each non-leaf
+	// routine's final summary. Capability extraction is per-routine (intrinsic, not
+	// inherited) — it runs once here, after the fixed-point has converged, so every
+	// routine gets its own direct facts attached exactly once.
+	//
+	// capabilityFactsInherited stays [] and coverage.inheritedStatus stays "unknown"
+	// until Tasks 21-22 (coverage composer + inherited composition).
+	//
+	// Engine-never-throws: extractCapabilities is expected to catch its own errors.
+	// NOTE(review): there is no outer try/catch in this loop, so it relies entirely on
+	// extractCapabilities honoring that contract — confirm, or add a guard here.
+	//
+	// Index publisher events by routine ONCE. The per-routine publisher-fact injection below
+	// otherwise filtered the entire eventGraph.events array per routine — O(routines × events),
+	// which on Base App (84k non-leaf routines × thousands of platform events) is a multi-second
+	// quadratic. This map makes it O(routines + events). Insertion order matches eventGraph.events
+	// order, so injected-fact order is unchanged.
+	const eventsForPublisherIndex = model.eventGraph?.events ?? [];
+	const publisherEventsByRoutine = new Map<RoutineId, typeof eventsForPublisherIndex>();
+	for (const evt of eventsForPublisherIndex) {
+		if (evt.publisherRoutineId === undefined) continue;
+		const list = publisherEventsByRoutine.get(evt.publisherRoutineId);
+		if (list) list.push(evt);
+		else publisherEventsByRoutine.set(evt.publisherRoutineId, [evt]);
+	}
+	for (const routine of model.routines) {
+		if (isLeaf(routine)) continue;
+		const summary = final.get(routine.id);
+		if (summary === undefined) continue;
+		// Build a minimal ExtractionContext — the orchestrator rebuilds variables
+		// internally, so ctx.variables here is just a safe placeholder.
+		const dispatchCtx = {
+			routine,
+			variables: new Map<string, VariableSymbol>(),
+			receiverTypeOf: (_name: string) => "unknown",
+			reportDiagnostic: (_d: Diagnostic) => {},
+			reportCoverageGap: (_r: CoverageReason, _t?: string) => {},
+		};
+		let { facts, status, reasons } = extractCapabilities(routine, dispatchCtx);
+		// Opaque / parse-incomplete routines: skip extraction (no body to extract from).
+		// extractCapabilities already handles this internally but we reinforce intent.
+		if (!routine.bodyAvailable || routine.parseIncomplete) {
+			facts = [];
+			status = "unknown";
+			reasons = routine.parseIncomplete ? ["parse-incomplete"] : ["opaque-dependency"];
+		}
+		// Phase 1a Family B — publisher-fact injection.
+		//
+		// The events-family extractor (src/index/capability/events.ts) runs at
+		// routine-indexing time and has no access to the resolved event graph, so it
+		// intentionally emits SUBSCRIBE facts only. Publisher routines ([IntegrationEvent]
+		// / [BusinessEvent] / [InternalEvent]) therefore have no direct publish facts, which
+		// caused publishesEventsOf to return [] for publisher routines — direct publish
+		// facts must be present so callers' inherited cones surface the event.
+		//
+		// Here, in the summary engine where model.eventGraph is already resolved, we look up
+		// every EventSymbol whose publisherRoutineId === routine.id and inject one direct
+		// publish CapabilityFact per event. The Task-22 inherited-facts BFS (below) then
+		// naturally propagates these facts to callers via direct-call edges, satisfying the
+		// publishesEventsOf invariant on publisher routines.
+		//
+		// Injection runs BEFORE final.set so the facts are present when the BFS reads
+		// capabilityFactsDirect for each routine.
+		const publisherEvents = publisherEventsByRoutine.get(routine.id) ?? [];
+		for (const evt of publisherEvents) {
+			const extra: EventExtra = {
+				kind: "event",
+				eventClass: mapEventKindToClass(evt.eventKind),
+			};
+			const publishFact: CapabilityFact = {
+				subject: routine.id,
+				op: "publish",
+				resourceKind: "event",
+				resourceId: evt.id as EventId,
+				confidence: "static",
+				provenance: "direct",
+				via: "self",
+				extra,
+			};
+			// Copy rather than push, so the array returned by extractCapabilities is not mutated.
+			facts = [...facts, publishFact];
+		}
+		final.set(routine.id, {
+			...summary,
+			capabilityFactsDirect: facts,
+			capabilityFactsInherited: [],
+			coverage: {
+				subject: routine.id,
+				directStatus: status,
+				inheritedStatus: "unknown",
+				reasons,
+				unknownTargets: [],
+			},
+		});
+	}
+	lap("task17-capability-extract");
+	const cones = composeInheritedCones(model, final, isLeaf, diagnostics);
+	for (const routine of model.routines) {
+		if (isLeaf(routine)) continue;
+		const summary = final.get(routine.id);
+		if (summary === undefined) continue;
+		const cone = cones.get(routine.id);
+		if (cone === undefined) continue; // composition failed → keep task-17 baseline coverage + []
+		final.set(routine.id, {
+			...summary,
+			capabilityFactsInherited: cone.inherited,
+			coverage: cone.coverage,
+		});
+	}
+	lap("task22-inherited-bfs");
+	// Write-back. Under the default leaf policy this assignment is what turns a routine into
+	// a leaf, so `isLeaf` is consulted before each assignment and never after it.
+	for (const routine of model.routines) {
+		if (isLeaf(routine)) continue; // leaves keep their authoritative summary
+		routine.summary = final.get(routine.id);
+	}
+	lap("writeback");
+	if (SCC_STATS_ENABLED) {
+		process.stderr.write(
+			`al-sem SCC stats: sccs=${nonRecursiveSccs + recursiveSccs}` +
+				` (recursive=${recursiveSccs} non-recursive=${nonRecursiveSccs})` +
+				` maxSize=${maxSccSize} totalMembers=${totalSccMembers}` +
+				` totalIterations=${totalIterations} maxIterations=${maxIterations}` +
+				` fingerprintCalls=${fingerprintCalls}\n`,
+		);
+	}
+}
+/**
+ * Phase 2b-compatible entry point: run summaries with the default leaf policy.
+ *
+ * Forwards straight to `runSummaries` without an options argument, so the leaf predicate
+ * is `defaultIsLeaf` (a routine that already carries a summary is left untouched).
+ *
+ * @param model Semantic model whose non-leaf routines get their `summary` assigned.
+ * @param graph Combined graph passed through to `runSummaries`.
+ * @param diagnostics Sink for diagnostics produced while summarizing.
+ */
+export function computeSummaries(
+	model: SemanticModel,
+	graph: CombinedGraph,
+	diagnostics: Diagnostic[],
+): void {
+	runSummaries(model, graph, diagnostics);
+}

package/src/engine/transaction-spans.ts ADDED Viewed

@@ -0,0 +1,112 @@
+import {
+	publishesEventsOf,
+	reachableCoverage,
+	writesTablesOf,
+} from "../detectors/capability-query.ts";
+import { roleOf } from "../model/entities.ts";
+import type { EventId, OperationId, RoutineId, TableId } from "../model/ids.ts";
+import type { SemanticModel } from "../model/model.ts";
+import type { CombinedGraph } from "./combined-graph.ts";
+import type { ReverseCallGraph } from "./reverse-call-graph.ts";
+export interface TransactionSpan {
+	/**
+	 * The Commit operation that bounds the span. `computeTransactionSpans` emits
+	 * one span per Commit operation site, so two Commits in the same routine
+	 * yield two spans that differ only in this field.
+	 */
+	commitOperationId: OperationId;
+	/** The routine containing the bounding Commit; the backward caller walk starts here. */
+	commitRoutineId: RoutineId;
+	/**
+	 * All routines reachable backward from commitRoutineId up to another commit or root.
+	 * Includes commitRoutineId itself. The walk is additionally cut off at a fixed
+	 * depth bound, so very deep caller chains may be truncated. Sorted.
+	 */
+	routinesInSpan: RoutineId[];
+	/** Union of tables written by any routine in the span (from writesTablesOf — sorted+deduped). */
+	writesTables: TableId[];
+	/** Union of events published by any routine in the span (from publishesEventsOf — sorted+deduped). */
+	publishesEvents: EventId[];
+	/**
+	 * Entry roots — routines in the span for which the reverse call graph records
+	 * no callers at all. Sorted.
+	 *
+	 * NOTE(review): a routine where the walk stopped early (another committing
+	 * routine, or the depth bound) is NOT listed here unless it also has no
+	 * recorded callers, even though none of its callers are inside the span.
+	 */
+	spanRoots: RoutineId[];
+	/**
+	 * True iff EVERY routine in `routinesInSpan` has a defined summary AND
+	 * `reachableCoverage(summary) === "complete"`. False when at least
+	 * one routine has no summary, or its inherited cone is partial / unknown —
+	 * which means the aggregated `writesTables` and `publishesEvents` sets may
+	 * be an under-approximation of what this span actually touches.
+	 *
+	 * Replaces the legacy per-routine `summary.writesTables === "unknown"`
+	 * probe D9 used to do. The signal is coarser (overall coverage, not
+	 * per-family) because Phase 1a's `reachableCoverage` is per-routine
+	 * overall. When per-family coverage roll-up lands (spec §3.7
+	 * FingerprintCoverage.perFamily), this field upgrades cleanly to a
+	 * `writesCoverage: CoverageStatus`.
+	 */
+	coverageComplete: boolean;
+}
+/** Maximum number of caller hops followed backward from a committing routine. */
+const MAX_DEPTH = 50;
+/**
+ * Compute transaction spans. For each primary-app routine that contains a Commit, walk
+ * callers backward to find every routine that participates in the transaction. The walk
+ * stops at any routine that itself commits (that's a prior span's domain) or at the depth
+ * bound. Each Commit operation yields one TransactionSpan.
+ *
+ * The backward walk and the aggregated sets depend only on the committing routine, not on
+ * the individual Commit operation, so they are computed once per routine and then stamped
+ * onto one span per Commit operation. Every span receives its own array copies.
+ *
+ * @param model - Semantic model; its `routines` supply ids, operation sites and summaries.
+ * @param _graph - Unused here; kept so the call signature stays stable for callers.
+ * @param reverse - Reverse call graph: `reverse.get(id)` yields the incoming call edges of
+ *   `id`, each exposing the calling routine as `from`.
+ * @returns One span per Commit operation, grouped by committing routine in the order the
+ *   routines appear in `model.routines`, and within a routine in operation-site order.
+ */
+export function computeTransactionSpans(
+	model: SemanticModel,
+	_graph: CombinedGraph,
+	reverse: ReverseCallGraph,
+): TransactionSpan[] {
+	const routineById = new Map(model.routines.map((r) => [r.id, r]));
+	const spans: TransactionSpan[] = [];
+	// Build: routineId → list of Commit operationIds in that routine (from operationSites
+	// with kind === "commit"). We only care about primary-app routines.
+	const commitsByRoutine = new Map<RoutineId, OperationId[]>();
+	for (const r of model.routines) {
+		if (roleOf(r) !== "primary") continue;
+		const commitOps = r.features.operationSites
+			.filter((os) => os.kind === "commit")
+			.map((os) => os.id);
+		if (commitOps.length > 0) commitsByRoutine.set(r.id, commitOps);
+	}
+	for (const [commitRoutineId, commitOps] of commitsByRoutine) {
+		// Breadth-first walk over callers. Routines are marked when first enqueued, so
+		// each one enters the queue at most once; FIFO order guarantees that first
+		// discovery happens at the routine's minimum depth. A head cursor replaces
+		// Array.prototype.shift, which is linear per call.
+		const visited = new Set<RoutineId>([commitRoutineId]);
+		const queue: { id: RoutineId; depth: number }[] = [{ id: commitRoutineId, depth: 0 }];
+		for (let head = 0; head < queue.length; head++) {
+			const item = queue[head];
+			if (item === undefined) break;
+			const { id, depth } = item;
+			// Routines at the depth bound stay in the span but are not expanded further.
+			if (depth >= MAX_DEPTH) continue;
+			// Don't walk past another committing routine (prior span bounds the trace).
+			if (id !== commitRoutineId && commitsByRoutine.has(id)) continue;
+			for (const caller of reverse.get(id) ?? []) {
+				if (visited.has(caller.from)) continue;
+				visited.add(caller.from);
+				queue.push({ id: caller.from, depth: depth + 1 });
+			}
+		}
+		// Aggregate capability facts over every routine in the span.
+		const writes = new Set<TableId>();
+		const events = new Set<EventId>();
+		let coverageComplete = true;
+		for (const rid of visited) {
+			const summary = routineById.get(rid)?.summary;
+			if (summary === undefined) {
+				// Unknown routine or missing summary: the aggregate may under-approximate.
+				coverageComplete = false;
+				continue;
+			}
+			for (const t of writesTablesOf(summary)) writes.add(t);
+			for (const e of publishesEventsOf(summary)) events.add(e);
+			if (reachableCoverage(summary) !== "complete") coverageComplete = false;
+		}
+		const routinesInSpan = [...visited].sort();
+		const writesTables = [...writes].sort();
+		const publishesEvents = [...events].sort();
+		// Roots are span routines with no recorded callers at all in the reverse graph.
+		const spanRoots = [...visited]
+			.filter((rid) => (reverse.get(rid) ?? []).length === 0)
+			.sort();
+		for (const commitOperationId of commitOps) {
+			spans.push({
+				commitOperationId,
+				commitRoutineId,
+				// Fresh copies so spans never share mutable arrays.
+				routinesInSpan: [...routinesInSpan],
+				writesTables: [...writesTables],
+				publishesEvents: [...publishesEvents],
+				spanRoots: [...spanRoots],
+				coverageComplete,
+			});
+		}
+	}
+	return spans;
+}