npm - al-sem - Versions diffs - 0.0.1 - Mend

al-sem 0.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (231) hide show

package/LICENSE +21 -0
package/README.md +361 -0
package/package.json +64 -0
package/scripts/d40-diff.ts +44 -0
package/scripts/fetch-native-parser.ts +179 -0
package/scripts/precision-sample.ts +99 -0
package/scripts/precision-study.ts +42 -0
package/scripts/precision-tabulate.ts +52 -0
package/src/cli/baseline.ts +31 -0
package/src/cli/diff.ts +199 -0
package/src/cli/events-chains.ts +56 -0
package/src/cli/events-fanout.ts +87 -0
package/src/cli/exit-code.ts +30 -0
package/src/cli/fingerprint-indexes.ts +130 -0
package/src/cli/fingerprint-query.ts +543 -0
package/src/cli/fingerprint-witness.ts +493 -0
package/src/cli/fingerprint.ts +292 -0
package/src/cli/format-compact-json.ts +45 -0
package/src/cli/format-events.ts +77 -0
package/src/cli/format-fingerprint.ts +295 -0
package/src/cli/format-html.ts +503 -0
package/src/cli/format-json.ts +13 -0
package/src/cli/format-policy.ts +95 -0
package/src/cli/format-sarif.ts +186 -0
package/src/cli/format-terminal.ts +153 -0
package/src/cli/index.ts +566 -0
package/src/cli/policy.ts +204 -0
package/src/config/roots-config.ts +302 -0
package/src/deps/cache-versions.ts +74 -0
package/src/deps/canonical-json.ts +27 -0
package/src/deps/dependency-artifact.ts +144 -0
package/src/deps/dependency-cache.ts +262 -0
package/src/deps/dependency-dag.ts +128 -0
package/src/deps/dependency-package-discovery.ts +85 -0
package/src/deps/dependency-pipeline.ts +483 -0
package/src/deps/dependency-projection.ts +211 -0
package/src/deps/dependency-resolver.ts +154 -0
package/src/deps/workspace-dependencies.ts +114 -0
package/src/detectors/capability-query.ts +145 -0
package/src/detectors/confidence.ts +52 -0
package/src/detectors/d1-db-op-in-loop.ts +457 -0
package/src/detectors/d10-self-modifying-loop.ts +114 -0
package/src/detectors/d11-modify-without-get.ts +129 -0
package/src/detectors/d12-dead-integration-event.ts +81 -0
package/src/detectors/d13-cross-app-internal-call.ts +105 -0
package/src/detectors/d14-dead-routine.ts +151 -0
package/src/detectors/d16-obsolete-routine-call.ts +94 -0
package/src/detectors/d17-min-version-drift.ts +157 -0
package/src/detectors/d18-constant-filter-in-loop.ts +151 -0
package/src/detectors/d19-unused-parameter.ts +116 -0
package/src/detectors/d2-event-fanout-in-loop.ts +240 -0
package/src/detectors/d20-unreachable-after-exit.ts +92 -0
package/src/detectors/d21-read-without-load.ts +128 -0
package/src/detectors/d22-flowfield-without-calcfields.ts +168 -0
package/src/detectors/d29-subscriber-modify-on-event-record.ts +163 -0
package/src/detectors/d3-load-state.ts +72 -0
package/src/detectors/d3-missing-setloadfields.ts +234 -0
package/src/detectors/d32-constant-boolean-parameter.ts +185 -0
package/src/detectors/d33-unfiltered-bulk-write.ts +173 -0
package/src/detectors/d34-commit-in-loop.ts +206 -0
package/src/detectors/d35-commit-in-event-subscriber.ts +138 -0
package/src/detectors/d36-late-setloadfields.ts +162 -0
package/src/detectors/d37-validate-without-persist.ts +271 -0
package/src/detectors/d38-subscriber-to-obsolete-event.ts +140 -0
package/src/detectors/d39-record-left-dirty-across-chain.ts +165 -0
package/src/detectors/d4-repeated-lookup-in-loop.ts +128 -0
package/src/detectors/d40-transitive-load-missing.ts +217 -0
package/src/detectors/d41-transitive-filter-loss.ts +200 -0
package/src/detectors/d42-cross-call-wrong-setloadfields.ts +243 -0
package/src/detectors/d43-event-ishandled-skip.ts +257 -0
package/src/detectors/d44-event-multi-subscriber-overlap.ts +223 -0
package/src/detectors/d45-event-transitive-table-exposure.ts +159 -0
package/src/detectors/d5-set-based-opportunity.ts +162 -0
package/src/detectors/d7-recursive-event-expansion.ts +151 -0
package/src/detectors/d8-commit-in-transaction.ts +132 -0
package/src/detectors/d9-transaction-span-summary.ts +107 -0
package/src/detectors/detector-context.ts +121 -0
package/src/detectors/finding-grouping.ts +61 -0
package/src/detectors/path-merge.ts +174 -0
package/src/detectors/registry.ts +176 -0
package/src/detectors/table-display.ts +42 -0
package/src/diff/diff-abi.ts +195 -0
package/src/diff/diff-capabilities.ts +179 -0
package/src/diff/diff-engine.ts +146 -0
package/src/diff/diff-events.ts +323 -0
package/src/diff/diff-identity.ts +73 -0
package/src/diff/diff-indexes.ts +199 -0
package/src/diff/diff-permissions.ts +260 -0
package/src/diff/diff-policy.ts +101 -0
package/src/diff/diff-preflight.ts +66 -0
package/src/diff/diff-renames.ts +104 -0
package/src/diff/diff-schema.ts +232 -0
package/src/diff/format-diff.ts +148 -0
package/src/engine/attribute-parser.ts +50 -0
package/src/engine/capability-cone.ts +531 -0
package/src/engine/combined-graph.ts +357 -0
package/src/engine/control-flow-walker.ts +1317 -0
package/src/engine/dispatch-sites.ts +199 -0
package/src/engine/effect-lattice.ts +81 -0
package/src/engine/entry-points.ts +57 -0
package/src/engine/event-flow.ts +524 -0
package/src/engine/event-relay.ts +92 -0
package/src/engine/op-classification.ts +92 -0
package/src/engine/path-walker.ts +189 -0
package/src/engine/reverse-call-graph.ts +23 -0
package/src/engine/root-classifier-overlay.ts +194 -0
package/src/engine/root-classifier.ts +135 -0
package/src/engine/scc.ts +110 -0
package/src/engine/source-anchor.ts +25 -0
package/src/engine/summary-context.ts +104 -0
package/src/engine/summary-engine.ts +296 -0
package/src/engine/summary-runner.ts +560 -0
package/src/engine/transaction-spans.ts +112 -0
package/src/engine/uncertainty-util.ts +54 -0
package/src/hash.ts +31 -0
package/src/index/attribute-from-node.ts +141 -0
package/src/index/callee-from-node.ts +181 -0
package/src/index/capability/background.ts +90 -0
package/src/index/capability/commit.ts +44 -0
package/src/index/capability/dispatch.ts +164 -0
package/src/index/capability/events.ts +65 -0
package/src/index/capability/extractor.ts +124 -0
package/src/index/capability/file-blob.ts +137 -0
package/src/index/capability/http.ts +159 -0
package/src/index/capability/hyperlink.ts +60 -0
package/src/index/capability/isolated-storage.ts +179 -0
package/src/index/capability/table.ts +113 -0
package/src/index/capability/telemetry.ts +84 -0
package/src/index/capability/ui.ts +55 -0
package/src/index/capability/value-source.ts +202 -0
package/src/index/expression-from-node.ts +117 -0
package/src/index/indexer.ts +102 -0
package/src/index/intraprocedural-body.ts +1467 -0
package/src/index/intraprocedural-ops.ts +253 -0
package/src/index/intraprocedural-refs.ts +188 -0
package/src/index/object-indexer.ts +279 -0
package/src/index/routine-indexer.ts +282 -0
package/src/index/routine-signature.ts +46 -0
package/src/index/variable-indexer.ts +134 -0
package/src/index/variable-initializer-extractor.ts +155 -0
package/src/index/variable-type-normalizer.ts +83 -0
package/src/index.ts +267 -0
package/src/mcp/server.ts +72 -0
package/src/mcp/session.ts +49 -0
package/src/mcp/tools/explain-path.ts +75 -0
package/src/mcp/tools/get-analysis-health.ts +62 -0
package/src/mcp/tools/get-finding.ts +47 -0
package/src/mcp/tools/get-routine-summary.ts +126 -0
package/src/mcp/tools/list-findings.ts +85 -0
package/src/mcp/tools/list-hotspots.ts +78 -0
package/src/mcp/tools/list-rollups.ts +103 -0
package/src/mcp/tools/validators.ts +25 -0
package/src/model/attributes.ts +120 -0
package/src/model/callee.ts +45 -0
package/src/model/capability.ts +187 -0
package/src/model/coverage.ts +85 -0
package/src/model/entities.ts +628 -0
package/src/model/expression.ts +98 -0
package/src/model/finding.ts +110 -0
package/src/model/graph-edge.ts +93 -0
package/src/model/graph.ts +62 -0
package/src/model/identity.ts +81 -0
package/src/model/ids.ts +90 -0
package/src/model/index.ts +13 -0
package/src/model/model.ts +51 -0
package/src/model/permission.ts +76 -0
package/src/model/root-classification.ts +116 -0
package/src/model/stable-identity.ts +102 -0
package/src/model/summary.ts +96 -0
package/src/parser/ast.ts +82 -0
package/src/parser/native/ffi.ts +145 -0
package/src/parser/native/parse-index-pool.ts +148 -0
package/src/parser/native/parse-index-worker.ts +94 -0
package/src/parser/native/wrapper.ts +353 -0
package/src/parser/parser-init.ts +43 -0
package/src/perf/profiler.ts +66 -0
package/src/policy/policy-default.yaml +83 -0
package/src/policy/policy-engine.ts +339 -0
package/src/policy/policy-loader.ts +257 -0
package/src/policy/policy-schema.json +379 -0
package/src/policy/policy-types.ts +81 -0
package/src/policy/predicate-compiler.ts +151 -0
package/src/policy/predicate-evaluator.ts +267 -0
package/src/policy/predicate-fields.ts +439 -0
package/src/projection/actionable-anchor.ts +48 -0
package/src/projection/finding-filters.ts +44 -0
package/src/projection/finding-fingerprint.ts +54 -0
package/src/projection/finding-groups.ts +41 -0
package/src/projection/finding-summary.ts +110 -0
package/src/projection/rollup-findings.ts +105 -0
package/src/providers/discover.ts +88 -0
package/src/providers/external.ts +46 -0
package/src/providers/types.ts +36 -0
package/src/providers/workspace.ts +117 -0
package/src/resolve/call-resolver.ts +117 -0
package/src/resolve/coverage.ts +61 -0
package/src/resolve/event-graph.ts +166 -0
package/src/resolve/implicit-edges.ts +53 -0
package/src/resolve/record-types.ts +36 -0
package/src/resolve/resolver.ts +23 -0
package/src/resolve/semantic-graph.ts +29 -0
package/src/resolve/symbol-table.ts +69 -0
package/src/snapshot/app-snapshot.ts +74 -0
package/src/snapshot/compose.ts +100 -0
package/src/snapshot/derive/callsite-evidence.ts +76 -0
package/src/snapshot/derive/capability-facts.ts +70 -0
package/src/snapshot/derive/contracts.ts +131 -0
package/src/snapshot/derive/coverage.ts +35 -0
package/src/snapshot/derive/event-declarations.ts +140 -0
package/src/snapshot/derive/identity-table.ts +58 -0
package/src/snapshot/derive/inputs.ts +91 -0
package/src/snapshot/derive/operation-evidence.ts +70 -0
package/src/snapshot/derive/permissions.ts +186 -0
package/src/snapshot/derive/root-classifications.ts +56 -0
package/src/snapshot/derive/schema.ts +130 -0
package/src/snapshot/derive/typed-edges.ts +60 -0
package/src/snapshot/derive/workspace-fingerprint.ts +19 -0
package/src/snapshot/deserialize.ts +40 -0
package/src/snapshot/serialize-cbor-gz.ts +12 -0
package/src/snapshot/serialize-cbor.ts +19 -0
package/src/snapshot/serialize-json.ts +22 -0
package/src/snapshot/shard.ts +134 -0
package/src/snapshot/types.ts +181 -0
package/src/symbols/app-manifest.ts +96 -0
package/src/symbols/app-package-zip.ts +50 -0
package/src/symbols/embedded-source-reader.ts +41 -0
package/src/symbols/package-hash.ts +81 -0
package/src/symbols/symbol-reader.ts +101 -0
package/src/symbols/symbol-reference-parser.ts +378 -0
package/src/symbols/symbol-reference-reader.ts +27 -0
package/tsconfig.json +18 -0

package/src/detectors/d4-repeated-lookup-in-loop.ts ADDED Viewed

@@ -0,0 +1,128 @@
+import type { CombinedGraph } from "../engine/combined-graph.ts";
+import { compareStrings } from "../engine/uncertainty-util.ts";
+import { roleOf } from "../model/entities.ts";
+import type { RecordOperation } from "../model/entities.ts";
+import { isStringLikeLiteral } from "../model/expression.ts";
+import type { DetectorStats, EvidenceStep, Finding } from "../model/finding.ts";
+import type { SemanticModel } from "../model/model.ts";
+import { fingerprintOf } from "../projection/finding-fingerprint.ts";
+import { toConfidence } from "./confidence.ts";
+import type { DetectorContext } from "./detector-context.ts";
+/** Record operations that D4 treats as single-row lookups. */
+const LOOKUP_OPS: ReadonlySet<string> = new Set(["Get", "FindFirst", "FindLast"]);
+/**
+ * D4: detect `Get` / `FindFirst` / `FindLast` called 2+ times inside the same loop
+ * with the same literal key argument on the same record variable.
+ *
+ * v1 only matches string-literal arguments (`'...'` or `"..."`), which is the
+ * conservative correct case — the key is known at compile time, so it can trivially
+ * be hoisted outside the loop. Future versions can extend this to dataflow over
+ * key expressions.
+ *
+ * Finding ids are `d4/<routine>/<loop>/<variable>`. When the same variable has
+ * repeated lookups for more than one distinct literal key inside the same loop,
+ * each of those findings additionally carries a `/<key>` suffix so that `id` and
+ * `rootCauseKey` stay unique; ids of non-colliding findings are unaffected.
+ *
+ * @param model - Semantic model; only routines whose role is `"primary"`, whose
+ *   body is available and whose parse is complete are scanned.
+ * @param _graph - Unused by this detector.
+ * @param _ctx - Unused by this detector.
+ * @returns The findings sorted by id, plus per-detector statistics. A routine that
+ *   was scanned but produced no finding is counted under `skipped.other`.
+ */
+export function detectD4(
+	model: SemanticModel,
+	_graph: CombinedGraph,
+	_ctx: DetectorContext,
+): { findings: Finding[]; stats: DetectorStats } {
+	const findings: Finding[] = [];
+	let candidatesConsidered = 0;
+	let skippedOther = 0;
+	for (const routine of model.routines) {
+		if (roleOf(routine) !== "primary") continue;
+		if (!routine.bodyAvailable) continue;
+		if (routine.parseIncomplete) continue;
+		candidatesConsidered++;
+		// Loop-invariant work, done once per routine: keep only lookup ops whose first
+		// argument is a string-like literal (`'VALUE'` / `"VALUE"`). The structured
+		// classifier distinguishes literals from identifiers / expressions without any
+		// text shredding. The dedup key uses the unquoted `.value` so `'X'` and `"X"`
+		// (same content, different quoting) group together.
+		const literalLookups: { op: RecordOperation; key: string }[] = [];
+		for (const op of routine.features.recordOperations) {
+			if (!LOOKUP_OPS.has(op.op)) continue;
+			const keyInfo = op.fieldArgumentInfos?.[0];
+			if (keyInfo === undefined) continue;
+			if (!isStringLikeLiteral(keyInfo)) continue;
+			literalLookups.push({ op, key: keyInfo.value ?? keyInfo.text });
+		}
+		let emittedForRoutine = 0;
+		for (const loop of routine.features.loops) {
+			// Literal-key lookups that sit inside this loop (at any nesting depth).
+			const candidates = literalLookups.filter(({ op }) => op.loopStack.includes(loop.id));
+			if (candidates.length < 2) continue;
+			// Group by (recordVariableName.toLowerCase, literal key) — duplicates per group → finding.
+			const groups = new Map<string, { variableLc: string; key: string; ops: RecordOperation[] }>();
+			for (const { op, key } of candidates) {
+				const variableLc = op.recordVariableName.toLowerCase();
+				const groupKey = `${variableLc}|${key}`;
+				const group = groups.get(groupKey);
+				if (group) group.ops.push(op);
+				else groups.set(groupKey, { variableLc, key, ops: [op] });
+			}
+			const repeated = [...groups.values()].filter((group) => group.ops.length >= 2);
+			// How many repeated groups share a variable: more than one means the
+			// variable-only id would collide and needs the key as a disambiguator.
+			const repeatedPerVariable = new Map<string, number>();
+			for (const { variableLc } of repeated) {
+				repeatedPerVariable.set(variableLc, (repeatedPerVariable.get(variableLc) ?? 0) + 1);
+			}
+			for (const { variableLc, key, ops } of repeated) {
+				const first = ops[0];
+				if (!first) continue;
+				const path: EvidenceStep[] = [
+					{
+						routineId: routine.id,
+						loopId: loop.id,
+						sourceAnchor: loop.sourceAnchor,
+						note: `${loop.type} loop`,
+					},
+					...ops.map(
+						(o): EvidenceStep => ({
+							routineId: routine.id,
+							operationId: o.id,
+							sourceAnchor: o.sourceAnchor,
+							note: `${o.op} on ${o.recordVariableName} with literal key`,
+						}),
+					),
+				];
+				const baseId = `d4/${routine.id}/${loop.id}/${variableLc}`;
+				const findingId =
+					(repeatedPerVariable.get(variableLc) ?? 0) > 1 ? `${baseId}/${key}` : baseId;
+				const finding: Finding = {
+					id: findingId,
+					rootCauseKey: findingId,
+					detector: "d4-repeated-lookup-in-loop",
+					title: "Repeated identical lookup inside a loop",
+					rootCause: `${routine.name} calls ${first.op} on ${first.recordVariableName} ${ops.length} times inside a loop with the same literal key — cache the result once before the loop.`,
+					severity: "medium",
+					confidence: toConfidence([], "likely"),
+					primaryLocation: first.sourceAnchor,
+					evidencePath: path,
+					affectedObjects: [routine.objectId],
+					affectedTables: first.tableId !== undefined ? [first.tableId] : [],
+					fixOptions: [
+						{
+							description:
+								"Move the lookup out of the loop into a local variable, then read fields from that variable inside the loop.",
+							safety: "high",
+						},
+					],
+					provenance: [{ source: "tree-sitter" }],
+				};
+				finding.fingerprint = fingerprintOf(finding, model);
+				findings.push(finding);
+				emittedForRoutine++;
+			}
+		}
+		if (emittedForRoutine === 0) skippedOther++;
+	}
+	const sorted = findings.sort((a, b) => compareStrings(a.id, b.id));
+	return {
+		findings: sorted,
+		stats: {
+			detector: "d4-repeated-lookup-in-loop",
+			candidatesConsidered,
+			findingsEmitted: sorted.length,
+			// Omit the counter entirely when zero instead of emitting an explicit
+			// `undefined` property.
+			skipped: {
+				...(skippedOther > 0 ? { other: skippedOther } : {}),
+			},
+		},
+	};
+}

package/src/detectors/d40-transitive-load-missing.ts ADDED Viewed

@@ -0,0 +1,217 @@
+import type { CombinedGraph } from "../engine/combined-graph.ts";
+import { recordFlowRoleOf } from "../engine/op-classification.ts";
+import { beforeAnchor } from "../engine/source-anchor.ts";
+import { compareStrings } from "../engine/uncertainty-util.ts";
+import { type RecordOpType, type RecordOperation, roleOf } from "../model/entities.ts";
+import type { DetectorStats, EvidenceStep, Finding } from "../model/finding.ts";
+import type { SemanticModel } from "../model/model.ts";
+import { fingerprintOf } from "../projection/finding-fingerprint.ts";
+import { toConfidence } from "./confidence.ts";
+import type { DetectorContext } from "./detector-context.ts";
+/**
+ * D40 — transitive load missing.
+ *
+ * For each resolved call edge where the callee requires its parameter to be
+ * loaded at entry (callee.parameterRoles[Q].requiresLoadedAtEntry === "yes"),
+ * verify the caller has loaded the forwarded record before the callsite.
+ * Otherwise emit a finding at the caller's callsite.
+ *
+ * Severity: `medium`, escalates to `high` when the callee mutates the unloaded
+ * record (callee.parameterRoles[Q].mutatesBeforeLoad === "yes" — strictly worse than a read).
+ *
+ * Predicate:
+ *  - resolved callsite + binding;
+ *  - source is NOT an implicit-rec (`Rec`/`xRec` in triggers/event subscribers are
+ *    loaded by the AL runtime before the trigger fires — flagging them is a
+ *    structural false positive);
+ *  - source-tempState is not `known/true` (temporary records have no DB load concept);
+ *  - callee.parameterRoles[Q].requiresLoadedAtEntry === "yes";
+ *  - caller has not loaded the forwarded record on the path to the callsite
+ *    (intra-routine source-ordered check using `isLoadingOp` — see below).
+ *
+ * Skipped (counters):
+ *  - `unresolved`     — binding.bindingResolution !== "resolved", or no resolved edge.
+ *  - `implicitRec`    — binding.sourceKind === "implicit-rec".
+ *  - `tempRecord`     — binding.sourceTempState is known-true.
+ *  - `calleeUnknown`  — callee summary missing or no role for the parameter.
+ *  - `callerLoaded`   — caller has a prior loading op for the same source record.
+ *
+ * NOTE — opt-in pending Phase 6. D40 is intentionally NOT in the default detector
+ * registry while the Phase 4 walker remains straight-line-only. The walker bails to
+ * `requiresLoadedAtEntry = "unknown"` on any branching control flow, and D40's
+ * intra-caller load check doesn't see records loaded inside loops (FindSet/repeat/
+ * Next pattern). On Continia DC/Cloud the default-on shape produced ~1186 medium
+ * findings dominated by the loop-loaded false-positive class. Phase 6's full
+ * statement-tree walker closes that class; D40 returns to the default registry then.
+ * Until then it is usable via `--detector d40-transitive-load-missing`.
+ */
+/**
+ * Decides whether a record operation counts as a "load" of its record variable,
+ * i.e. whether the variable is in a well-defined loaded/initialised state once the
+ * operation has run.
+ *
+ * The decision is delegated to `recordFlowRoleOf`: the roles `loadsFromDb`,
+ * `initialises` and `copiesInto` count as loading, every other role does not.
+ * Relying on that classifier (rather than a hand-maintained LOAD_OPS set) keeps a
+ * single source of truth, so new RecordOpType members only need to be classified
+ * in one place.
+ *
+ * @param op - The record operation type to classify.
+ * @returns `true` when the operation's flow role is one of the loading roles.
+ */
+function isLoadingOp(op: RecordOpType): boolean {
+	switch (recordFlowRoleOf(op)) {
+		case "loadsFromDb":
+		case "initialises":
+		case "copiesInto":
+			return true;
+		default:
+			return false;
+	}
+}
+/**
+ * D40 — transitive load missing: reports callsites that forward a record to a
+ * callee whose parameter role says `requiresLoadedAtEntry === "yes"` when the
+ * caller has no loading op on that record earlier in source order.
+ *
+ * Record variable names are compared case-insensitively: the per-routine load
+ * buckets are keyed by the lowercased variable name and the binding's source
+ * variable name is lowercased before the lookup.
+ *
+ * @param model - Semantic model; only routines whose role is `"primary"`, whose
+ *   body is available and whose parse is complete are scanned.
+ * @param _graph - Unused by this detector.
+ * @param ctx - Supplies `routineById` and the `resolvedCallEdgeByCallsite` index.
+ * @returns The findings sorted by id, plus per-detector statistics with the skip
+ *   counters `unresolved`, `implicitRec`, `tempRecord`, `callerLoaded` and
+ *   `calleeUnknown` (each omitted when zero).
+ */
+export function detectD40(
+	model: SemanticModel,
+	_graph: CombinedGraph,
+	ctx: DetectorContext,
+): { findings: Finding[]; stats: DetectorStats } {
+	const findings: Finding[] = [];
+	const { routineById, resolvedCallEdgeByCallsite } = ctx;
+	let candidatesConsidered = 0;
+	let skippedUnresolved = 0;
+	let skippedImplicitRec = 0;
+	let skippedTempRecord = 0;
+	let skippedCallerLoaded = 0;
+	let skippedCalleeUnknown = 0;
+	for (const routine of model.routines) {
+		if (roleOf(routine) !== "primary") continue;
+		if (!routine.bodyAvailable) continue;
+		if (routine.parseIncomplete) continue;
+		// I2: precompute load-op buckets per source variable once per routine.
+		// Key = lowercase recordVariableName. Each bucket also retains the op's
+		// recordVariableId (when present) so we can prefer id-matching at the binding
+		// site (I4).
+		const loadsBySourceLc = new Map<string, RecordOperation[]>();
+		for (const op of routine.features.recordOperations) {
+			if (!isLoadingOp(op.op)) continue;
+			const key = op.recordVariableName.toLowerCase();
+			let bucket = loadsBySourceLc.get(key);
+			if (bucket === undefined) {
+				bucket = [];
+				loadsBySourceLc.set(key, bucket);
+			}
+			bucket.push(op);
+		}
+		for (const cs of routine.features.callSites) {
+			// I1: O(1) edge lookup via the new DetectorContext index.
+			const edge = resolvedCallEdgeByCallsite.get(cs.id);
+			if (edge?.to === undefined) {
+				skippedUnresolved++;
+				continue;
+			}
+			const callee = routineById.get(edge.to);
+			if (callee === undefined) continue;
+			for (const binding of cs.argumentBindings) {
+				// C2(a): implicit-rec narrowing — checked BEFORE bindingResolution so that
+				// triggers passing `Rec` (where the indexer classifies the arg as
+				// `non-record-arg` because there is no local recVar named `Rec` even though
+				// `sourceKind` is correctly `"implicit-rec"`) are still recognised and skipped.
+				// `Rec` / `xRec` inside a trigger or event subscriber are loaded by the AL
+				// runtime before the trigger fires — there is no caller in source code that
+				// could "Get them". Flagging is a structural false positive (~87 cases on
+				// DC/Cloud at the pre-narrowing default — ~7% of total).
+				if (binding.sourceKind === "implicit-rec") {
+					skippedImplicitRec++;
+					continue;
+				}
+				if (binding.bindingResolution !== "resolved") {
+					skippedUnresolved++;
+					continue;
+				}
+				if (binding.sourceTempState?.kind === "known" && binding.sourceTempState.value === true) {
+					skippedTempRecord++;
+					continue;
+				}
+				const calleeRole = callee.summary?.parameterRoles.find(
+					(r) => r.parameterIndex === binding.parameterIndex,
+				);
+				if (calleeRole === undefined) {
+					skippedCalleeUnknown++;
+					continue;
+				}
+				if (calleeRole.requiresLoadedAtEntry !== "yes") continue;
+				candidatesConsidered++;
+				// `sourceName` keeps the spelling used in messages; the bucket map is keyed
+				// by the lowercased name, so the lookup key must be lowercased as well or a
+				// mixed-case variable would never find its loading ops.
+				const sourceName = binding.sourceVariableName;
+				if (sourceName === undefined) continue;
+				const sourceNameLc = sourceName.toLowerCase();
+				const bucket = loadsBySourceLc.get(sourceNameLc) ?? [];
+				// I4: prefer id-match when both sides have an id; fall back to the
+				// name-keyed bucket (AL forbids shadowing within a single procedure, so
+				// names disambiguate uniquely in practice).
+				const sourceId = binding.sourceRecordVariableId;
+				const loadedBefore = bucket.some((op) => {
+					if (!beforeAnchor(op.sourceAnchor, cs.sourceAnchor)) return false;
+					if (sourceId !== undefined && op.recordVariableId !== undefined) {
+						return op.recordVariableId === sourceId;
+					}
+					return true; // name-match already established by bucket lookup
+				});
+				if (loadedBefore) {
+					skippedCallerLoaded++;
+					continue;
+				}
+				// A callee that mutates the unloaded record is strictly worse than one
+				// that only reads it, so it escalates severity and changes the wording.
+				const mutates = calleeRole.mutatesBeforeLoad === "yes";
+				const severity: Finding["severity"] = mutates ? "high" : "medium";
+				const accessVerb = mutates ? "mutates" : "reads";
+				const findingId = `d40/${routine.id}/${cs.id}/${binding.parameterIndex}`;
+				const path: EvidenceStep[] = [
+					{
+						routineId: routine.id,
+						callsiteId: cs.id,
+						sourceAnchor: binding.argumentAnchor,
+						note: `forwards ${sourceName} to ${callee.name} (param[${binding.parameterIndex}])`,
+					},
+					{
+						routineId: callee.id,
+						sourceAnchor: callee.sourceAnchor,
+						note: `${callee.name} ${accessVerb} this record before loading it`,
+					},
+				];
+				const finding: Finding = {
+					id: findingId,
+					rootCauseKey: findingId,
+					detector: "d40-transitive-load-missing",
+					title: `Forwarded record not loaded before ${mutates ? "mutating" : "reading"} helper`,
+					rootCause: `${routine.name} forwards ${sourceName} to ${callee.name}, which ${accessVerb} the record without loading it — the caller must Get/Find the record before the call.`,
+					severity,
+					confidence: toConfidence([], "likely"),
+					primaryLocation: binding.argumentAnchor,
+					evidencePath: path,
+					affectedObjects: [routine.objectId, callee.objectId].sort(),
+					affectedTables: [],
+					fixOptions: [
+						{
+							description: `Load ${sourceName} with Get / FindFirst before forwarding to ${callee.name}, or have ${callee.name} load its parameter internally.`,
+							safety: "high",
+						},
+					],
+					provenance: [{ source: "tree-sitter" }],
+				};
+				finding.fingerprint = fingerprintOf(finding, model);
+				findings.push(finding);
+			}
+		}
+	}
+	const sorted = findings.sort((a, b) => compareStrings(a.id, b.id));
+	return {
+		findings: sorted,
+		stats: {
+			detector: "d40-transitive-load-missing",
+			candidatesConsidered,
+			findingsEmitted: sorted.length,
+			skipped: {
+				...(skippedUnresolved > 0 ? { unresolved: skippedUnresolved } : {}),
+				...(skippedImplicitRec > 0 ? { implicitRec: skippedImplicitRec } : {}),
+				...(skippedTempRecord > 0 ? { tempRecord: skippedTempRecord } : {}),
+				...(skippedCallerLoaded > 0 ? { callerLoaded: skippedCallerLoaded } : {}),
+				...(skippedCalleeUnknown > 0 ? { calleeUnknown: skippedCalleeUnknown } : {}),
+			},
+		},
+	};
+}

package/src/detectors/d41-transitive-filter-loss.ts ADDED Viewed

@@ -0,0 +1,200 @@
+import type { CombinedGraph } from "../engine/combined-graph.ts";
+import { beforeAnchor } from "../engine/source-anchor.ts";
+import { compareStrings } from "../engine/uncertainty-util.ts";
+import { roleOf } from "../model/entities.ts";
+import type { DetectorStats, EvidenceStep, Finding } from "../model/finding.ts";
+import type { SemanticModel } from "../model/model.ts";
+import { fingerprintOf } from "../projection/finding-fingerprint.ts";
+import { toConfidence } from "./confidence.ts";
+import type { DetectorContext } from "./detector-context.ts";
+/** Record operations that establish a filter on a record variable. */
+const FILTER_SET_OPS: ReadonlySet<string> = new Set(["SetRange", "SetFilter"]);
+/** Record operations whose result depends on the filters currently applied. */
+const FILTER_SENSITIVE_OPS: ReadonlySet<string> = new Set([
+	"FindFirst",
+	"FindLast",
+	"FindSet",
+	"Find",
+	"Next",
+	"CalcSums",
+	"DeleteAll",
+	"ModifyAll",
+	"Count",
+	"IsEmpty",
+]);
+/**
+ * D41 — transitive filter loss.
+ *
+ * Predicate (all four must hold):
+ *  1. Caller called SetRange / SetFilter on R before a callsite that forwards R
+ *     by-var to a callee;
+ *  2. Callee's parameterRoles[Q].resetsFiltersOnParam === "yes" (the helper calls
+ *     Reset on the forwarded record);
+ *  3. Caller subsequently performs a filter-sensitive op on R (FindFirst, FindLast,
+ *     FindSet, Find, Next, CalcSums, DeleteAll, ModifyAll, Count, IsEmpty) AFTER
+ *     the callsite;
+ *  4. Caller did NOT re-filter R between the callsite and the sensitive op.
+ *
+ * Without clause (3)+(4) the pattern is unobservable or intentional (the helper
+ * was called for the explicit purpose of resetting filters). This requirement is
+ * what makes D41 actionable rather than noisy.
+ *
+ * Severity: high (silent wrong-set-size). Confidence: likely.
+ * Anchor: caller's argumentAnchor (the argument forwarding the record).
+ *
+ * Skip counters:
+ *  - `noPriorFilter`  — caller did not filter R before the callsite
+ *  - `noPostUse`      — no filter-sensitive op on R after the callsite
+ *  - `reFiltered`     — caller re-filters R between the callsite and the sensitive op
+ *
+ * Control-flow-blindness carry-forward: the prior-filter check and the re-filter
+ * check are both source-order linear (same as D39's persist check). A SetRange/
+ * SetFilter that lives in a mutually-exclusive branch from the callsite can create
+ * false positives; a re-filter in a mutually-exclusive branch can create false
+ * negatives. These are the same FN/FP classes D39 documents and defers to a future
+ * walker-aware pass.
+ *
+ * Record variable names are matched case-insensitively: both the operation's
+ * variable name and the binding's source variable name are lowercased before they
+ * are compared. Messages keep the binding's original spelling.
+ *
+ * @param model - Semantic model; only routines whose role is `"primary"`, whose
+ *   body is available and whose parse is complete are scanned.
+ * @param _graph - Unused by this detector.
+ * @param ctx - Supplies `routineById` and the `resolvedCallEdgeByCallsite` index.
+ * @returns The findings sorted by id, plus per-detector statistics.
+ */
+export function detectD41(
+	model: SemanticModel,
+	_graph: CombinedGraph,
+	ctx: DetectorContext,
+): { findings: Finding[]; stats: DetectorStats } {
+	const findings: Finding[] = [];
+	const { routineById } = ctx;
+	let candidatesConsidered = 0;
+	let skippedNoPriorFilter = 0;
+	let skippedNoPostUse = 0;
+	let skippedReFiltered = 0;
+	for (const routine of model.routines) {
+		if (roleOf(routine) !== "primary") continue;
+		if (!routine.bodyAvailable) continue;
+		if (routine.parseIncomplete) continue;
+		for (const cs of routine.features.callSites) {
+			// O(1) resolved-edge lookup via the DetectorContext index (added in Phase 4 / I1).
+			const edge = ctx.resolvedCallEdgeByCallsite.get(cs.id);
+			if (edge?.to === undefined) continue;
+			const callee = routineById.get(edge.to);
+			if (callee === undefined) continue;
+			for (const binding of cs.argumentBindings) {
+				if (binding.bindingResolution !== "resolved") continue;
+				if (!binding.calleeParameterIsVar) continue;
+				const calleeRole = callee.summary?.parameterRoles.find(
+					(r) => r.parameterIndex === binding.parameterIndex,
+				);
+				if (calleeRole?.resetsFiltersOnParam !== "yes") continue;
+				// `sourceName` keeps the spelling used in messages; `sourceNameLc` is the
+				// comparison key. The op side is lowercased below, so this side must be
+				// lowercased too or a mixed-case variable would never match its own ops.
+				const sourceName = binding.sourceVariableName;
+				if (sourceName === undefined) continue;
+				const sourceNameLc = sourceName.toLowerCase();
+				// Count every binding that targets a reset-helper callee — the meaningful
+				// candidate set at the structural gate. Matches D39's convention so
+				// cross-detector stats comparisons are meaningful.
+				candidatesConsidered++;
+				// Precompute all ops on this variable once for the three predicate checks.
+				const opsOnVar = routine.features.recordOperations.filter(
+					(op) => op.recordVariableName.toLowerCase() === sourceNameLc,
+				);
+				// (1) Caller filtered before the call? Only the first match is needed, both
+				// for the gate and as evidence.
+				const firstPriorFilter = opsOnVar.find(
+					(op) => FILTER_SET_OPS.has(op.op) && beforeAnchor(op.sourceAnchor, cs.sourceAnchor),
+				);
+				if (firstPriorFilter === undefined) {
+					skippedNoPriorFilter++;
+					continue;
+				}
+				// (3) Any filter-sensitive op AFTER the callsite? Takes the first match in
+				// `recordOperations` order.
+				// NOTE(review): this presumes `recordOperations` is in source order — confirm.
+				const firstSensitive = opsOnVar.find(
+					(op) => FILTER_SENSITIVE_OPS.has(op.op) && beforeAnchor(cs.sourceAnchor, op.sourceAnchor),
+				);
+				if (firstSensitive === undefined) {
+					skippedNoPostUse++;
+					continue;
+				}
+				// (4) Re-filter between callsite and the sensitive op?
+				const reFiltered = opsOnVar.some(
+					(op) =>
+						FILTER_SET_OPS.has(op.op) &&
+						beforeAnchor(cs.sourceAnchor, op.sourceAnchor) &&
+						beforeAnchor(op.sourceAnchor, firstSensitive.sourceAnchor),
+				);
+				if (reFiltered) {
+					skippedReFiltered++;
+					continue;
+				}
+				const findingId = `d41/${routine.id}/${cs.id}/${binding.parameterIndex}`;
+				const path: EvidenceStep[] = [
+					{
+						routineId: routine.id,
+						operationId: firstPriorFilter.id,
+						sourceAnchor: firstPriorFilter.sourceAnchor,
+						note: `${firstPriorFilter.op} on ${sourceName}`,
+					},
+					{
+						routineId: routine.id,
+						callsiteId: cs.id,
+						sourceAnchor: binding.argumentAnchor,
+						note: `forwards ${sourceName} to ${callee.name}, which calls Reset`,
+					},
+					{
+						routineId: routine.id,
+						operationId: firstSensitive.id,
+						sourceAnchor: firstSensitive.sourceAnchor,
+						note: `${firstSensitive.op} on ${sourceName} — operates on the now-unfiltered set`,
+					},
+				];
+				const finding: Finding = {
+					id: findingId,
+					rootCauseKey: findingId,
+					detector: "d41-transitive-filter-loss",
+					title: "Filter silently lost across helper call",
+					rootCause: `${routine.name} filters ${sourceName} before calling ${callee.name}, which calls Reset; the subsequent ${firstSensitive.op} operates on the unfiltered set.`,
+					severity: "high",
+					confidence: toConfidence([], "likely"),
+					primaryLocation: binding.argumentAnchor,
+					evidencePath: path,
+					affectedObjects: [routine.objectId, callee.objectId].sort(),
+					affectedTables: [],
+					fixOptions: [
+						{
+							description: `Re-apply the SetRange/SetFilter on ${sourceName} after the call to ${callee.name}, or restructure to avoid the call inside the filtered scope.`,
+							safety: "high",
+						},
+					],
+					provenance: [{ source: "tree-sitter" }],
+				};
+				finding.fingerprint = fingerprintOf(finding, model);
+				findings.push(finding);
+			}
+		}
+	}
+	const sorted = findings.sort((a, b) => compareStrings(a.id, b.id));
+	return {
+		findings: sorted,
+		stats: {
+			detector: "d41-transitive-filter-loss",
+			candidatesConsidered,
+			findingsEmitted: sorted.length,
+			skipped: {
+				...(skippedNoPriorFilter > 0 ? { noPriorFilter: skippedNoPriorFilter } : {}),
+				...(skippedNoPostUse > 0 ? { noPostUse: skippedNoPostUse } : {}),
+				...(skippedReFiltered > 0 ? { reFiltered: skippedReFiltered } : {}),
+			},
+		},
+	};
+}