npm - @thotischner/observability-mcp - Versions diffs - 1.8.1 → 3.0.1 - Mend

@thotischner/observability-mcp 1.8.1 → 3.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (204) hide show

package/dist/analysis/history.d.ts +70 -0
package/dist/analysis/history.js +170 -0
package/dist/analysis/history.test.d.ts +1 -0
package/dist/analysis/history.test.js +141 -0
package/dist/audit/log.d.ts +9 -0
package/dist/audit/log.js +20 -0
package/dist/audit/redaction-bypass.d.ts +67 -0
package/dist/audit/redaction-bypass.js +64 -0
package/dist/audit/redaction-bypass.test.d.ts +1 -0
package/dist/audit/redaction-bypass.test.js +72 -0
package/dist/audit/sinks/s3.d.ts +61 -0
package/dist/audit/sinks/s3.js +179 -0
package/dist/audit/sinks/s3.test.d.ts +1 -0
package/dist/audit/sinks/s3.test.js +175 -0
package/dist/audit/sinks/types.d.ts +18 -0
package/dist/audit/sinks/types.js +1 -0
package/dist/audit/sinks/webhook.d.ts +45 -0
package/dist/audit/sinks/webhook.js +111 -0
package/dist/audit/sinks/webhook.test.d.ts +1 -0
package/dist/audit/sinks/webhook.test.js +162 -0
package/dist/auth/credentials.d.ts +11 -0
package/dist/auth/credentials.js +27 -0
package/dist/auth/credentials.test.js +21 -1
package/dist/auth/csrf.d.ts +26 -0
package/dist/auth/csrf.js +128 -0
package/dist/auth/csrf.test.d.ts +1 -0
package/dist/auth/csrf.test.js +143 -0
package/dist/auth/local-users.d.ts +6 -0
package/dist/auth/local-users.js +11 -0
package/dist/auth/local-users.test.js +41 -0
package/dist/auth/middleware.d.ts +7 -6
package/dist/auth/oidc/dcr.d.ts +70 -0
package/dist/auth/oidc/dcr.js +160 -0
package/dist/auth/oidc/dcr.test.d.ts +1 -0
package/dist/auth/oidc/dcr.test.js +109 -0
package/dist/auth/oidc/endpoints.js +44 -0
package/dist/auth/oidc/profiles.d.ts +22 -0
package/dist/auth/oidc/profiles.js +95 -0
package/dist/auth/oidc/profiles.test.d.ts +1 -0
package/dist/auth/oidc/profiles.test.js +51 -0
package/dist/auth/oidc/runtime.d.ts +3 -0
package/dist/auth/oidc/runtime.js +16 -3
package/dist/auth/oidc/runtime.test.js +1 -0
package/dist/auth/policy/batch-dry-run.d.ts +56 -0
package/dist/auth/policy/batch-dry-run.js +144 -0
package/dist/auth/policy/batch-dry-run.test.d.ts +1 -0
package/dist/auth/policy/batch-dry-run.test.js +140 -0
package/dist/auth/policy/engine.d.ts +20 -4
package/dist/auth/policy/engine.js +16 -2
package/dist/auth/policy/loader.d.ts +11 -1
package/dist/auth/policy/loader.js +37 -0
package/dist/auth/policy/loader.test.d.ts +1 -0
package/dist/auth/policy/loader.test.js +86 -0
package/dist/auth/policy/opa.d.ts +5 -5
package/dist/auth/policy/opa.js +25 -14
package/dist/auth/policy/opa.test.js +48 -0
package/dist/auth/rbac.d.ts +23 -1
package/dist/auth/rbac.js +43 -1
package/dist/auth/rbac.test.js +62 -0
package/dist/cli/index.js +3 -0
package/dist/cli/inspector-config.d.ts +9 -0
package/dist/cli/inspector-config.js +28 -0
package/dist/cli/inspector-config.test.d.ts +1 -0
package/dist/cli/inspector-config.test.js +33 -0
package/dist/cli/lib.d.ts +1 -1
package/dist/cli/lib.js +1 -0
package/dist/conformance/mcp-2025-11-25.test.d.ts +1 -0
package/dist/conformance/mcp-2025-11-25.test.js +206 -0
package/dist/connectors/interface.d.ts +5 -1
package/dist/connectors/loader.d.ts +8 -0
package/dist/connectors/loader.js +55 -4
package/dist/connectors/loader.test.d.ts +1 -0
package/dist/connectors/loader.test.js +78 -0
package/dist/connectors/manifest-hooks.test.d.ts +1 -0
package/dist/connectors/manifest-hooks.test.js +206 -0
package/dist/connectors/prometheus.test.js +31 -13
package/dist/connectors/registry.d.ts +13 -0
package/dist/connectors/registry.js +30 -0
package/dist/connectors/registry.test.js +56 -2
package/dist/context.d.ts +32 -0
package/dist/context.js +35 -0
package/dist/context.test.d.ts +1 -0
package/dist/context.test.js +58 -0
package/dist/federation/registry.d.ts +54 -0
package/dist/federation/registry.js +122 -0
package/dist/federation/registry.test.d.ts +1 -0
package/dist/federation/registry.test.js +206 -0
package/dist/federation/upstream.d.ts +86 -0
package/dist/federation/upstream.js +162 -0
package/dist/federation/upstream.test.d.ts +1 -0
package/dist/federation/upstream.test.js +118 -0
package/dist/index.js +1435 -126
package/dist/metrics/self.d.ts +1 -0
package/dist/metrics/self.js +8 -0
package/dist/middleware/ssrfGuard.d.ts +15 -0
package/dist/middleware/ssrfGuard.js +103 -0
package/dist/middleware/ssrfGuard.test.d.ts +1 -0
package/dist/middleware/ssrfGuard.test.js +81 -0
package/dist/observability/otel.d.ts +20 -0
package/dist/observability/otel.js +118 -0
package/dist/observability/otel.test.d.ts +1 -0
package/dist/observability/otel.test.js +56 -0
package/dist/openapi.js +215 -7
package/dist/openapi.test.js +34 -0
package/dist/policy/redact.js +1 -1
package/dist/postmortem/store.d.ts +34 -0
package/dist/postmortem/store.js +113 -0
package/dist/postmortem/store.test.d.ts +1 -0
package/dist/postmortem/store.test.js +118 -0
package/dist/postmortem/synthesizer.d.ts +83 -0
package/dist/postmortem/synthesizer.js +205 -0
package/dist/postmortem/synthesizer.test.d.ts +1 -0
package/dist/postmortem/synthesizer.test.js +141 -0
package/dist/products/loader.d.ts +31 -3
package/dist/products/loader.js +77 -4
package/dist/products/loader.test.js +90 -1
package/dist/quota/charge.d.ts +28 -0
package/dist/quota/charge.js +30 -0
package/dist/quota/charge.test.d.ts +1 -0
package/dist/quota/charge.test.js +83 -0
package/dist/quota/limiter.d.ts +29 -4
package/dist/quota/limiter.js +64 -8
package/dist/quota/limiter.test.js +86 -0
package/dist/scim/compliance.test.d.ts +1 -0
package/dist/scim/compliance.test.js +169 -0
package/dist/scim/factory.test.d.ts +1 -0
package/dist/scim/factory.test.js +54 -0
package/dist/scim/group-role-map.d.ts +4 -0
package/dist/scim/group-role-map.js +33 -0
package/dist/scim/group-role-map.test.d.ts +1 -0
package/dist/scim/group-role-map.test.js +33 -0
package/dist/scim/patch-ops.test.d.ts +1 -0
package/dist/scim/patch-ops.test.js +100 -0
package/dist/scim/redis-store.d.ts +38 -0
package/dist/scim/redis-store.js +178 -0
package/dist/scim/redis-store.test.d.ts +1 -0
package/dist/scim/redis-store.test.js +138 -0
package/dist/scim/routes.d.ts +40 -0
package/dist/scim/routes.js +395 -0
package/dist/scim/store.d.ts +76 -0
package/dist/scim/store.js +196 -0
package/dist/scim/store.test.d.ts +1 -0
package/dist/scim/store.test.js +121 -0
package/dist/scim/types.d.ts +73 -0
package/dist/scim/types.js +29 -0
package/dist/sdk/hook-wrappers.d.ts +39 -0
package/dist/sdk/hook-wrappers.js +113 -0
package/dist/sdk/hook-wrappers.test.d.ts +1 -0
package/dist/sdk/hook-wrappers.test.js +204 -0
package/dist/sdk/hooks.d.ts +77 -0
package/dist/sdk/hooks.js +72 -0
package/dist/sdk/hooks.test.d.ts +1 -0
package/dist/sdk/hooks.test.js +159 -0
package/dist/sdk/index.d.ts +15 -0
package/dist/sdk/index.js +1 -0
package/dist/sdk/manifest-schema.d.ts +17 -0
package/dist/sdk/manifest-schema.js +21 -0
package/dist/tools/context-seam.test.js +6 -1
package/dist/tools/detect-anomalies.d.ts +12 -1
package/dist/tools/detect-anomalies.js +26 -5
package/dist/tools/generate-postmortem.d.ts +35 -0
package/dist/tools/generate-postmortem.js +191 -0
package/dist/tools/get-anomaly-history.d.ts +35 -0
package/dist/tools/get-anomaly-history.js +126 -0
package/dist/tools/get-service-health.d.ts +1 -1
package/dist/tools/get-service-health.js +4 -3
package/dist/tools/list-services.d.ts +1 -1
package/dist/tools/list-services.js +3 -2
package/dist/tools/list-sources.d.ts +1 -1
package/dist/tools/list-sources.js +6 -2
package/dist/tools/query-logs.d.ts +1 -1
package/dist/tools/query-logs.js +2 -2
package/dist/tools/query-metrics.d.ts +1 -1
package/dist/tools/query-metrics.js +19 -6
package/dist/tools/query-traces.d.ts +47 -0
package/dist/tools/query-traces.js +145 -0
package/dist/tools/query-traces.test.d.ts +1 -0
package/dist/tools/query-traces.test.js +110 -0
package/dist/tools/registry-names.d.ts +35 -0
package/dist/tools/registry-names.js +54 -0
package/dist/tools/registry-names.test.d.ts +1 -0
package/dist/tools/registry-names.test.js +61 -0
package/dist/tools/topology.d.ts +3 -3
package/dist/tools/topology.js +33 -11
package/dist/tools/topology.test.js +45 -0
package/dist/topology/merge.d.ts +22 -0
package/dist/topology/merge.js +178 -0
package/dist/topology/merge.test.d.ts +1 -0
package/dist/topology/merge.test.js +110 -0
package/dist/transport/sessionStore.d.ts +66 -0
package/dist/transport/sessionStore.js +138 -0
package/dist/transport/sessionStore.test.d.ts +1 -0
package/dist/transport/sessionStore.test.js +118 -0
package/dist/transport/transportSessionMap.d.ts +70 -0
package/dist/transport/transportSessionMap.js +128 -0
package/dist/transport/transportSessionMap.test.d.ts +1 -0
package/dist/transport/transportSessionMap.test.js +111 -0
package/dist/transport/websocket.d.ts +35 -0
package/dist/transport/websocket.js +133 -0
package/dist/transport/websocket.test.d.ts +1 -0
package/dist/transport/websocket.test.js +124 -0
package/dist/types.d.ts +51 -0
package/dist/ui/index.html +2529 -145
package/package.json +13 -3

package/dist/postmortem/synthesizer.d.ts ADDED Viewed

@@ -0,0 +1,83 @@
+/** One anomaly observation fed into the post-mortem synthesizer. */
+export interface AnomalySample {
+    /** Timestamp of the sample; the synthesizer orders the timeline by this value. */
+    ts: string;
+    /** Service the sample belongs to; copied verbatim into the timeline rows. */
+    service: string;
+    /** Anomaly score; the synthesizer treats a peak of 0.9 or more as critical. */
+    score: number;
+    /** Detection method name (the package's tests use e.g. "mad", "seasonality"). */
+    method: string;
+    /** Severity label (the package's tests use e.g. "warn", "critical"). */
+    severity: string;
+    /** Optional signal label; signal aggregation falls back to `method` when absent. */
+    signal?: string;
+}
+/** A node of the blast-radius graph handed to the synthesizer. */
+export interface BlastRadiusNode {
+    /** Node identifier (presumably what edge `from`/`to` refer to — confirm against the topology tool). */
+    id: string;
+    /** Node kind, rendered verbatim in the report (the package's tests use e.g. "pod", "deployment"). */
+    kind: string;
+    /** Display name shown in the report's node table. */
+    name: string;
+    /** Whether this node is the suspected root cause (the input service). */
+    root?: boolean;
+}
+/** Summary of one trace, as listed in the report's "Related traces" table. */
+export interface TraceSummary {
+    /** Trace identifier, shown in the "trace" column. */
+    traceId: string;
+    /** Presumably the root span's name (tests use e.g. "GET /pay"); not rendered in the markdown table. */
+    rootName: string;
+    /** Service shown in the "service" column of the trace table. */
+    rootService: string;
+    /** Trace duration in milliseconds. */
+    durationMs: number;
+    /** True when the trace carried error spans; counted for the synopsis and follow-ups. */
+    hasError: boolean;
+}
+/** Everything `synthesizePostmortem` needs, supplied as already-fetched plain data. */
+export interface PostmortemInput {
+    /** Suspected root-cause service (the operator's first guess). */
+    service: string;
+    /** Rolling window the incident took place in, e.g. "2h", "6h". */
+    window: string;
+    /** Tenant the incident occurred in. */
+    tenant: string;
+    /** RFC-3339 start + end of the incident window for human display. */
+    fromIso: string;
+    toIso: string;
+    /** Live anomaly samples within the window. */
+    anomalies: AnomalySample[];
+    /** Blast-radius graph at peak. */
+    blastRadius: {
+        nodes: BlastRadiusNode[];
+        edges: Array<{
+            from: string;
+            to: string;
+            relation: string;
+        }>;
+    };
+    /** Trace summaries (top by duration). */
+    traces: TraceSummary[];
+    /** Optional log-error summary lines, e.g. ["payment-service: 412 5xx in window"].
+     *  When omitted, the report carries an empty `logHighlights` array. */
+    logHighlights?: string[];
+}
+/** Result of `synthesizePostmortem`: rendered markdown plus the same data in structured form. */
+export interface PostmortemReport {
+    /** Echoed from the input. */
+    service: string;
+    /** Echoed from the input. */
+    window: string;
+    /** Echoed from the input. */
+    fromIso: string;
+    /** Echoed from the input. */
+    toIso: string;
+    /** Compact synopsis the UI puts at the top of the report. */
+    synopsis: string;
+    /** Markdown body of the full report. */
+    markdown: string;
+    /** Structured form for callers that want to render their own UI. */
+    sections: {
+        /** Every anomaly sample ordered by `ts`; the markdown table shows only the first 20. */
+        timeline: Array<{
+            ts: string;
+            service: string;
+            score: number;
+            severity: string;
+            method: string;
+        }>;
+        /** The input's blast-radius nodes plus the number of input edges. */
+        blastRadius: {
+            nodes: BlastRadiusNode[];
+            edgeCount: number;
+        };
+        /** The first 10 entries of the input `traces`. */
+        topTraces: TraceSummary[];
+        /** Per-signal sample count and mean score (rounded to 2 decimals), highest mean first. */
+        contributingSignals: Array<{
+            signal: string;
+            count: number;
+            meanScore: number;
+        }>;
+        /** Suggested next steps; the synthesizer always emits at least one. */
+        followUps: string[];
+        /** The input's log highlights, or an empty array when none were supplied. */
+        logHighlights: string[];
+    };
+}
+/**
+ * Synthesise one report from already-fetched primitives. Pure
+ * compute — no I/O.
+ *
+ * @param input Incident context plus the pre-fetched anomalies,
+ *   blast-radius graph, traces and optional log highlights.
+ * @returns The synopsis, the markdown body and the structured sections.
+ */
+export declare function synthesizePostmortem(input: PostmortemInput): PostmortemReport;

package/dist/postmortem/synthesizer.js ADDED Viewed

@@ -0,0 +1,205 @@
+// Auto-post-mortem synthesizer — Phase F19.
+//
+// Stitches together the existing observability primitives — anomaly
+// history (F15), blast-radius (F13/topology), trace summaries (F13),
+// log-derived error patterns (existing query_logs) — into a single
+// markdown report a human (or LLM) can read in one shot.
+//
+// The synthesizer is pure: it takes the results of those upstream
+// queries as already-fetched plain data rather than querying anything
+// itself, so it never depends on the ConnectorRegistry API. Tests
+// pass fake data and don't need a live demo stack.
+/**
+ * Synthesise one report from already-fetched primitives. Pure
+ * compute — no I/O.
+ *
+ * @param input Incident context: service, window, tenant, ISO bounds,
+ *   anomaly samples, blast-radius graph, trace summaries and optional
+ *   log highlights.
+ * @returns The report: synopsis, rendered markdown, and the structured
+ *   `sections` (full timeline, blast radius, first 10 traces, ranked
+ *   signals, follow-ups, log highlights).
+ */
+export function synthesizePostmortem(input) {
+    // Order the timeline chronologically. Comparing the raw strings is
+    // only chronological when every sample uses the same offset and
+    // format, so compare parsed epochs instead. If any timestamp cannot
+    // be parsed, fall back to the plain string ordering for the whole
+    // list so the comparator stays consistent.
+    const stamped = input.anomalies.map((sample) => ({ sample, epochMs: Date.parse(sample.ts) }));
+    const allParseable = stamped.every((s) => Number.isFinite(s.epochMs));
+    stamped.sort((a, b) => allParseable
+        ? a.epochMs - b.epochMs
+        : a.sample.ts.localeCompare(b.sample.ts));
+    const timeline = stamped.map(({ sample }) => ({
+        ts: sample.ts,
+        service: sample.service,
+        score: sample.score,
+        severity: sample.severity,
+        method: sample.method,
+    }));
+    const contributingSignals = aggregateBySignal(input.anomalies);
+    // Headline numbers shared by the synopsis, follow-ups and markdown.
+    const peakScore = input.anomalies.reduce((m, a) => Math.max(m, a.score), 0);
+    const errorTraces = input.traces.filter((t) => t.hasError).length;
+    // Prefer the node flagged as root; otherwise fall back to the first
+    // node (undefined when the graph is empty).
+    const peakNode = input.blastRadius.nodes.find((n) => n.root) ?? input.blastRadius.nodes[0];
+    const blastSize = input.blastRadius.nodes.length;
+    const followUps = inferFollowUps(input, { peakScore, errorTraces, blastSize });
+    const synopsis = synopsisFor(input, peakScore, errorTraces, blastSize);
+    const markdown = renderMarkdown({
+        input,
+        timeline,
+        contributingSignals,
+        peakNode,
+        peakScore,
+        errorTraces,
+        blastSize,
+        followUps,
+        synopsis,
+    });
+    return {
+        service: input.service,
+        window: input.window,
+        fromIso: input.fromIso,
+        toIso: input.toIso,
+        synopsis,
+        markdown,
+        sections: {
+            timeline,
+            blastRadius: { nodes: input.blastRadius.nodes, edgeCount: input.blastRadius.edges.length },
+            topTraces: input.traces.slice(0, 10),
+            contributingSignals,
+            followUps,
+            logHighlights: input.logHighlights ?? [],
+        },
+    };
+}
+/**
+ * Group anomaly samples by signal label (falling back to the detection
+ * method when a sample has no label) and rank the groups.
+ *
+ * @param anomalies Anomaly samples to aggregate.
+ * @returns One `{ signal, count, meanScore }` entry per label, with the
+ *   mean rounded to two decimals, sorted by mean score descending.
+ */
+function aggregateBySignal(anomalies) {
+    // label -> running { total, count }; a Map keeps first-seen order.
+    const buckets = new Map();
+    anomalies.forEach((sample) => {
+        const label = sample.signal ?? sample.method;
+        const bucket = buckets.get(label);
+        if (bucket === undefined) {
+            buckets.set(label, { total: 0 + sample.score, count: 1 });
+            return;
+        }
+        bucket.total += sample.score;
+        bucket.count += 1;
+    });
+    const ranked = [];
+    for (const [signal, { total, count }] of buckets) {
+        const meanScore = Math.round((total / count) * 100) / 100;
+        ranked.push({ signal, count, meanScore });
+    }
+    ranked.sort((lhs, rhs) => rhs.meanScore - lhs.meanScore);
+    return ranked;
+}
+/**
+ * Derive the "Suggested follow-ups" list from the incident data.
+ *
+ * @param input The post-mortem input (service, anomalies, log highlights).
+ * @param ctx Pre-computed `{ peakScore, errorTraces, blastSize }`.
+ * @returns At least one suggestion. With no anomalies, only the
+ *   "check the history sink" hint is returned; when no other rule
+ *   fires, a single "looks stable" note is returned.
+ */
+function inferFollowUps(input, ctx) {
+    if (input.anomalies.length === 0) {
+        return [
+            "No anomaly history found for this service in the window — confirm OMCP_ANOMALY_HISTORY_REMOTE_WRITE is wired and Prometheus is scraping the same TSDB.",
+        ];
+    }
+    const highlights = input.logHighlights ?? [];
+    // [applies, render] pairs in output order; messages are rendered
+    // lazily so only the rules that fire are evaluated.
+    const rules = [
+        [
+            ctx.peakScore >= 0.9,
+            () => `Peak anomaly score ${ctx.peakScore} is critical — review the detector's threshold for service '${input.service}' and consider whether the chosen method (${dominantMethod(input.anomalies)}) suits this signal's distribution.`,
+        ],
+        [
+            ctx.errorTraces > 0,
+            () => `${ctx.errorTraces} trace(s) carried error spans during the window — drill into the slowest via \`query_traces(service="${input.service}", errorsOnly=true)\`.`,
+        ],
+        [
+            ctx.blastSize > 5,
+            () => `Blast radius spans ${ctx.blastSize} nodes — verify that the dependency edges are still accurate (a stale topology snapshot can blow up the radius and miss the real cause).`,
+        ],
+        [
+            highlights.length > 0,
+            () => "Log highlights above point at concrete error patterns — promote the recurring ones to an alert or SLO so the next regression catches itself.",
+        ],
+    ];
+    const suggestions = rules
+        .filter(([applies]) => applies)
+        .map(([, render]) => render());
+    if (suggestions.length > 0) {
+        return suggestions;
+    }
+    return [
+        "All signals look stable for this window — consider closing the incident as a transient anomaly or expanding the time window.",
+    ];
+}
+/**
+ * Return the detection method that occurs most often among the samples.
+ * Ties go to the method seen first; an empty list yields "unknown".
+ *
+ * @param anomalies Anomaly samples (only `method` is read).
+ * @returns The most frequent method name, or "unknown".
+ */
+function dominantMethod(anomalies) {
+    const tally = new Map();
+    anomalies.forEach((sample) => {
+        tally.set(sample.method, (tally.get(sample.method) ?? 0) + 1);
+    });
+    let winner;
+    let winnerCount = 0;
+    // Strict ">" keeps the earliest-seen method on ties.
+    for (const [method, count] of tally) {
+        if (count > winnerCount) {
+            winner = method;
+            winnerCount = count;
+        }
+    }
+    return winner ?? "unknown";
+}
+/**
+ * Build the short synopsis shown at the top of the report.
+ *
+ * @param input The post-mortem input (service, ISO bounds, anomalies).
+ * @param peakScore Highest anomaly score in the window.
+ * @param errorTraces Number of traces that carried error spans.
+ * @param blastSize Number of nodes in the blast radius.
+ * @returns A "no anomalies" notice for an empty window, otherwise two
+ *   sentences joined by a single space.
+ */
+function synopsisFor(input, peakScore, errorTraces, blastSize) {
+    const anomalyCount = input.anomalies.length;
+    if (anomalyCount !== 0) {
+        const headline = `Service '${input.service}' produced ${anomalyCount} anomaly sample(s) between ${input.fromIso} and ${input.toIso}, peaking at ${peakScore}.`;
+        const impact = `Blast radius at peak covered ${blastSize} node(s); ${errorTraces} trace(s) carried error spans.`;
+        return headline + " " + impact;
+    }
+    return `No anomalies recorded for service '${input.service}' between ${input.fromIso} and ${input.toIso}. Either the window was clean, or the history sink wasn't writing at the time.`;
+}
+/**
+ * Render the full post-mortem as one markdown document.
+ *
+ * Sections, in order: title + header quote, Synopsis, Anomaly timeline,
+ * Blast radius at peak, Contributing signals, Related traces, Log
+ * highlights (only when present), Suggested follow-ups, footer.
+ *
+ * Every table is capped so a pathological input cannot blow up the
+ * report. The timeline, node and signal tables add a trailing "N more"
+ * row when the cap cuts rows off, so truncation is never silent.
+ *
+ * @param ctx `{ input, timeline, contributingSignals, peakNode,
+ *   errorTraces, followUps, synopsis }` as assembled by
+ *   `synthesizePostmortem`; `peakNode` may be undefined for an empty graph.
+ * @returns The markdown text, lines joined with "\n".
+ */
+function renderMarkdown(ctx) {
+    const { input, timeline, contributingSignals, peakNode, errorTraces, followUps, synopsis } = ctx;
+    // Row caps per table.
+    const MAX_TIMELINE_ROWS = 20;
+    const MAX_NODE_ROWS = 30;
+    const MAX_SIGNAL_ROWS = 10;
+    const MAX_TRACE_ROWS = 10;
+    const nodes = input.blastRadius.nodes;
+    const highlights = input.logHighlights ?? [];
+    const lines = [];
+    lines.push(`# Post-mortem — ${input.service}`);
+    lines.push("");
+    // The two trailing spaces force a markdown line break inside the quote.
+    lines.push(`> **Window:** \`${input.fromIso}\` → \`${input.toIso}\` (\`${input.window}\`)  `);
+    lines.push(`> **Tenant:** \`${input.tenant}\`  `);
+    lines.push(`> **Generated by:** observability-mcp \`generate_postmortem\``);
+    lines.push("");
+    lines.push("## Synopsis");
+    lines.push("");
+    lines.push(synopsis);
+    lines.push("");
+    lines.push("## Anomaly timeline");
+    lines.push("");
+    if (timeline.length === 0) {
+        lines.push("_No anomaly samples in this window._");
+    }
+    else {
+        lines.push("| ts | service | score | severity | method |");
+        lines.push("|---|---|---|---|---|");
+        for (const t of timeline.slice(0, MAX_TIMELINE_ROWS)) {
+            lines.push(`| \`${t.ts}\` | \`${t.service}\` | ${t.score} | ${t.severity} | ${t.method} |`);
+        }
+        if (timeline.length > MAX_TIMELINE_ROWS)
+            lines.push(`| … | _${timeline.length - MAX_TIMELINE_ROWS} more rows_ |  |  |  |`);
+    }
+    lines.push("");
+    lines.push("## Blast radius at peak");
+    lines.push("");
+    if (peakNode) {
+        lines.push(`Root node: **\`${peakNode.name}\`** (\`${peakNode.kind}\`).`);
+    }
+    else {
+        lines.push("_Topology snapshot empty._");
+    }
+    lines.push("");
+    if (nodes.length > 0) {
+        lines.push("| node | kind |");
+        lines.push("|---|---|");
+        for (const n of nodes.slice(0, MAX_NODE_ROWS)) {
+            lines.push(`| \`${n.name}\`${n.root ? " *(root)*" : ""} | \`${n.kind}\` |`);
+        }
+        // Tell the reader when nodes were cut off, as the timeline table does.
+        if (nodes.length > MAX_NODE_ROWS)
+            lines.push(`| … | _${nodes.length - MAX_NODE_ROWS} more nodes_ |`);
+    }
+    lines.push("");
+    lines.push(`Edges in radius: **${input.blastRadius.edges.length}**.`);
+    lines.push("");
+    lines.push("## Contributing signals (ranked)");
+    lines.push("");
+    if (contributingSignals.length === 0) {
+        lines.push("_No anomaly samples to rank._");
+    }
+    else {
+        lines.push("| signal | samples | mean score |");
+        lines.push("|---|---|---|");
+        for (const s of contributingSignals.slice(0, MAX_SIGNAL_ROWS)) {
+            lines.push(`| \`${s.signal}\` | ${s.count} | ${s.meanScore} |`);
+        }
+        if (contributingSignals.length > MAX_SIGNAL_ROWS)
+            lines.push(`| … | _${contributingSignals.length - MAX_SIGNAL_ROWS} more signals_ |  |`);
+    }
+    lines.push("");
+    lines.push("## Related traces");
+    lines.push("");
+    if (input.traces.length === 0) {
+        lines.push("_No traces returned for the window. Configure a Tempo / Jaeger source if traces are expected._");
+    }
+    else {
+        lines.push("| trace | service | duration ms | error |");
+        lines.push("|---|---|---|---|");
+        for (const t of input.traces.slice(0, MAX_TRACE_ROWS)) {
+            lines.push(`| \`${t.traceId}\` | \`${t.rootService}\` | ${t.durationMs} | ${t.hasError ? "yes" : "no"} |`);
+        }
+        // The leading "\n" leaves a blank line so the note is not parsed
+        // as another table row.
+        if (errorTraces > 0)
+            lines.push(`\n_${errorTraces} of the returned traces carried error spans._`);
+    }
+    lines.push("");
+    if (highlights.length > 0) {
+        lines.push("## Log highlights");
+        lines.push("");
+        for (const l of highlights)
+            lines.push(`- ${l}`);
+        lines.push("");
+    }
+    lines.push("## Suggested follow-ups");
+    lines.push("");
+    for (const f of followUps)
+        lines.push(`- ${f}`);
+    lines.push("");
+    lines.push("---");
+    lines.push("");
+    lines.push(`*Generated by observability-mcp \`generate_postmortem\` — see \`docs/postmortems.md\` for the prompt sources.*`);
+    lines.push("");
+    // Nothing is bounded here: the table caps above already limit those
+    // sections. Log highlights and follow-ups are emitted in full.
+    return lines.join("\n");
+}

package/dist/postmortem/synthesizer.test.d.ts ADDED Viewed

	@@ -0,0 +1 @@
1	+ export {};

package/dist/postmortem/synthesizer.test.js ADDED Viewed

@@ -0,0 +1,141 @@
+import { test } from "node:test";
+import assert from "node:assert/strict";
+import { synthesizePostmortem, } from "./synthesizer.js";
+/**
+ * Build a minimal, valid post-mortem input for the tests: service
+ * "payment", a one-hour window, and no anomalies, nodes, edges or traces.
+ *
+ * @param overrides Fields that replace the defaults.
+ * @returns A fresh input object.
+ */
+function input(overrides = {}) {
+    const defaults = {
+        service: "payment",
+        window: "1h",
+        tenant: "default",
+        fromIso: "2026-06-06T00:00:00.000Z",
+        toIso: "2026-06-06T01:00:00.000Z",
+        anomalies: [],
+        blastRadius: { nodes: [], edges: [] },
+        traces: [],
+    };
+    return { ...defaults, ...overrides };
+}
+/**
+ * Build one anomaly sample for service "payment".
+ *
+ * @param ts Sample timestamp.
+ * @param score Anomaly score.
+ * @param method Detection method (default "mad").
+ * @param severity Severity label (default "warn").
+ * @param signal Optional signal label; left undefined when omitted.
+ * @returns The sample object.
+ */
+function anomaly(ts, score, method = "mad", severity = "warn", signal) {
+    const sample = { ts, service: "payment", score, method, severity, signal };
+    return sample;
+}
+// With no anomalies the synthesizer emits the "no anomalies" synopsis and
+// exactly one follow-up, which points at the history sink configuration.
+test("synthesizePostmortem: empty input returns synopsis + 'no anomalies' follow-up", () => {
+    const r = synthesizePostmortem(input());
+    assert.match(r.synopsis, /No anomalies recorded/);
+    assert.equal(r.sections.timeline.length, 0);
+    assert.equal(r.sections.followUps.length, 1);
+    assert.match(r.sections.followUps[0], /OMCP_ANOMALY_HISTORY_REMOTE_WRITE/);
+});
+// Samples are passed out of order on purpose; the structured timeline
+// must come back ordered by timestamp.
+test("synthesizePostmortem: timeline is sorted by ts ascending", () => {
+    const r = synthesizePostmortem(input({
+        anomalies: [
+            anomaly("2026-06-06T00:30:00Z", 0.5),
+            anomaly("2026-06-06T00:10:00Z", 0.4),
+            anomaly("2026-06-06T00:50:00Z", 0.9),
+        ],
+    }));
+    assert.deepEqual(r.sections.timeline.map((t) => t.ts), ["2026-06-06T00:10:00Z", "2026-06-06T00:30:00Z", "2026-06-06T00:50:00Z"]);
+});
+// Two samples share the "request_latency" label and one carries
+// "error_rate"; groups are ranked by their rounded mean score.
+test("synthesizePostmortem: contributing signals aggregated by signal label + ranked by mean score desc", () => {
+    const r = synthesizePostmortem(input({
+        anomalies: [
+            anomaly("2026-06-06T00:10Z", 0.5, "mad", "warn", "request_latency"),
+            anomaly("2026-06-06T00:20Z", 0.4, "mad", "warn", "request_latency"),
+            anomaly("2026-06-06T00:30Z", 0.95, "seasonality", "critical", "error_rate"),
+        ],
+    }));
+    const sigs = r.sections.contributingSignals;
+    assert.equal(sigs.length, 2);
+    // error_rate (0.95 mean) ranks above request_latency (0.45 mean)
+    assert.equal(sigs[0].signal, "error_rate");
+    assert.equal(sigs[0].count, 1);
+    assert.equal(sigs[0].meanScore, 0.95);
+    assert.equal(sigs[1].signal, "request_latency");
+    assert.equal(sigs[1].count, 2);
+    assert.equal(sigs[1].meanScore, 0.45);
+});
+// A sample without a signal label is grouped under its method name.
+test("synthesizePostmortem: missing signal label falls back to method", () => {
+    const r = synthesizePostmortem(input({ anomalies: [anomaly("2026-06-06T00:10Z", 0.6, "correlator")] }));
+    assert.equal(r.sections.contributingSignals[0].signal, "correlator");
+});
+// 0.95 is above the 0.9 "critical" cut-off used by the follow-up rules.
+test("synthesizePostmortem: critical peak triggers a follow-up mentioning the threshold", () => {
+    const r = synthesizePostmortem(input({ anomalies: [anomaly("2026-06-06T00:30Z", 0.95)] }));
+    assert.ok(r.sections.followUps.some((f) => /Peak anomaly score 0\.95/.test(f)));
+});
+// One trace with hasError=true is enough to suggest the errorsOnly drill-in.
+test("synthesizePostmortem: errors-in-traces triggers errorsOnly drill-in suggestion", () => {
+    const r = synthesizePostmortem(input({
+        anomalies: [anomaly("2026-06-06T00:10Z", 0.6)],
+        traces: [
+            { traceId: "aaa", rootName: "GET /pay", rootService: "payment", durationMs: 800, hasError: true },
+        ],
+    }));
+    assert.ok(r.sections.followUps.some((f) => /errorsOnly=true/.test(f)));
+});
+// Seven nodes exceeds the "more than 5 nodes" rule for the stale-topology hint.
+test("synthesizePostmortem: large blast radius triggers stale-topology hint", () => {
+    const nodes = Array.from({ length: 7 }, (_, i) => ({ id: `n${i}`, kind: "pod", name: `n${i}`, root: i === 0 }));
+    const r = synthesizePostmortem(input({
+        anomalies: [anomaly("2026-06-06T00:10Z", 0.6)],
+        blastRadius: { nodes, edges: [{ from: "n0", to: "n1", relation: "CALLS" }] },
+    }));
+    assert.ok(r.sections.followUps.some((f) => /7 nodes/.test(f) && /stale topology/i.test(f)));
+});
+test("synthesizePostmortem: clean window returns a 'stable, consider closing' follow-up", () => {
+    // The "all signals stable" branch fires only when:
+    //   anomalies present (not zero)
+    //   peak < 0.9
+    //   no error traces
+    //   blast radius <= 5
+    //   no log highlights
+    const r = synthesizePostmortem(input({
+        anomalies: [anomaly("2026-06-06T00:10Z", 0.3)],
+        blastRadius: { nodes: [{ id: "n0", kind: "pod", name: "n0", root: true }], edges: [] },
+    }));
+    assert.ok(r.sections.followUps.some((f) => /stable for this window/.test(f)));
+});
+// Every section is populated (anomaly, node, edge, trace, log highlight)
+// so the optional "Log highlights" heading is rendered too. Each heading
+// must appear after the previous one, which checks presence and order
+// together for the whole list.
+test("synthesizePostmortem: markdown contains every section header in order", () => {
+    const r = synthesizePostmortem(input({
+        anomalies: [anomaly("2026-06-06T00:10Z", 0.7)],
+        blastRadius: {
+            nodes: [{ id: "p", kind: "deployment", name: "payment", root: true }],
+            edges: [{ from: "p", to: "rds", relation: "READS_FROM" }],
+        },
+        traces: [{ traceId: "t", rootName: "GET /pay", rootService: "payment", durationMs: 200, hasError: false }],
+        logHighlights: ["payment-service: 12 5xx in window"],
+    }));
+    // Position of the previously matched heading; -1 before the first one.
+    let cursor = -1;
+    for (const heading of [
+        "# Post-mortem — payment",
+        "## Synopsis",
+        "## Anomaly timeline",
+        "## Blast radius at peak",
+        "## Contributing signals (ranked)",
+        "## Related traces",
+        "## Log highlights",
+        "## Suggested follow-ups",
+    ]) {
+        // Searching from just past the previous match yields -1 when the
+        // heading is missing or only appears earlier in the document.
+        const at = r.markdown.indexOf(heading, cursor + 1);
+        assert.ok(at > cursor, `markdown missing or out-of-order section: ${heading}`);
+        cursor = at;
+    }
+});
+// 25 samples one minute apart: the structured timeline keeps them all,
+// while the markdown table shows 20 rows plus a "5 more rows" marker.
+test("synthesizePostmortem: timeline > 20 rows is truncated with an ellipsis row", () => {
+    const anomalies = Array.from({ length: 25 }, (_, i) => anomaly(`2026-06-06T00:${String(i).padStart(2, "0")}:00Z`, 0.5 + i * 0.01));
+    const r = synthesizePostmortem(input({ anomalies }));
+    // The structured section has all 25
+    assert.equal(r.sections.timeline.length, 25);
+    // The markdown table is capped at 20 data rows + an ellipsis row
+    // — count rows specifically inside the Anomaly timeline section
+    // (other sections also use | ` ... | tables and would inflate a
+    // global grep).
+    const md = r.markdown;
+    const timelineStart = md.indexOf("## Anomaly timeline");
+    const blastStart = md.indexOf("## Blast radius at peak");
+    const timelineSection = md.slice(timelineStart, blastStart);
+    const tableRows = timelineSection.split("\n").filter((l) => l.startsWith("| `")).length;
+    assert.equal(tableRows, 20);
+    assert.match(timelineSection, /_5 more rows_/);
+});
+// The report echoes service, window and ISO bounds straight from the input.
+test("synthesizePostmortem: report carries the input window + iso bounds back into the structured shape", () => {
+    const r = synthesizePostmortem(input({ window: "6h" }));
+    assert.equal(r.service, "payment");
+    assert.equal(r.window, "6h");
+    assert.equal(r.fromIso, "2026-06-06T00:00:00.000Z");
+    assert.equal(r.toIso, "2026-06-06T01:00:00.000Z");
+});

package/dist/products/loader.d.ts CHANGED Viewed

@@ -12,8 +12,13 @@
  *     (YAML or JSON). Missing/empty file → empty catalog.
  *   - Strict validation: unknown action / unknown resource /
  *     unexpected keys reject loudly.
- *   - Hot-reload on next /api/products call (slice 2 wires the
- *     reload trigger; for now the file is read once at boot).
+ *   - Mtime-poll hot-reload: callers (e.g. each /api/products
+ *     handler) `await store.maybeReload()` before reading. If the
+ *     file mtime advanced since the last load, the store re-parses
+ *     and atomically swaps the in-memory file; parse errors keep
+ *     the previous good state and log loudly. One `stat()` call per
+ *     reload-aware request — too cheap to matter vs. the network
+ *     round-trip, no FSWatcher platform fragility (WSL / NFS).
  */
 export interface Product {
     /** Stable identifier — used in URLs, audit entries, /api/products/{id}. */
@@ -47,7 +52,30 @@ export declare function parseProductsText(text: string, origin: string): Product
 /** In-memory store with tenant- and status-aware queries. */
 export declare class ProductsStore {
     private file;
-    constructor(file?: ProductsFile);
+    /** Optional source file path. When set, `maybeReload()` polls its
+     *  mtime and re-parses on change. Mutations via upsert/delete update
+     *  `lastMtimeMs` after the caller persists, so the store does not
+     *  reload its own writes. */
+    private path?;
+    private lastMtimeMs;
+    constructor(file?: ProductsFile, opts?: {
+        path?: string;
+        initialMtimeMs?: number;
+    });
+    /** Re-read the source file if its mtime has advanced since the last
+     *  load. No-op when no path was supplied at construction. Parse or
+     *  IO errors are logged and the previous good state is kept — the
+     *  invariant is "the store always reflects a valid catalogue", so a
+     *  broken edit on disk never takes the running server down. */
+    maybeReload(): Promise<{
+        reloaded: boolean;
+    }>;
+    /** Re-stat the source file and pin the mtime cursor to its current
+     *  value. Call this after a successful write so the store does not
+     *  treat its own change as an external reload trigger. Best-effort:
+     *  if the stat fails, the next maybeReload() will simply reload the
+     *  file once and find it identical. */
+    pinMtimeAfterWrite(): Promise<void>;
     /** Return the product list. When `tenant` is set, filters to that
      *  tenant (entries without a tenant field treated as "default").
      *  When `includeStaging` is false (default), staging products are

package/dist/products/loader.js CHANGED Viewed

@@ -12,10 +12,15 @@
  *     (YAML or JSON). Missing/empty file → empty catalog.
  *   - Strict validation: unknown action / unknown resource /
  *     unexpected keys reject loudly.
- *   - Hot-reload on next /api/products call (slice 2 wires the
- *     reload trigger; for now the file is read once at boot).
+ *   - Mtime-poll hot-reload: callers (e.g. each /api/products
+ *     handler) `await store.maybeReload()` before reading. If the
+ *     file mtime advanced since the last load, the store re-parses
+ *     and atomically swaps the in-memory file; parse errors keep
+ *     the previous good state and log loudly. One `stat()` call per
+ *     reload-aware request — too cheap to matter vs. the network
+ *     round-trip, no FSWatcher platform fragility (WSL / NFS).
  */
-import { readFile, writeFile, rename } from "node:fs/promises";
+import { readFile, writeFile, rename, stat } from "node:fs/promises";
 import yaml from "js-yaml";
 const EMPTY = { products: [] };
 const VALID_STATUS = new Set(["published", "staging"]);
@@ -134,8 +139,76 @@ export function parseProductsText(text, origin) {
 /** In-memory store with tenant- and status-aware queries. */
 export class ProductsStore {
     file;
-    constructor(file = EMPTY) {
+    /** Optional source file path. When set, `maybeReload()` polls its
+     *  mtime and re-parses on change. After persisting an upsert/delete,
+     *  callers invoke `pinMtimeAfterWrite()` to advance `lastMtimeMs`,
+     *  so the store does not reload its own writes. */
+    path;
+    lastMtimeMs = 0;
+    constructor(file = EMPTY, opts = {}) {
         this.file = file;
+        this.path = opts.path;
+        this.lastMtimeMs = opts.initialMtimeMs ?? 0;
+    }
+    /** Re-read the source file if its mtime has advanced since the last
+     *  load. No-op when no path was supplied at construction. Parse or
+     *  IO errors are logged and the previous good state is kept — the
+     *  invariant is "the store always reflects a valid catalogue", so a
+     *  broken edit on disk never takes the running server down. */
+    async maybeReload() {
+        if (!this.path)
+            return { reloaded: false };
+        let mtimeMs;
+        try {
+            const s = await stat(this.path);
+            mtimeMs = s.mtimeMs;
+        }
+        catch (e) {
+            const code = e.code;
+            // File gone (ENOENT) — keep the last good state, silently. Once
+            // the file is re-created, stat() succeeds again and the mtime
+            // check below reloads it (if its mtime is past the cursor).
+            if (code !== "ENOENT") {
+                console.warn(`[products] hot-reload stat(${this.path}) failed: ${e.message} — keeping previous catalogue`);
+            }
+            return { reloaded: false };
+        }
+        if (mtimeMs <= this.lastMtimeMs)
+            return { reloaded: false };
+        let next;
+        try {
+            next = await readProductsFile(this.path);
+        }
+        catch (e) {
+            // readProductsFile downgrades IO errors to EMPTY but lets
+            // parse errors (ProductsLoadError) propagate — so a broken
+            // YAML edit lands here, and we explicitly do NOT swap state.
+            console.warn(`[products] hot-reload of ${this.path} failed: ${e.message} — keeping previous catalogue`);
+            // Bump the mtime cursor anyway so we don't re-log the same
+            // failure on every subsequent request until the operator fixes
+            // the file (next save advances mtime past this value).
+            this.lastMtimeMs = mtimeMs;
+            return { reloaded: false };
+        }
+        this.file = next;
+        this.lastMtimeMs = mtimeMs;
+        return { reloaded: true };
+    }
+    /** Re-stat the source file and pin the mtime cursor to its current
+     *  value. Call this after a successful write so the store does not
+     *  treat its own change as an external reload trigger. Best-effort:
+     *  if the stat fails, the next maybeReload() will simply reload the
+     *  file once and find it identical. */
+    async pinMtimeAfterWrite() {
+        if (!this.path)
+            return;
+        try {
+            const s = await stat(this.path);
+            this.lastMtimeMs = s.mtimeMs;
+        }
+        catch {
+            // Silent — see method JSDoc.
+        }
     }
     /** Return the product list. When `tenant` is set, filters to that
      *  tenant (entries without a tenant field treated as "default").

package/dist/products/loader.test.js CHANGED Viewed

@@ -1,6 +1,6 @@
 import { test } from "node:test";
 import assert from "node:assert/strict";
-import { parseProductsText, ProductsStore, ProductsLoadError } from "./loader.js";
+import { parseProductsText, ProductsStore, ProductsLoadError, readProductsFile } from "./loader.js";
 test("parseProductsText — empty/minimal products array", () => {
     const f = parseProductsText("products: []", "test");
     assert.deepEqual(f.products, []);
@@ -166,3 +166,92 @@ test("ProductsLoadError is the throw class", () => {
     }
     assert.fail("expected throw");
 });
+test("ProductsStore.maybeReload — picks up out-of-band edits on next call", async () => {
+    const { mkdtemp, rm, writeFile, utimes } = await import("node:fs/promises");
+    const { tmpdir } = await import("node:os");
+    const { join } = await import("node:path");
+    const dir = await mkdtemp(join(tmpdir(), "omcp-products-reload-"));
+    try {
+        const file = join(dir, "products.yaml");
+        await writeFile(file, "products:\n  - id: a\n    name: A\n", "utf8");
+        const initial = await readProductsFile(file);
+        const store = new ProductsStore(initial, { path: file });
+        await store.pinMtimeAfterWrite();
+        assert.equal(store.list().length, 1);
+        assert.equal(store.list()[0].id, "a");
+        // Simulate an out-of-band edit. Bump mtime explicitly because
+        // some filesystems (WSL → 9P) round mtime to the second, so a
+        // back-to-back write can land in the same second and look
+        // unchanged to stat().
+        await writeFile(file, "products:\n  - id: a\n    name: A\n  - id: b\n    name: B\n", "utf8");
+        const future = new Date(Date.now() + 5_000);
+        await utimes(file, future, future);
+        const { reloaded } = await store.maybeReload();
+        assert.equal(reloaded, true);
+        assert.equal(store.list().length, 2);
+        // A second call with no further edit is a no-op.
+        const r2 = await store.maybeReload();
+        assert.equal(r2.reloaded, false);
+    }
+    finally {
+        await rm(dir, { recursive: true, force: true });
+    }
+});
+test("ProductsStore.maybeReload — broken YAML on disk keeps previous good state", async () => {
+    const { mkdtemp, rm, writeFile, utimes } = await import("node:fs/promises");
+    const { tmpdir } = await import("node:os");
+    const { join } = await import("node:path");
+    const dir = await mkdtemp(join(tmpdir(), "omcp-products-broken-"));
+    try {
+        const file = join(dir, "products.yaml");
+        await writeFile(file, "products:\n  - id: a\n    name: A\n", "utf8");
+        const store = new ProductsStore(await readProductsFile(file), { path: file });
+        await store.pinMtimeAfterWrite();
+        // Corrupt the file with an unknown key on the product entry —
+        // fails the strict typo guard inside parseProductsText.
+        await writeFile(file, "products:\n  - id: a\n    name: A\n    junk: true\n", "utf8");
+        const future = new Date(Date.now() + 5_000);
+        await utimes(file, future, future);
+        const { reloaded } = await store.maybeReload();
+        // We did NOT swap state — caller sees the previous good catalogue.
+        assert.equal(reloaded, false);
+        assert.equal(store.list().length, 1);
+        assert.equal(store.list()[0].name, "A");
+    }
+    finally {
+        await rm(dir, { recursive: true, force: true });
+    }
+});
+test("ProductsStore.maybeReload — no path = no-op", async () => {
+    const store = new ProductsStore({ products: [{ id: "a", name: "A" }] });
+    const r = await store.maybeReload();
+    assert.equal(r.reloaded, false);
+    assert.equal(store.list().length, 1);
+});
+test("ProductsStore.pinMtimeAfterWrite — own writes do not trigger a redundant reload", async () => {
+    const { mkdtemp, rm, writeFile, utimes } = await import("node:fs/promises");
+    const { tmpdir } = await import("node:os");
+    const { join } = await import("node:path");
+    const { writeProductsFile } = await import("./loader.js");
+    const dir = await mkdtemp(join(tmpdir(), "omcp-products-pin-"));
+    try {
+        const file = join(dir, "products.yaml");
+        await writeFile(file, "products:\n  - id: a\n    name: A\n", "utf8");
+        const store = new ProductsStore(await readProductsFile(file), { path: file });
+        await store.pinMtimeAfterWrite();
+        // Simulate the server-side mutate-then-persist path.
+        store.upsert({ id: "b", name: "B" });
+        // Persist, then force mtime forward via utimes so the write is
+        // guaranteed to land past our cursor (1-second-resolution FS guard).
+        const future = new Date(Date.now() + 5_000);
+        await writeProductsFile(file, store.snapshot());
+        await utimes(file, future, future);
+        await store.pinMtimeAfterWrite();
+        const { reloaded } = await store.maybeReload();
+        assert.equal(reloaded, false, "own write must not re-trigger maybeReload");
+        assert.equal(store.list().length, 2);
+    }
+    finally {
+        await rm(dir, { recursive: true, force: true });
+    }
+});