npm - euparliamentmonitor - Versions diffs - 0.9.21 → 0.9.23 - Mend

euparliamentmonitor 0.9.21 → 0.9.23

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (47) hide show

package/package.json +6 -2
package/scripts/aggregator/article-metadata.js +69 -14
package/scripts/aggregator/editorial-brief-resolver.js +23 -0
package/scripts/aggregator/html/headline.d.ts +41 -9
package/scripts/aggregator/html/headline.js +69 -10
package/scripts/aggregator/html/shell.js +73 -17
package/scripts/aggregator/manifest/index.d.ts +1 -1
package/scripts/aggregator/manifest/index.js +1 -1
package/scripts/aggregator/manifest/resolver.d.ts +28 -1
package/scripts/aggregator/manifest/resolver.js +61 -5
package/scripts/aggregator/markdown-renderer.js +11 -0
package/scripts/aggregator/metadata/artifact-category-heading.d.ts +81 -0
package/scripts/aggregator/metadata/artifact-category-heading.js +353 -0
package/scripts/aggregator/metadata/artifact-walker.js +29 -10
package/scripts/aggregator/metadata/brief-body.d.ts +12 -0
package/scripts/aggregator/metadata/brief-body.js +69 -0
package/scripts/aggregator/metadata/briefing-highlight.d.ts +47 -0
package/scripts/aggregator/metadata/briefing-highlight.js +469 -0
package/scripts/aggregator/metadata/editorial-highlight.d.ts +18 -0
package/scripts/aggregator/metadata/editorial-highlight.js +40 -1
package/scripts/aggregator/metadata/heading-rules.d.ts +2 -81
package/scripts/aggregator/metadata/heading-rules.js +78 -269
package/scripts/aggregator/metadata/keyword-filters.d.ts +60 -0
package/scripts/aggregator/metadata/keyword-filters.js +156 -0
package/scripts/aggregator/metadata/lede-extractor.js +11 -2
package/scripts/aggregator/metadata/priority-finding-cleaning.d.ts +22 -0
package/scripts/aggregator/metadata/priority-finding-cleaning.js +181 -0
package/scripts/aggregator/metadata/priority-finding-highlight.js +75 -159
package/scripts/aggregator/metadata/resolve-helpers.d.ts +34 -0
package/scripts/aggregator/metadata/resolve-helpers.js +202 -15
package/scripts/aggregator/metadata/seo-budgets.d.ts +140 -0
package/scripts/aggregator/metadata/seo-budgets.js +202 -0
package/scripts/aggregator/metadata/text-truncate.d.ts +75 -0
package/scripts/aggregator/metadata/text-truncate.js +277 -0
package/scripts/aggregator/metadata/text-utils-constants.d.ts +96 -0
package/scripts/aggregator/metadata/text-utils-constants.js +209 -0
package/scripts/aggregator/metadata/text-utils.d.ts +32 -143
package/scripts/aggregator/metadata/text-utils.js +119 -439
package/scripts/aggregator/metadata/title-rejection.d.ts +37 -0
package/scripts/aggregator/metadata/title-rejection.js +179 -0
package/scripts/copy-vendor.js +84 -112
package/scripts/dump-article-seo.js +640 -0
package/scripts/fix-mermaid-diagrams.js +931 -0
package/scripts/generators/news-indexes/backfill.d.ts +6 -1
package/scripts/generators/news-indexes/backfill.js +71 -4
package/scripts/validate-article-seo.js +534 -0
package/scripts/validate-mermaid-diagrams.js +306 -0

package/scripts/aggregator/metadata/keyword-filters.js ADDED Viewed

@@ -0,0 +1,156 @@
+// SPDX-FileCopyrightText: 2024-2026 Hack23 AB
+// SPDX-License-Identifier: Apache-2.0
+/**
+ * @module Aggregator/Metadata/KeywordFilters
+ * @description Cross-site keyword catalogue and noise-token filter used
+ * by {@link buildSeoKeywords} in `resolve-helpers.ts`.
+ *
+ * Two responsibilities:
+ *
+ *   1. **Always-on cross-site keywords** ({@link CROSS_SITE_KEYWORDS})
+ *      are prepended to every article's `<meta name="keywords">` list
+ *      regardless of language, so search-engine discovery of the
+ *      Hack23 civic-tech portfolio (EU Parliament Monitor +
+ *      Riksdagsmonitor + CIA) is consistent across all 14 localized
+ *      surfaces. The user explicitly requested
+ *      `riksdagsmonitor, political intelligence, riksdag, regeringen`
+ *      (the sister Swedish-Parliament project) plus EP analogues.
+ *
+ *   2. **Noise-token rejection** ({@link isNoiseKeywordToken}) drops
+ *      the UUID-fragment tokens (`77fc920c`, `3a76`, `9db5`, …) and
+ *      synthetic run-id slugs (`propositions-run261-1779431162`) that
+ *      the previous keyword extractor leaked into `<head>` when a
+ *      brief mentioned its own run id editorially (e.g.
+ *      `Analysis run 77fc920c-3a76-4813-9db5-43a7e9acc25e returned
+ *      0 classified actors`).
+ *
+ * Pure leaf module — no imports.
+ */
+/**
+ * Cross-site SEO keywords prepended to every article in every
+ * language. Order is meaningful: stronger civic-tech-portfolio terms
+ * first so they appear ahead of the per-article-type keywords when
+ * the 16-entry budget is exceeded.
+ */
+export const CROSS_SITE_KEYWORDS = [
+    'EU Parliament Monitor',
+    'European Parliament',
+    'European Commission',
+    'political intelligence',
+    'Riksdagsmonitor',
+    'Riksdag',
+    'Regeringen',
+];
+/**
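+ * Lower-case allowlist of common English words that the noise filter
+ * is meant to keep even though they consist solely of hex letters
+ * (e.g. `face`, `dead`, `beef`). Kept intentionally tiny to avoid
+ * lexicon drift.
+ *
+ * NOTE(review): as written, {@link isNoiseKeywordToken} rejects every
+ * token shorter than 4 characters before this set is consulted, so the
+ * 3-letter entries (`fed`, `add`, `dad`, `bad`) are never reached, and
+ * all-letter hex tokens of 4–7 characters are kept whether or not they
+ * are listed here.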
+ */
+const HEX_ALPHABETIC_ALLOWLIST = new Set([
+    'face',
+    'fade',
+    'dead',
+    'beef',
+    'cafe',
+    'feed',
+    'deed',
+    'fed',
+    'add',
+    'dad',
+    'bad',
+]);
+/**
+ * Detect run-id slug chains of the form
+ * `<letters>(-<letters>)*-run<digits>(-<digits>)*` — e.g.
+ * `propositions-run261-1779431162` or
+ * `breaking-news-run17-1234567890`. Implemented as a split-and-scan
+ * walker (instead of a single backtracking regex) to satisfy the
+ * `security/detect-unsafe-regex` lint rule.
+ *
+ * @param lower - Lower-case candidate token
+ * @returns `true` when the token matches the run-id slug shape
+ */
+function isRunSlugChain(lower) {
+    const parts = lower.split('-');
+    if (parts.length < 2)
+        return false;
+    let runIndex = -1;
+    for (let i = 0; i < parts.length; i++) {
+        if (/^run\d+$/u.test(parts[i] ?? '')) {
+            runIndex = i;
+            break;
+        }
+    }
+    if (runIndex <= 0)
+        return false;
+    // Every segment before `run<digits>` must be all-letters; every
+    // segment after must be all-digits.
+    for (let i = 0; i < runIndex; i++) {
+        if (!/^[a-z]+$/u.test(parts[i] ?? ''))
+            return false;
+    }
+    for (let i = runIndex + 1; i < parts.length; i++) {
+        if (!/^\d+$/u.test(parts[i] ?? ''))
+            return false;
+    }
+    return true;
+}
+/**
+ * Decide whether a single keyword token should be discarded as noise.
+ *
+ * The current rules reject tokens that:
+ *
+ *   - Are empty, or shorter than 4 characters after trimming.
+ *   - Look like a UUID hex chunk: ≥4 chars and consist solely of the
+ *     `[0-9a-f]` alphabet **and** contain at least one digit (so
+ *     real English words like `dead` / `face` survive). Tokens of
+ *     length ≥8 are always rejected (a real English word of that
+ *     length composed exclusively of hex letters is vanishingly rare;
+ *     the allowlist guards the short cases).
+ *   - Are mostly digits (≥80 % digit characters) — runtime epoch
+ *     suffixes such as `1779431162` and committee-codeoid mashes like
+ *     `2024k1234`.
+ *   - Start with `run` and end with all-digits (`run261`, `run17`),
+ *     the per-run slug suffix the aggregator stamps onto run ids.
+ *   - Match the full opaque-runId shape `<type>-run<digits>-<digits>`
+ *     after a strip / normalization round-trip.
+ *
+ * Returns `false` for normal vocabulary so the keyword list stays
+ * useful — every reject path is intentionally narrow.
+ *
+ * @param token - Single token candidate
+ * @returns `true` when the token should be dropped from keywords
+ */
+export function isNoiseKeywordToken(token) {
+    if (!token)
+        return true;
+    const trimmed = token.trim();
+    if (trimmed.length < 4)
+        return true;
+    const lower = trimmed.toLowerCase();
+    // Reject pure-digit and digit-dominated tokens.
+    if (/^\d+$/u.test(lower))
+        return true;
+    const digitCount = (lower.match(/\d/gu) ?? []).length;
+    if (digitCount > 0 && digitCount / lower.length >= 0.8)
+        return true;
+    // Reject `run<digits>` slugs and `…-run<digits>-<digits>` chains.
+    if (/^run\d+$/u.test(lower))
+        return true;
+    if (isRunSlugChain(lower))
+        return true;
+    // Reject hex-shaped tokens unless they are common English words.
+    const isHex = /^[0-9a-f]+$/u.test(lower);
+    if (isHex) {
+        if (lower.length >= 8)
+            return true;
+        if (digitCount > 0)
+            return true;
+        if (HEX_ALPHABETIC_ALLOWLIST.has(lower))
+            return false;
+        // Short all-letter hex words: keep (avoids overfitting).
+        return false;
+    }
+    return false;
+}
+//# sourceMappingURL=keyword-filters.js.map

package/scripts/aggregator/metadata/lede-extractor.js CHANGED Viewed

@@ -13,7 +13,7 @@
  * helpers) and heading-rules (for the editorial-lede whitelist and the
  * heading-text normaliser).
  */
-import { DESCRIPTION_MAX_LENGTH, EXTENDED_DESCRIPTION_MAX_LENGTH, shouldSkipDescriptionLine, stripInlineMarkdown, stripLeadingProseLabel, truncateDescription, truncateExtendedDescription, } from './text-utils.js';
+import { DESCRIPTION_MAX_LENGTH, EXTENDED_DESCRIPTION_MAX_LENGTH, shouldSkipDescriptionLine, stripInlineMarkdown, stripLeadingBoldLabel, stripLeadingProseLabel, truncateDescription, truncateExtendedDescription, } from './text-utils.js';
 import { EDITORIAL_LEDE_HEADINGS, isLedeHeadingMatch, normaliseHeadingText, } from './heading-rules.js';
 /**
  * Process one Markdown line against the in-progress paragraph buffer.
@@ -35,7 +35,16 @@ function collectProseLine(line, buf) {
         return 'continue';
     if (shouldSkipDescriptionLine(line))
         return hasBuffer ? 'break' : 'continue';
-    const plain = stripLeadingProseLabel(stripInlineMarkdown(line));
+    // Strip the leading `**Label:**` opener (any language) *before*
+    // running the inline-markdown stripper, so localized BLUF labels
+    // like `**Fråga:**` / `**主題:**` / `**الموضوع:**` are removed
+    // structurally rather than leaking into the description as plain
+    // text (`"Fråga: …"`). The English `**Issue:**` line is already
+    // skipped earlier by METADATA_LINE_PREFIXES; this code path covers
+    // the 13 non-English locales for which the label vocabulary is
+    // open-ended.
+    const stripped = stripLeadingBoldLabel(line);
+    const plain = stripLeadingProseLabel(stripInlineMarkdown(stripped));
     if (!hasBuffer && plain.length < 40)
         return 'continue';
     buf.lines.push(plain);

package/scripts/aggregator/metadata/priority-finding-cleaning.d.ts ADDED Viewed

@@ -0,0 +1,22 @@
+/**
+ * Strip the trailing parenthesised metadata that briefs append to every
+ * priority-finding name — procedure codes, dates, committee tags. The
+ * regex is anchored to the end of the text and its body excludes
+ * parentheses, so it removes only the LAST (non-nested) parenthesised
+ * group, and only when that group holds 3–80 characters.
+ *
+ * @param text - Headline or paragraph text
+ * @returns Text with the trailing `(…)` stripped
+ */
+export declare function stripPriorityTailMetadata(text: string): string;
+/**
+ * Normalise a priority-finding headline: drop the
+ * `Trigger N:` / `Dossier N:` / leading-numeric prefix, strip trailing
+ * parenthesised metadata (`(TA-10-2026-0160, 2026-04-30)`,
+ * `(ITRE/ENVI)`), and trim residual punctuation. The result is a
+ * headline-shaped string suitable for `<title>` use.
+ *
+ * @param raw - Raw bold-title or heading text
+ * @returns Cleaned headline (may be empty after stripping)
+ */
+export declare function cleanPriorityHeadline(raw: string): string;
+//# sourceMappingURL=priority-finding-cleaning.d.ts.map

package/scripts/aggregator/metadata/priority-finding-cleaning.js ADDED Viewed

@@ -0,0 +1,181 @@
+// SPDX-FileCopyrightText: 2024-2026 Hack23 AB
+// SPDX-License-Identifier: Apache-2.0
+/**
+ * @module Aggregator/Metadata/PriorityFindingCleaning
+ * @description Headline-cleaning helpers extracted from
+ * `priority-finding-highlight.ts` to keep that module under the
+ * 600-line drift-guard budget enforced by
+ * `test/unit/source-file-size.test.js`.
+ *
+ * Public entry point: {@link cleanPriorityHeadline} — normalises a
+ * raw bold-title / heading string by stripping priority decorations
+ * (`🔴 CRITICAL — `), editorial prefixes (`Trigger 1: `), trailing
+ * confidence markers (`🔴 CRITICAL`), and parenthesised tail metadata
+ * (`(TA-10-2026-0160, 2026-04-30)`).
+ *
+ * Bounded-context rules:
+ * - **Pure helpers** — no I/O, no globals.
+ * - **Deterministic** — same input always produces same output.
+ * - **Reusable** — every helper accepts a plain string and returns a
+ *   plain string; suitable for property-tests.
+ */
+import { stripInlineMarkdown } from './text-utils.js';
+/**
+ * Leading priority-label tokens stripped by {@link cleanPriorityHeadline}
+ * (`🔴 CRITICAL — Title` → `Title`). Kept as a list to bypass the
+ * unsafe-regex lint by avoiding deep alternation in a single pattern.
+ */
+const PRIORITY_LABEL_TOKENS = [
+    'CRITICAL',
+    'HIGH PRIORITY',
+    'HIGH',
+    'MEDIUM PRIORITY',
+    'MEDIUM',
+    'LOW PRIORITY',
+    'LOW',
+    'URGENT',
+    'ALERT',
+    'PRIORITY',
+];
+/**
+ * Trailing confidence-marker tokens stripped by
+ * {@link cleanPriorityHeadline}. Same rationale as
+ * {@link PRIORITY_LABEL_TOKENS}.
+ */
+const PRIORITY_TRAILING_TOKENS = [
+    'CRITICAL',
+    'HIGH PRIORITY',
+    'HIGH',
+    'MEDIUM PRIORITY',
+    'MEDIUM',
+    'LOW PRIORITY',
+    'LOW',
+];
+/**
+ * Leading editorial-prefix tokens stripped by
+ * {@link cleanPriorityHeadline} (`Trigger 1: Title` → `Title`).
+ */
+const PRIORITY_LEADING_PREFIX_TOKENS = [
+    'Trigger',
+    'Dossier',
+    'Priority',
+    'Finding',
+    'Item',
+    'Highlight',
+    'Top',
+    'Story',
+    'Alert',
+    'Judgement',
+    'Judgment',
+];
+/**
+ * Strip a leading priority decoration (`🔴 `, `CRITICAL — `) from a
+ * candidate headline. Extracted from {@link cleanPriorityHeadline} to
+ * keep cognitive complexity within budget.
+ *
+ * @param text - Candidate headline (already trimmed)
+ * @returns Headline with the leading decoration removed
+ */
+function stripPriorityLeadingDecoration(text) {
+    let out = text;
+    for (let pass = 0; pass < 2; pass++) {
+        out = out.replace(/^[^\p{L}\p{N}]+/u, '').trim();
+        for (const token of PRIORITY_LABEL_TOKENS) {
+            if (out.toLowerCase().startsWith(token.toLowerCase())) {
+                const rest = out.slice(token.length).trim();
+                const sep = rest.match(/^[:—–-]\s*(.+)$/u);
+                if (sep?.[1]) {
+                    out = sep[1].trim();
+                    break;
+                }
+            }
+        }
+    }
+    return out;
+}
+/**
+ * Strip a leading editorial prefix (`Trigger 1: `, `Dossier 2: `) and a
+ * stray leading ordinal (`1. `, `2) `) from a candidate headline. Only
+ * the first numeric component and one following separator are removed.
+ *
+ * @param text - Candidate headline
+ * @returns Headline with the leading editorial decoration removed
+ */
+function stripPriorityLeadingPrefix(text) {
+    let out = text;
+    for (const token of PRIORITY_LEADING_PREFIX_TOKENS) {
+        if (!out.toLowerCase().startsWith(token.toLowerCase()))
+            continue;
+        const rest = out.slice(token.length);
+        const match = rest.match(/^\s+\d+\s*[:–—-]\s*(.+)$/u);
+        if (match?.[1]) {
+            out = match[1];
+            break;
+        }
+    }
+    // Drop a stray leading "1. " / "2) " ordinal.
+    out = out.replace(/^\d+[.):·\s]\s*/u, '');
+    return out;
+}
+/**
+ * Strip a trailing confidence marker (`🔴 CRITICAL`, `🟡 MEDIUM`) from a
+ * candidate headline. Single pass — caller invokes inside a fixed-point
+ * loop.
+ *
+ * @param text - Candidate headline
+ * @returns Headline with the trailing confidence marker removed
+ */
+function stripPriorityTrailingMarker(text) {
+    let out = text;
+    for (const token of PRIORITY_TRAILING_TOKENS) {
+        const pattern = new RegExp(`\\s+[^\\p{L}\\p{N}\\s]?\\s*${token}\\s*$`, 'iu');
+        const next = out.replace(pattern, '');
+        if (next !== out) {
+            out = next;
+            break;
+        }
+    }
+    return out;
+}
+/**
+ * Strip the trailing parenthesised metadata that briefs append to every
+ * priority-finding name — procedure codes, dates, committee tags. The
+ * regex is anchored to the end of the text and its body excludes
+ * parentheses, so it removes only the LAST (non-nested) parenthesised
+ * group, and only when that group holds 3–80 characters.
+ *
+ * @param text - Headline or paragraph text
+ * @returns Text with the trailing `(…)` stripped
+ */
+export function stripPriorityTailMetadata(text) {
+    return text.replace(/\s*\([^()]{3,80}\)\s*$/u, '').trim();
+}
+/**
+ * Normalise a priority-finding headline: drop the
+ * `Trigger N:` / `Dossier N:` / leading-numeric prefix, strip trailing
+ * parenthesised metadata (`(TA-10-2026-0160, 2026-04-30)`,
+ * `(ITRE/ENVI)`), and trim residual punctuation. The result is a
+ * headline-shaped string suitable for `<title>` use.
+ *
+ * @param raw - Raw bold-title or heading text
+ * @returns Cleaned headline (may be empty after stripping)
+ */
+export function cleanPriorityHeadline(raw) {
+    let text = stripInlineMarkdown(raw).trim();
+    text = stripPriorityLeadingDecoration(text);
+    text = stripPriorityLeadingPrefix(text);
+    // Trailing cleanup runs in a fixed-point loop so combined patterns
+    // like "Title (Confidence, 80%): 🔴" collapse all the way down to
+    // "Title".
+    let previous = '';
+    while (previous !== text) {
+        previous = text;
+        text = stripPriorityTrailingMarker(text);
+        text = stripPriorityTailMetadata(text);
+        // Drop a trailing run of emoji / symbols (non-letter, non-digit
+        // characters preceded by whitespace) left after metadata stripping.
+        text = text.replace(/\s+[^\p{L}\p{N}\s]+\s*$/u, '');
+        // Drop trailing colons / dashes left over.
+        text = text.replace(/[\s:—–-]+$/u, '');
+        text = text.trim();
+    }
+    return text;
+}
+//# sourceMappingURL=priority-finding-cleaning.js.map

package/scripts/aggregator/metadata/priority-finding-highlight.js CHANGED Viewed

@@ -9,7 +9,9 @@
  * artifact-highlight.ts when an artefact has no usable H1.
  */
 import { normaliseHeadingText } from './heading-rules.js';
+import { cleanPriorityHeadline, stripPriorityTailMetadata } from './priority-finding-cleaning.js';
 import { DESCRIPTION_MAX_LENGTH, shouldSkipDescriptionLine, stripInlineMarkdown, stripLeadingProseLabel, truncateDescription, } from './text-utils.js';
+import { findTitleRejectionReason } from './title-rejection.js';
 /**
  * Section headings inside the executive brief that introduce the
  * named-priority-finding block (matched case-insensitively against the
@@ -290,21 +292,69 @@ function extractPriorityFindingItem(lines, i) {
  */
 const PRIORITY_METADATA_BOLD_PREFIXES = [
     'admiralty',
+    'admiralty scale',
+    'admiralty scale used',
+    'analysis owner',
+    'analyst note',
+    'analytical quality',
+    'bluf',
+    'bottom line up front',
+    'caveats and gaps',
     'classification',
+    'composition layer',
     'confidence',
-    'data sources',
+    'confidence summary',
     'data quality',
+    'data sources',
     'date',
+    'emerging patterns',
+    'forward indicators',
+    'gate target',
     'generated',
+    'headline judgement',
+    'headline judgment',
+    'horizon',
+    'imf status',
+    'issue',
+    'key assumptions',
+    'key assumptions check',
+    'key intelligence',
+    'key risk indicators',
     'lead author',
+    'master assumptions',
+    'master narrative',
     'methodology',
+    'parliamentary status',
+    'period',
+    'prepared',
+    'purpose',
+    'quality of information check',
+    'reporting',
     'reporting window',
     'run',
+    'sat documentation',
+    'sat documentation below',
+    'scope',
     'session',
+    'signal assessment',
     'source',
     'sources',
+    'threat level',
+    'tier 1 priority issues',
+    'tier 2 priority issues',
+    'tier 3 priority issues',
+    'tier 1 priority',
+    'tier 2 priority',
+    'tier 3 priority',
     'time horizon',
+    'top line',
+    'top-line judgement',
+    'top-line judgment',
     'wep',
+    'wep band',
+    'wep bands',
+    'wep bands applied',
+    'window',
 ];
 /**
  * Recognise a metadata-banner bold line (`**Admiralty Grade: B/2**`,
@@ -331,6 +381,22 @@ function isMetadataBoldLine(line) {
         if (inner.startsWith(`${prefix}—`) || inner.startsWith(`${prefix} —`))
             return true;
     }
+    // Pipe-banner shape: three or more non-empty `|`-separated segments
+    // inside the bold body indicate a methodology / SAT-tag banner row,
+    // never an editorial headline (e.g.
+    // `**WEP Bands Applied | Admiralty Scale Used | SAT Documentation**`).
+    // A single `|` (two segments) is allowed because it occurs in
+    // legitimate headlines ("Brexit | A Decade On"). Three or more
+    // segments — i.e. at least two delimiters — is the threshold.
+    const pipeSegments = inner
+        .split('|')
+        .map((s) => s.trim())
+        .filter((s) => s.length > 0);
+    if (pipeSegments.length >= 3)
+        return true;
+    // Trailing-ellipsis bold: `**Some long banner line…**` was clipped by
+    // the brief author and is not a usable editorial headline.
+    if (inner.endsWith('…') || inner.endsWith('...'))
+        return true;
     return false;
 }
 /**
@@ -351,6 +417,14 @@ function buildPriorityResult(rawHeadline, tail, lines, i) {
     const cleaned = cleanPriorityHeadline(rawHeadline);
     if (cleaned.length < 5)
         return null;
+    // Reject bold-prose section labels (`Strategic significance`,
+    // `Threat Level`, `Convergence themes`, …) and other denylisted
+    // tokens. Without this, the priority-finding loop would surface a
+    // `**Strategic significance:** …` line — which the executive-brief
+    // template uses inside every dossier subsection — as the article
+    // title. See `title-rejection.ts` for the full denylist.
+    if (findTitleRejectionReason(cleaned))
+        return null;
     const summaryLines = collectPrioritySummaryLines(tail, lines, i);
     const summary = truncateDescription(summaryLines.join(' '));
     return { headline: cleaned, summary };
@@ -416,162 +490,4 @@ function collectPrioritySummaryLines(tail, lines, i) {
     }
     return summaryLines;
 }
-/**
- * Leading priority-label tokens stripped by {@link cleanPriorityHeadline}
- * (`🔴 CRITICAL — Title` → `Title`). Kept as a list to bypass the
- * unsafe-regex lint by avoiding deep alternation in a single pattern.
- */
-const PRIORITY_LABEL_TOKENS = [
-    'CRITICAL',
-    'HIGH PRIORITY',
-    'HIGH',
-    'MEDIUM PRIORITY',
-    'MEDIUM',
-    'LOW PRIORITY',
-    'LOW',
-    'URGENT',
-    'ALERT',
-    'PRIORITY',
-];
-/**
- * Trailing confidence-marker tokens stripped by
- * {@link cleanPriorityHeadline}. Same rationale as
- * {@link PRIORITY_LABEL_TOKENS}.
- */
-const PRIORITY_TRAILING_TOKENS = [
-    'CRITICAL',
-    'HIGH PRIORITY',
-    'HIGH',
-    'MEDIUM PRIORITY',
-    'MEDIUM',
-    'LOW PRIORITY',
-    'LOW',
-];
-/**
- * Leading editorial-prefix tokens stripped by
- * {@link cleanPriorityHeadline} (`Trigger 1: Title` → `Title`).
- */
-const PRIORITY_LEADING_PREFIX_TOKENS = [
-    'Trigger',
-    'Dossier',
-    'Priority',
-    'Finding',
-    'Item',
-    'Highlight',
-    'Top',
-    'Story',
-    'Alert',
-    'Judgement',
-    'Judgment',
-];
-/**
- * Strip a leading priority decoration (`🔴 `, `CRITICAL — `) from a
- * candidate headline. Extracted from {@link cleanPriorityHeadline} to
- * keep cognitive complexity within budget.
- *
- * @param text - Candidate headline (already trimmed)
- * @returns Headline with the leading decoration removed
- */
-function stripPriorityLeadingDecoration(text) {
-    let out = text;
-    for (let pass = 0; pass < 2; pass++) {
-        out = out.replace(/^[^\p{L}\p{N}]+/u, '').trim();
-        for (const token of PRIORITY_LABEL_TOKENS) {
-            if (out.toLowerCase().startsWith(token.toLowerCase())) {
-                const rest = out.slice(token.length).trim();
-                const sep = rest.match(/^[:—–-]\s*(.+)$/u);
-                if (sep?.[1]) {
-                    out = sep[1].trim();
-                    break;
-                }
-            }
-        }
-    }
-    return out;
-}
-/**
- * Strip a leading editorial prefix (`Trigger 1: `, `Dossier 2: `) and a
- * stray leading ordinal (`1. `, `2.1 `) from a candidate headline.
- *
- * @param text - Candidate headline
- * @returns Headline with the leading editorial decoration removed
- */
-function stripPriorityLeadingPrefix(text) {
-    let out = text;
-    for (const token of PRIORITY_LEADING_PREFIX_TOKENS) {
-        if (!out.toLowerCase().startsWith(token.toLowerCase()))
-            continue;
-        const rest = out.slice(token.length);
-        const match = rest.match(/^\s+\d+\s*[:–—-]\s*(.+)$/u);
-        if (match?.[1]) {
-            out = match[1];
-            break;
-        }
-    }
-    // Drop a stray leading "1. " / "2) " ordinal.
-    out = out.replace(/^\d+[.):·\s]\s*/u, '');
-    return out;
-}
-/**
- * Strip a trailing confidence marker (`🔴 CRITICAL`, `🟡 MEDIUM`) from a
- * candidate headline. Single pass — caller invokes inside a fixed-point
- * loop.
- *
- * @param text - Candidate headline
- * @returns Headline with the trailing confidence marker removed
- */
-function stripPriorityTrailingMarker(text) {
-    let out = text;
-    for (const token of PRIORITY_TRAILING_TOKENS) {
-        const pattern = new RegExp(`\\s+[^\\p{L}\\p{N}\\s]?\\s*${token}\\s*$`, 'iu');
-        const next = out.replace(pattern, '');
-        if (next !== out) {
-            out = next;
-            break;
-        }
-    }
-    return out;
-}
-/**
- * Normalise a priority-finding headline: drop the
- * `Trigger N:` / `Dossier N:` / leading-numeric prefix, strip trailing
- * parenthesised metadata (`(TA-10-2026-0160, 2026-04-30)`,
- * `(ITRE/ENVI)`), and trim residual punctuation. The result is a
- * headline-shaped string suitable for `<title>` use.
- *
- * @param raw - Raw bold-title or heading text
- * @returns Cleaned headline (may be empty after stripping)
- */
-function cleanPriorityHeadline(raw) {
-    let text = stripInlineMarkdown(raw).trim();
-    text = stripPriorityLeadingDecoration(text);
-    text = stripPriorityLeadingPrefix(text);
-    // Trailing cleanup runs in a fixed-point loop so combined patterns
-    // like "Title (Confidence, 80%): 🔴" collapse all the way down to
-    // "Title".
-    let previous = '';
-    while (previous !== text) {
-        previous = text;
-        text = stripPriorityTrailingMarker(text);
-        text = stripPriorityTailMetadata(text);
-        // Drop a single trailing emoji left after metadata stripping.
-        text = text.replace(/\s+[^\p{L}\p{N}\s]+\s*$/u, '');
-        // Drop trailing colons / dashes left over.
-        text = text.replace(/[\s:—–-]+$/u, '');
-        text = text.trim();
-    }
-    return text;
-}
-/**
- * Strip the trailing parenthesised metadata that briefs append to every
- * priority-finding name — procedure codes, dates, committee tags. The
- * regex is intentionally non-greedy so it removes only the LAST
- * parenthesised group on the line.
- *
- * @param text - Headline or paragraph text
- * @returns Text with the trailing `(…)` stripped
- */
-function stripPriorityTailMetadata(text) {
-    return text.replace(/\s*\([^()]{3,80}\)\s*$/u, '').trim();
-}
 //# sourceMappingURL=priority-finding-highlight.js.map