npm - euparliamentmonitor - Versions diffs - 0.9.6 → 0.9.7 - Mend

euparliamentmonitor 0.9.6 → 0.9.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12) hide show

package/package.json +7 -1
package/scripts/aggregator/analysis-aggregator.js +48 -0
package/scripts/aggregator/article-metadata.js +69 -6
package/scripts/aggregator/artifact-order.js +28 -5
package/scripts/aggregator/reader-guide-constants.js +13 -1
package/scripts/aggregator/reader-intelligence-guide.js +105 -0
package/scripts/generators/news-indexes.d.ts +12 -0
package/scripts/generators/news-indexes.js +91 -2
package/scripts/generators/sitemap/rss.js +1 -0
package/scripts/generators/sitemap/xml.js +1 -0
package/scripts/minify-assets.js +238 -0
package/scripts/optimize-css.js +79 -0

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "euparliamentmonitor",
-  "version": "0.9.6",
+  "version": "0.9.7",
   "type": "module",
   "description": "European Parliament Intelligence Platform - Monitor political activity with systematic transparency",
   "main": "scripts/index.js",
@@ -70,6 +70,8 @@
     "generate-article:all": "node scripts/aggregator/article-generator.js --all",
     "generate-news-indexes": "node scripts/generators/news-indexes.js",
     "generate-sitemap": "node scripts/generators/sitemap.js",
+    "optimize-css": "node scripts/optimize-css.js",
+    "minify-assets": "node scripts/minify-assets.js",
     "validate-ep-api": "npx tsx src/utils/validate-ep-api.ts",
     "lint:prompts": "node scripts/lint-prompts.js",
     "htmlhint": "sh -c 'htmlhint *.html; set -- news/*.html; if [ -e \"$1\" ]; then htmlhint \"$@\"; else echo \"No news/*.html files to lint\"; fi'",
@@ -154,6 +156,7 @@
     "@vitest/ui": "4.1.6",
     "chart.js": "4.5.1",
     "chartjs-plugin-annotation": "3.1.0",
+    "clean-css": "^5.3.3",
     "d3": "7.9.0",
     "eslint": "10.3.0",
     "eslint-config-prettier": "10.1.8",
@@ -161,6 +164,7 @@
     "eslint-plugin-security": "4.0.0",
     "eslint-plugin-sonarjs": "4.0.3",
     "happy-dom": "20.9.0",
+    "html-minifier-terser": "^7.2.0",
     "htmlhint": "1.9.2",
     "husky": "9.1.7",
     "jscpd": "4.1.1",
@@ -169,6 +173,8 @@
     "mermaid": "11.15.0",
     "papaparse": "5.5.3",
     "prettier": "3.8.3",
+    "purgecss": "7.0.2",
+    "terser": "^5.47.1",
     "ts-api-utils": "2.5.0",
     "tsx": "4.21.0",
     "typedoc": "0.28.19",

package/scripts/aggregator/analysis-aggregator.js CHANGED Viewed

@@ -284,6 +284,10 @@ const READER_GUIDE_EN = {
         need: 'Significance scoring',
         value: 'why this story outranks or trails other same-day European Parliament signals',
     },
+    'section-actors-forces': {
+        need: 'Actors and forces',
+        value: 'who is driving the story, what political forces line up behind them, and which institutional levers they can pull',
+    },
     'section-coalitions-voting': {
         need: 'Coalitions and voting',
         value: 'political group alignment, voting evidence, and coalition pressure points',
@@ -304,6 +308,50 @@ const READER_GUIDE_EN = {
         need: 'Risk assessment',
         value: 'policy, institutional, coalition, communications, and implementation risk register',
     },
+    'section-threat': {
+        need: 'Threat landscape',
+        value: 'hostile actors, attack vectors, consequence trees, and legislative-disruption pathways',
+    },
+    'section-forward-projection': {
+        need: 'What to watch',
+        value: 'dated trigger events, calendar dependencies, and legislative-pipeline forecasts',
+    },
+    'section-electoral-arc': {
+        need: 'Electoral arc and mandate',
+        value: 'where the story sits in the EP term, mandate fulfilment, seat projection, and presidency-trio context',
+    },
+    'section-pestle-context': {
+        need: 'PESTLE and structural context',
+        value: 'political, economic, social, technological, legal, and environmental forces plus the historical baseline',
+    },
+    'section-continuity': {
+        need: 'Cross-run continuity',
+        value: 'what changed since prior sessions and how confidence shifted between runs',
+    },
+    'section-deep-analysis': {
+        need: 'Deep analysis',
+        value: 'long-form Economist-style explanation for readers who want the full argument',
+    },
+    'section-documents': {
+        need: 'Document trail',
+        value: 'the document index and per-file analysis behind the public judgement',
+    },
+    'section-extended-intel': {
+        need: 'Extended intelligence',
+        value: "devil's-advocate critique, comparative parallels, historical precedents, and media framing",
+    },
+    'section-mcp-reliability': {
+        need: 'MCP data reliability',
+        value: 'which feeds were healthy, which were degraded, and how data limits bound conclusions',
+    },
+    'section-quality-reflection': {
+        need: 'Analytical quality and reflection',
+        value: 'self-assessment scores, methodology audit, structured analytic techniques, and known limitations',
+    },
+    'section-supplementary-intelligence': {
+        need: 'Supplementary intelligence',
+        value: 'additional markdown discovered in the run that has not yet been assigned to a canonical section',
+    },
 };
 /**
  * Render the generated reader-intelligence guide that appears before the

package/scripts/aggregator/article-metadata.js CHANGED Viewed

@@ -455,6 +455,56 @@ export function stripInlineMarkdown(raw) {
         .replace(/\s+/g, ' ')
         .trim();
 }
+/** Connector / determiner words that read as broken copy when they are
+ *  the final token before a truncation ellipsis. */
+const TRAILING_STOP_WORDS = new Set([
+    'the',
+    'a',
+    'an',
+    'of',
+    'to',
+    'for',
+    'in',
+    'on',
+    'at',
+    'by',
+    'and',
+    'or',
+    'with',
+    'from',
+]);
+/** Trailing characters we always strip before appending our own ellipsis,
+ *  so we never emit double-ellipsis or stray punctuation. */
+const TRAILING_PUNCT = /[.,;:—\-…\s]/u;
+/**
+ * Repeatedly strip trailing stop-words (separated by a single space) and
+ * trailing punctuation (including any pre-existing ellipsis). Implemented
+ * imperatively to avoid super-linear regex backtracking on the
+ * `(?:\s+stop-word)+$` pattern flagged by `security/detect-unsafe-regex`.
+ *
+ * @param input - Pre-clipped string to clean up
+ * @returns Cleaned string with no trailing stop-words or punctuation
+ */
+function stripTrailingStopWordsAndPunctuation(input) {
+    let result = input;
+    let changed = true;
+    while (changed) {
+        changed = false;
+        while (result.length > 0 && TRAILING_PUNCT.test(result.charAt(result.length - 1))) {
+            result = result.slice(0, -1);
+            changed = true;
+        }
+        const lastSpace = result.lastIndexOf(' ');
+        if (lastSpace >= 0) {
+            const tail = result.slice(lastSpace + 1).toLowerCase();
+            if (TRAILING_STOP_WORDS.has(tail)) {
+                result = result.slice(0, lastSpace);
+                changed = true;
+            }
+        }
+    }
+    return result;
+}
 /**
  * Clamp a string to `DESCRIPTION_MAX_LENGTH` characters, appending
  * an ellipsis when truncation actually happens. Does not break words if
@@ -467,10 +517,22 @@ export function stripInlineMarkdown(raw) {
 export function truncateDescription(text) {
     if (text.length <= DESCRIPTION_MAX_LENGTH)
         return text;
-    const cut = text.slice(0, DESCRIPTION_MAX_LENGTH - 3);
+    const cut = text.slice(0, DESCRIPTION_MAX_LENGTH - 1);
+    // Prefer the last full sentence terminator within the cut so we don't
+    // end on a dangling determiner ("…year. The"). Period/!/? followed by
+    // a space marks a clean boundary. Only honour the boundary when it
+    // sits past the soft minimum so we keep enough body text to be useful.
+    const sentenceEnd = Math.max(cut.lastIndexOf('. '), cut.lastIndexOf('! '), cut.lastIndexOf('? '));
+    if (sentenceEnd >= DESCRIPTION_MIN_LENGTH) {
+        return cut.slice(0, sentenceEnd + 1).replace(/\s+$/, '');
+    }
     const lastSpace = cut.lastIndexOf(' ');
-    const safe = lastSpace > DESCRIPTION_MAX_LENGTH - 60 ? cut.slice(0, lastSpace) : cut;
-    return `${safe.replace(/[.,;:—-]+$/, '')}…`;
+    let safe = lastSpace > DESCRIPTION_MAX_LENGTH - 60 ? cut.slice(0, lastSpace) : cut;
+    // Drop dangling stop-words and trailing punctuation/ellipsis so we
+    // never emit broken copy ("…year. The" → "…year", then "…" is added)
+    // or double-ellipsis ("The……") when the input already carried one.
+    safe = stripTrailingStopWordsAndPunctuation(safe);
+    return `${safe}…`;
 }
 /**
  * Clamp a title to `TITLE_MAX_LENGTH` characters in the same
@@ -482,10 +544,11 @@ export function truncateDescription(text) {
 export function truncateTitle(text) {
     if (text.length <= TITLE_MAX_LENGTH)
         return text;
-    const cut = text.slice(0, TITLE_MAX_LENGTH - 3);
+    const cut = text.slice(0, TITLE_MAX_LENGTH - 1);
     const lastSpace = cut.lastIndexOf(' ');
-    const safe = lastSpace > TITLE_MAX_LENGTH - 40 ? cut.slice(0, lastSpace) : cut;
-    return `${safe.replace(/[.,;:—-]+$/, '')}…`;
+    let safe = lastSpace > TITLE_MAX_LENGTH - 40 ? cut.slice(0, lastSpace) : cut;
+    safe = stripTrailingStopWordsAndPunctuation(safe);
+    return `${safe}…`;
 }
 /**
  * Return the first Markdown H1 (`# …`) in the supplied text, stripped of

package/scripts/aggregator/artifact-order.js CHANGED Viewed

@@ -29,7 +29,7 @@ export const ARTIFACT_SECTIONS = [
     {
         id: 'synthesis',
         title: 'Synthesis Summary',
-        artifacts: ['intelligence/synthesis-summary.md'],
+        artifacts: ['intelligence/synthesis-summary.md', 'synthesis.md'],
     },
     {
         id: 'significance',
@@ -40,6 +40,7 @@ export const ARTIFACT_SECTIONS = [
             'classification/priority-matrix.md',
             'classification/issue-classification.md',
             'intelligence/significance-scoring.md',
+            'significance-assessment.md',
         ],
     },
     {
@@ -50,6 +51,9 @@ export const ARTIFACT_SECTIONS = [
             'classification/forces-analysis.md',
             'classification/impact-matrix.md',
             'classification/stakeholder-classification.md',
+            'actor-mapping.md',
+            'political-forces.md',
+            'impact-assessment.md',
             // Catch-all for any other classification/*.md not consumed above
             // (keeps non-canonical artifact names out of the Supplementary bucket
             // and inside their journalist-correct section).
@@ -68,7 +72,11 @@ export const ARTIFACT_SECTIONS = [
     {
         id: 'stakeholder-map',
         title: 'Stakeholder Map',
-        artifacts: ['intelligence/stakeholder-map.md', 'existing/stakeholder-impact.md'],
+        artifacts: [
+            'intelligence/stakeholder-map.md',
+            'existing/stakeholder-impact.md',
+            'stakeholder-perspectives.md',
+        ],
     },
     {
         id: 'economic-context',
@@ -87,6 +95,8 @@ export const ARTIFACT_SECTIONS = [
             'risk-scoring/legislative-risk.md',
             'risk-scoring/economic-risk.md',
             'risk-scoring/institutional-risk.md',
+            'risk-matrix.md',
+            'quantitative-swot.md',
             // Catch-all for any other risk-scoring/*.md (e.g. naming variants) so
             // they render under Risk Assessment instead of Supplementary.
             'risk-scoring/',
@@ -104,7 +114,11 @@ export const ARTIFACT_SECTIONS = [
     {
         id: 'scenarios',
         title: 'Scenarios & Wildcards',
-        artifacts: ['intelligence/scenario-forecast.md', 'intelligence/wildcards-blackswans.md'],
+        artifacts: [
+            'intelligence/scenario-forecast.md',
+            'intelligence/wildcards-blackswans.md',
+            'scenario-forecast.md',
+        ],
     },
     {
         id: 'forward-projection',
@@ -113,6 +127,9 @@ export const ARTIFACT_SECTIONS = [
             'intelligence/forward-projection.md',
             'intelligence/legislative-pipeline-forecast.md',
             'intelligence/parliamentary-calendar-projection.md',
+            'forward/forward-projection.md',
+            'forward/legislative-pipeline-forecast.md',
+            'forward/parliamentary-calendar-projection.md',
             'extended/forward-indicators.md',
         ],
     },
@@ -130,7 +147,11 @@ export const ARTIFACT_SECTIONS = [
     {
         id: 'pestle-context',
         title: 'PESTLE & Context',
-        artifacts: ['intelligence/pestle-analysis.md', 'intelligence/historical-baseline.md'],
+        artifacts: [
+            'intelligence/pestle-analysis.md',
+            'intelligence/historical-baseline.md',
+            'pestle-analysis.md',
+        ],
     },
     {
         id: 'continuity',
@@ -162,7 +183,7 @@ export const ARTIFACT_SECTIONS = [
     {
         id: 'extended-intel',
         title: 'Extended Intelligence',
-        artifacts: ['extended/'],
+        artifacts: ['extended/', 'media-framing.md'],
     },
     {
         id: 'mcp-reliability',
@@ -177,6 +198,8 @@ export const ARTIFACT_SECTIONS = [
             'intelligence/reference-analysis-quality.md',
             'intelligence/workflow-audit.md',
             'intelligence/methodology-reflection.md',
+            'article-index.md',
+            'methodology-reflection.md',
         ],
     },
 ];

package/scripts/aggregator/reader-guide-constants.js CHANGED Viewed

@@ -14,10 +14,22 @@ export const READER_GUIDE_SECTION_IDS = [
     'section-executive-brief',
     'section-synthesis',
     'section-significance',
+    'section-actors-forces',
     'section-coalitions-voting',
     'section-stakeholder-map',
     'section-economic-context',
-    'section-scenarios',
     'section-risk',
+    'section-threat',
+    'section-scenarios',
+    'section-forward-projection',
+    'section-electoral-arc',
+    'section-pestle-context',
+    'section-continuity',
+    'section-deep-analysis',
+    'section-documents',
+    'section-extended-intel',
+    'section-mcp-reliability',
+    'section-quality-reflection',
+    'section-supplementary-intelligence',
 ];
 //# sourceMappingURL=reader-guide-constants.js.map

package/scripts/aggregator/reader-intelligence-guide.js CHANGED Viewed

@@ -567,6 +567,74 @@ const READER_GUIDE_ROWS = {
             zh: '本次运行如何与先前会话关联、变化了什么以及置信度在运行之间如何变化',
         },
     },
+    'section-deep-analysis': {
+        need: {
+            en: 'Deep analysis',
+            sv: 'Djupanalys',
+            da: 'Dybdegående analyse',
+            no: 'Dybdeanalyse',
+            fi: 'Syväanalyysi',
+            de: 'Tiefenanalyse',
+            fr: 'Analyse approfondie',
+            es: 'Análisis profundo',
+            nl: 'Diepteanalyse',
+            ar: 'تحليل معمق',
+            he: 'ניתוח עומק',
+            ja: '詳細分析',
+            ko: '심층 분석',
+            zh: '深度分析',
+        },
+        value: {
+            en: 'long-form Economist-style explanation for readers who want the full argument',
+            sv: 'lång Economist-liknande förklaring för läsare som vill ha hela argumentet',
+            da: 'lang Economist-lignende forklaring for læsere der ønsker hele argumentet',
+            no: 'lang Economist-lignende forklaring for lesere som ønsker hele argumentet',
+            fi: 'pitkä Economist-tyylinen selitys lukijoille, jotka haluavat koko perustelun',
+            de: 'lange, Economist-artige Erklärung für Leser, die das ganze Argument wollen',
+            fr: "explication longue de style Economist pour les lecteurs qui veulent l'argument complet",
+            es: 'explicación extensa de estilo Economist para lectores que quieren el argumento completo',
+            nl: 'lange uitleg in Economist-stijl voor lezers die het volledige argument willen',
+            ar: 'شرح مطول بأسلوب إيكونوميست للقراء الذين يريدون الحجة كاملة',
+            he: 'הסבר ארוך בסגנון האקונומיסט לקוראים שרוצים את הטיעון המלא',
+            ja: '全体の論旨を求める読者向けのエコノミスト風長文解説',
+            ko: '전체 논지를 원하는 독자를 위한 이코노미스트식 장문 설명',
+            zh: '为希望了解完整论证的读者提供的《经济学人》式长篇解释',
+        },
+    },
+    'section-documents': {
+        need: {
+            en: 'Document trail',
+            sv: 'Dokumentspår',
+            da: 'Dokumentspor',
+            no: 'Dokumentspor',
+            fi: 'Asiakirjapolku',
+            de: 'Dokumentenspur',
+            fr: 'Piste documentaire',
+            es: 'Rastro documental',
+            nl: 'Documentspoor',
+            ar: 'مسار الوثائق',
+            he: 'מסלול מסמכים',
+            ja: '文書トレイル',
+            ko: '문서 추적',
+            zh: '文件线索',
+        },
+        value: {
+            en: 'the document index and per-file analysis behind the public judgement',
+            sv: 'dokumentindexet och analysen per fil bakom den offentliga bedömningen',
+            da: 'dokumentindekset og analyse pr. fil bag den offentlige vurdering',
+            no: 'dokumentindeksen og analyse per fil bak den offentlige vurderingen',
+            fi: 'asiakirjahakemisto ja tiedostokohtainen analyysi julkisen arvion taustalla',
+            de: 'Dokumentenindex und Einzeldateianalyse hinter der öffentlichen Bewertung',
+            fr: "l'index des documents et l'analyse fichier par fichier derrière le jugement public",
+            es: 'el índice documental y el análisis por archivo detrás del juicio público',
+            nl: 'de documentenindex en analyse per bestand achter het publieke oordeel',
+            ar: 'فهرس الوثائق والتحليل لكل ملف خلف الحكم العام',
+            he: 'אינדקס המסמכים וניתוח לפי קובץ שמאחורי השיפוט הציבורי',
+            ja: '公開判断の背後にある文書索引とファイル別分析',
+            ko: '공개 판단 뒤에 있는 문서 색인과 파일별 분석',
+            zh: '公共判断背后的文件索引和逐文件分析',
+        },
+    },
     'section-extended-intel': {
         need: {
             en: 'Extended intelligence',
@@ -669,6 +737,40 @@ const READER_GUIDE_ROWS = {
             zh: '自我评估分数、方法论审计、使用的结构化分析技术和已知限制',
         },
     },
+    'section-supplementary-intelligence': {
+        need: {
+            en: 'Supplementary intelligence',
+            sv: 'Kompletterande underrättelse',
+            da: 'Supplerende efterretning',
+            no: 'Supplerende etterretning',
+            fi: 'Täydentävä tiedustelu',
+            de: 'Ergänzende Aufklärung',
+            fr: 'Renseignement supplémentaire',
+            es: 'Inteligencia suplementaria',
+            nl: 'Aanvullende inlichtingen',
+            ar: 'استخبارات تكميلية',
+            he: 'מודיעין משלים',
+            ja: '補足インテリジェンス',
+            ko: '보충 인텔리전스',
+            zh: '补充情报',
+        },
+        value: {
+            en: 'additional markdown discovered in the run that has not yet been assigned to a canonical section',
+            sv: 'ytterligare markdown som hittats i körningen och ännu inte tilldelats en kanonisk sektion',
+            da: 'yderligere markdown fundet i kørslen som endnu ikke er tildelt en kanonisk sektion',
+            no: 'ytterligere markdown funnet i kjøringen som ennå ikke er tilordnet en kanonisk seksjon',
+            fi: 'ajossa löydetty lisämarkdown, jota ei vielä ole liitetty kanoniseen osioon',
+            de: 'zusätzliches Markdown aus dem Lauf, das noch keinem kanonischen Abschnitt zugeordnet ist',
+            fr: "markdown supplémentaire découvert dans l'exécution et pas encore affecté à une section canonique",
+            es: 'markdown adicional descubierto en la ejecución que aún no se ha asignado a una sección canónica',
+            nl: 'extra markdown gevonden in de run dat nog niet aan een canonieke sectie is toegewezen',
+            ar: 'ملفات ماركداون إضافية اكتُشفت في التشغيل ولم تُسند بعد إلى قسم معياري',
+            he: 'מרקדאון נוסף שהתגלה בהרצה ועדיין לא שובץ למדור קנוני',
+            ja: '実行内で見つかったがまだ正規セクションに割り当てられていない追加Markdown',
+            ko: '실행에서 발견되었지만 아직 표준 섹션에 할당되지 않은 추가 마크다운',
+            zh: '运行中发现但尚未分配到规范章节的附加Markdown',
+        },
+    },
 };
 /* ─── Section icons ─────────────────────────────────────────────── */
 /** Visual icons for each reader guide section to improve scannability. */
@@ -687,9 +789,12 @@ const SECTION_ICONS = {
     'section-electoral-arc': '🗳️',
     'section-pestle-context': '🌍',
     'section-continuity': '🔁',
+    'section-deep-analysis': '🔬',
+    'section-documents': '📄',
     'section-extended-intel': '🧠',
     'section-mcp-reliability': '📡',
     'section-quality-reflection': '🪞',
+    'section-supplementary-intelligence': '📎',
 };
 /**
  * Look up the visual icon for a known article section.

package/scripts/generators/news-indexes.d.ts CHANGED Viewed

@@ -8,6 +8,18 @@ import type { ParsedArticle } from '../types/index.js';
  * @returns Filename string
  */
 export declare function getIndexFilename(lang: string): string;
+/**
+ * Backfill hreflang alternate links for all article HTML files.
+ *
+ * Handles three cases:
+ * 1. Articles with no hreflang links at all → inject the full block before `</head>`
+ * 2. Articles with relative hreflang URLs → replace with absolute URLs
+ * 3. Articles already correct → skip
+ *
+ * @param filenames - News article filenames
+ * @returns Number of HTML files updated
+ */
+export declare function backfillArticleHreflang(filenames: readonly string[]): number;
 /**
  * Generate index HTML for a language.
  *

package/scripts/generators/news-indexes.js CHANGED Viewed

@@ -92,9 +92,9 @@ function renderCard(article, meta, categoryLabels) {
 function buildHreflangTags() {
     const links = ALL_LANGUAGES.map((code) => {
         const href = getIndexFilename(code);
-        return `<link rel="alternate" hreflang="${code}" href="${href}">`;
+        return `<link rel="alternate" hreflang="${code}" href="${BASE_URL}/${href}">`;
     });
-    links.push('<link rel="alternate" hreflang="x-default" href="index.html">');
+    links.push(`<link rel="alternate" hreflang="x-default" href="${BASE_URL}/index.html">`);
     return links.join('\n  ');
 }
 /**
@@ -253,6 +253,91 @@ function applyArticleSeoBackfill(html, description, keywords) {
     next = next.replace(/"description":"[^"]*"/u, `"description":"${jsonDescription}"`);
     return next;
 }
+/**
+ * Build hreflang `<link rel="alternate">` tags for an article slug.
+ * Produces one tag per supported language plus an `x-default` pointing at
+ * the English variant, all using absolute URLs.
+ *
+ * @param articleSlug - Slug without language suffix (e.g. `2026-02-24-propositions`)
+ * @returns Newline-joined `<link>` tags
+ */
+function buildArticleHreflang(articleSlug) {
+    const entries = ALL_LANGUAGES.map((code) => `  <link rel="alternate" hreflang="${code}" href="${BASE_URL}/news/${articleSlug}-${code}.html">`);
+    entries.push(`  <link rel="alternate" hreflang="x-default" href="${BASE_URL}/news/${articleSlug}-en.html">`);
+    return entries.join('\n');
+}
+/**
+ * Inject hreflang links into an article that has none.
+ *
+ * @param html - Article HTML content
+ * @param hreflangBlock - Pre-built hreflang link block
+ * @returns HTML with the block inserted before `</head>`; the input unchanged when no `</head>` is found
+ */
+function injectHreflangLinks(html, hreflangBlock) {
+    return html.replace(/(<\/head>)/u, `${hreflangBlock}\n$1`);
+}
+/**
+ * Strip existing hreflang links (relative or absolute) and insert the absolute-URL block.
+ *
+ * @param html - Article HTML content
+ * @param hreflangBlock - Pre-built hreflang link block with absolute URLs
+ * @returns HTML with the old hreflang links removed and the block placed before `</head>`
+ */
+function fixRelativeHreflangLinks(html, hreflangBlock) {
+    const stripped = html.replace(/\s*<link\s+rel="alternate"\s+hreflang="[^"]*"\s+href="[^"]*">\n?/gu, '');
+    return stripped.replace(/(<\/head>)/u, `${hreflangBlock}\n$1`);
+}
+/**
+ * Backfill hreflang alternate links for all article HTML files.
+ *
+ * Handles three cases:
+ * 1. Articles with no hreflang links at all → inject the full block before `</head>`
+ * 2. Articles with relative hreflang URLs → replace with absolute URLs
+ * 3. Articles already correct → skip
+ *
+ * @param filenames - News article filenames
+ * @returns Number of HTML files updated
+ */
+export function backfillArticleHreflang(filenames) {
+    let updated = 0;
+    for (const filename of filenames) {
+        if (backfillOneArticleHreflang(filename))
+            updated++;
+    }
+    return updated;
+}
+/**
+ * Backfill hreflang for a single article file.
+ *
+ * @param filename - News article filename
+ * @returns True when the file was updated
+ */
+function backfillOneArticleHreflang(filename) {
+    const parsed = parseArticleFilename(filename);
+    if (!parsed)
+        return false;
+    const filepath = path.join(NEWS_DIR, filename);
+    const html = readArticleHtml(filepath);
+    if (!html)
+        return false;
+    const articleSlug = `${parsed.date}-${parsed.slug}`;
+    const hreflangBlock = buildArticleHreflang(articleSlug);
+    const hasHreflang = /<link\s+rel="alternate"\s+hreflang="/u.test(html);
+    let next;
+    if (!hasHreflang) {
+        next = injectHreflangLinks(html, hreflangBlock);
+    }
+    else {
+        const hasRelative = /<link\s+rel="alternate"\s+hreflang="[^"]*"\s+href="(?!https?:\/\/)/u.test(html);
+        if (!hasRelative)
+            return false;
+        next = fixRelativeHreflangLinks(html, hreflangBlock);
+    }
+    if (next === html)
+        return false;
+    atomicWrite(filepath, next);
+    return true;
+}
 /**
  * Generate index HTML for a language.
  *
@@ -522,6 +607,10 @@ function main() {
     if (backfilled > 0) {
         console.log(`🔎 Backfilled SEO metadata for ${backfilled} legacy article file(s)`);
     }
+    const hreflangBackfilled = backfillArticleHreflang(articles);
+    if (hreflangBackfilled > 0) {
+        console.log(`🔗 Backfilled hreflang links for ${hreflangBackfilled} article file(s)`);
+    }
     const grouped = groupArticlesByLanguage(articles, ALL_LANGUAGES);
     const metaBuildTimerLabel = `⏱️ Built metadata map for ${articles.length} articles`;
     console.time(metaBuildTimerLabel);

package/scripts/generators/sitemap/rss.js CHANGED Viewed

@@ -37,6 +37,7 @@ export function generateRssFeed(articleInfos, buildDate = new Date().toUTCString
       <dc:language>${escapeXML(item.lang)}</dc:language>
     </item>`)
         .join('\n');
+    // REUSE-IgnoreStart
     return `<?xml version="1.0" encoding="UTF-8"?>
 <!-- SPDX-FileCopyrightText: 2024-2026 Hack23 AB -->
 <!-- SPDX-License-Identifier: Apache-2.0 -->

package/scripts/generators/sitemap/xml.js CHANGED Viewed

@@ -86,6 +86,7 @@ export function generateSitemap(articles, docsFiles = []) {
         ...buildArticleUrls(articles),
         ...buildDocsUrls(docsFiles, today),
     ];
+    // REUSE-IgnoreStart
     return `<?xml version="1.0" encoding="UTF-8"?>
 <!-- SPDX-FileCopyrightText: 2024-2026 Hack23 AB -->
 <!-- SPDX-License-Identifier: Apache-2.0 -->

package/scripts/minify-assets.js ADDED Viewed

@@ -0,0 +1,238 @@
+#!/usr/bin/env node
+// SPDX-FileCopyrightText: 2024-2026 Hack23 AB
+// SPDX-License-Identifier: Apache-2.0
+//
+// Minifies HTML, CSS, and JS files in place using pure-Node packages so that
+// the deploy pipeline never needs to pull a Docker image (compatible with the
+// `egress-policy: block` harden-runner configuration in deploy-s3.yml).
+//
+// Run order in deploy-s3.yml:
+//   1. prebuild      — generate all pages
+//   2. optimize-css  — PurgeCSS drops unused selectors from styles.css
+//   3. minify-assets (THIS SCRIPT) — compress the now-smaller CSS + HTML + JS
+//   4. rm -rf node_modules         — clean up before S3 sync
+//   5. aws s3 sync passes          — upload minified payload
+//
+// Must run BEFORE `rm -rf node_modules` because html-minifier-terser,
+// clean-css, and terser are devDependencies.
+//
+// Scopes:
+//   CSS  — styles.css only (the one deployed stylesheet)
+//   HTML — root *.html + news/*.html (all pages shipped to S3)
+//   JS   — js/**/*.js excluding *.min.js (vendor files already minified upstream;
+//           re-minifying risks stripping required license banners)
+//
+// HTML files are processed with a concurrency cap (CONCURRENCY) to avoid
+// overwhelming the event loop on the 4400+ news/*.html archive while still
+// finishing in reasonable time.
+//
+// Exits non-zero if any file fails so the deploy halts before uploading a
+// partially-minified payload.
+import { readFileSync, writeFileSync, readdirSync } from 'node:fs';
+import { resolve, join, dirname } from 'node:path';
+import { fileURLToPath } from 'node:url';
+import { minify as minifyHtml } from 'html-minifier-terser';
+import CleanCSS from 'clean-css';
+import { minify as minifyJs } from 'terser';
+const __dirname = dirname(fileURLToPath(import.meta.url));
+const repoRoot = resolve(__dirname, '..');
+const CONCURRENCY = 32; // max in-flight tasks per pool (used for both the HTML and JS passes)
+// ─── helpers ────────────────────────────────────────────────────────────────
+function fmt(before, after) {
+  const saved = before - after;
+  const pct = before > 0 ? ((saved / before) * 100).toFixed(1) : '0.0';
+  return `${before} → ${after} B (saved ${saved} B / ${pct}%)`;
+}
+function errorMessage(e) {
+  return e instanceof Error ? e.message : String(e);
+}
+/** Run tasks with at most `limit` in-flight at once. */
+async function pool(tasks, limit) {
+  const results = [];
+  let next = 0;
+  async function worker() {
+    while (next < tasks.length) {
+      const task = tasks[next++];
+      results.push(await task());
+    }
+  }
+  const workers = Array.from({ length: Math.min(limit, tasks.length) }, worker);
+  await Promise.all(workers);
+  return results;
+}
+let totalBefore = 0;
+let totalAfter = 0;
+let errors = 0;
+// ─── CSS ────────────────────────────────────────────────────────────────────
+const cssPath = resolve(repoRoot, 'styles.css');
+{
+  const src = readFileSync(cssPath, 'utf8');
+  const before = Buffer.byteLength(src, 'utf8');
+  const result = new CleanCSS({ level: 2 }).minify(src);
+  if (result.errors && result.errors.length) {
+    console.error('❌ clean-css errors in styles.css:', result.errors);
+    errors++;
+  } else {
+    writeFileSync(cssPath, result.styles);
+    const after = Buffer.byteLength(result.styles, 'utf8');
+    totalBefore += before;
+    totalAfter += after;
+    console.log(`  styles.css  ${fmt(before, after)}`);
+  }
+}
+// ─── HTML ────────────────────────────────────────────────────────────────────
+const htmlOpts = {
+  collapseWhitespace: true,
+  removeComments: true,
+  removeOptionalTags: false,
+  removeRedundantAttributes: true,
+  removeScriptTypeAttributes: true,
+  removeStyleLinkTypeAttributes: true,
+  minifyCSS: true,
+  minifyJS: true,
+  useShortDoctype: true,
+};
+// Collect HTML files: root *.html + news/*.html
+const rootHtml = readdirSync(repoRoot)
+  .filter((f) => f.endsWith('.html'))
+  .map((f) => resolve(repoRoot, f));
+const newsDir = resolve(repoRoot, 'news');
+let newsHtml = [];
+try {
+  newsHtml = readdirSync(newsDir)
+    .filter((f) => f.endsWith('.html'))
+    .map((f) => join(newsDir, f));
+} catch {
+  // news/ directory may not exist in all environments
+}
+const allHtml = [...rootHtml, ...newsHtml];
+let htmlBefore = 0;
+let htmlAfter = 0;
+let htmlErrors = 0;
+const htmlTasks = allHtml.map((p) => async () => {
+  try {
+    const src = readFileSync(p, 'utf8');
+    const before = Buffer.byteLength(src, 'utf8');
+    const minified = await minifyHtml(src, htmlOpts);
+    writeFileSync(p, minified);
+    const after = Buffer.byteLength(minified, 'utf8');
+    return { before, after, ok: true };
+  } catch (e) {
+    console.error(`❌ HTML minify failed for ${p}: ${errorMessage(e)}`);
+    return { before: 0, after: 0, ok: false };
+  }
+});
+const htmlResults = await pool(htmlTasks, CONCURRENCY);
+for (const r of htmlResults) {
+  if (r.ok) {
+    htmlBefore += r.before;
+    htmlAfter += r.after;
+  } else {
+    htmlErrors++;
+  }
+}
+totalBefore += htmlBefore;
+totalAfter += htmlAfter;
+errors += htmlErrors;
+console.log(
+  `  HTML: ${allHtml.length - htmlErrors} files minified  ${fmt(htmlBefore, htmlAfter)}`,
+);
+// ─── JS ─────────────────────────────────────────────────────────────────────
+const jsDir = resolve(repoRoot, 'js');
+let jsFiles = [];
+function collectJs(dir) {
+  try {
+    for (const entry of readdirSync(dir, { withFileTypes: true })) {
+      const full = join(dir, entry.name);
+      if (entry.isDirectory()) {
+        collectJs(full);
+      } else if (entry.name.endsWith('.js') && !entry.name.endsWith('.min.js')) {
+        // Skip *.min.js — vendor bundles are already minified upstream;
+        // re-minifying them is wasteful and risks stripping required license banners.
+        jsFiles.push(full);
+      }
+    }
+  } catch {
+    // js/ may not exist in test environments
+  }
+}
+collectJs(jsDir);
+let jsBefore = 0;
+let jsAfter = 0;
+let jsErrors = 0;
+const jsTasks = jsFiles.map((p) => async () => {
+  try {
+    const src = readFileSync(p, 'utf8');
+    const before = Buffer.byteLength(src, 'utf8');
+    const result = await minifyJs(src, {
+      compress: true,
+      mangle: true,
+      // Preserve /*! ... */ license banners (e.g. Chart.js, D3, MIT headers).
+      // terser 'some' keeps comments that start with ! or contain @license / @preserve.
+      format: { comments: 'some' },
+    });
+    if (result.code) {
+      writeFileSync(p, result.code);
+      const after = Buffer.byteLength(result.code, 'utf8');
+      return { before, after, ok: true };
+    }
+    // Terser succeeded but produced no output — log and skip (file stays as-is)
+    console.warn(`⚠️  terser returned no code for ${p} — skipping`);
+    return { before, after: before, ok: true };
+  } catch (e) {
+    console.error(`❌ JS minify failed for ${p}: ${errorMessage(e)}`);
+    return { before: 0, after: 0, ok: false };
+  }
+});
+const jsResults = await pool(jsTasks, CONCURRENCY);
+for (const r of jsResults) {
+  if (r.ok) {
+    jsBefore += r.before;
+    jsAfter += r.after;
+  } else {
+    jsErrors++;
+  }
+}
+totalBefore += jsBefore;
+totalAfter += jsAfter;
+errors += jsErrors;
+console.log(
+  `  JS:   ${jsFiles.length - jsErrors} files minified  ${fmt(jsBefore, jsAfter)}`,
+);
+// ─── summary ────────────────────────────────────────────────────────────────
+const savedTotal = totalBefore - totalAfter;
+const pctTotal =
+  totalBefore > 0 ? ((savedTotal / totalBefore) * 100).toFixed(1) : '0.0';
+console.log(
+  `✅ Minification complete: ${totalBefore} → ${totalAfter} B ` +
+    `(saved ${savedTotal} B / ${pctTotal}% across CSS + ${allHtml.length} HTML + ${jsFiles.length} JS)`,
+);
+if (errors > 0) {
+  console.error(`❌ ${errors} file(s) failed to minify — aborting deploy.`);
+  process.exit(1);
+}

package/scripts/optimize-css.js ADDED Viewed

@@ -0,0 +1,79 @@
+#!/usr/bin/env node
+// SPDX-FileCopyrightText: 2024-2026 Hack23 AB
+// SPDX-License-Identifier: Apache-2.0
+//
+// Run PurgeCSS against the deployed CSS using the committed config in
+// purgecss.config.cjs. Writes the purged result back to styles.css
+// in place — keeps the existing filename so every HTML
+// `<link rel="stylesheet" href="styles.css">` continues to resolve and
+// no rewrite of generated pages is required.
+//
+// Invoked from `.github/workflows/deploy-s3.yml` after `npm run prebuild`
+// (so all generated HTML pages exist) and before the
+// `npm run minify-assets` step (which then minifies the now-smaller CSS).
+//
+// Logs before/after byte counts so the deploy log records the saving,
+// and exits non-zero on failure so the deploy halts before publishing
+// half-stripped CSS.
+import { readFileSync, statSync, writeFileSync } from 'node:fs';
+import { fileURLToPath } from 'node:url';
+import { dirname, resolve } from 'node:path';
+import { createRequire } from 'node:module';
+import { PurgeCSS } from 'purgecss';
+const require = createRequire(import.meta.url);
+const __dirname = dirname(fileURLToPath(import.meta.url));
+const repoRoot = resolve(__dirname, '..');
+const configPath = resolve(repoRoot, 'purgecss.config.cjs');
+const cssPath = resolve(repoRoot, 'styles.css');
+const config = require(configPath);
+const beforeBytes = statSync(cssPath).size;
+// Capture the pre-purge CSS so we can restore it verbatim if the purge
+// produces output that fails the downstream sanity floor — reading the
+// file AFTER the in-place write would only recover the (broken) purged
+// content.
+const originalCss = readFileSync(cssPath, 'utf8');
+const result = await new PurgeCSS().purge({
+  content: config.content,
+  css: config.css,
+  safelist: config.safelist,
+  variables: config.variables,
+  keyframes: config.keyframes,
+  fontFace: config.fontFace,
+});
+if (!result.length || typeof result[0].css !== 'string') {
+  console.error('❌ PurgeCSS returned no result for styles.css — aborting.');
+  process.exit(1);
+}
+const purged = result[0].css;
+writeFileSync(cssPath, purged);
+const afterBytes = statSync(cssPath).size;
+const savedBytes = beforeBytes - afterBytes;
+const savedPct = ((savedBytes / beforeBytes) * 100).toFixed(1);
+console.log(
+  `✅ styles.css purged: ${beforeBytes} → ${afterBytes} bytes ` +
+    `(saved ${savedBytes} B / ${savedPct}%)`,
+);
+// Sanity floor: if the purge produces a styles.css smaller than 32 KiB,
+// something has likely scanned the wrong content set (eg. globs missed
+// the news/ directory). Halt instead of shipping a near-empty stylesheet.
+const FLOOR_BYTES = 32 * 1024;
+if (afterBytes < FLOOR_BYTES) {
+  console.error(
+    `❌ styles.css after purge (${afterBytes} B) is below the ${FLOOR_BYTES} B sanity ` +
+      'floor — restoring the pre-purge CSS and refusing to ship a likely-broken stylesheet.',
+  );
+  // Restore from the in-memory capture taken BEFORE the purge so a re-run
+  // from cache cannot observe the broken file.
+  writeFileSync(cssPath, originalCss);
+  process.exit(1);
+}