npm - @nuasite/cms - Versions diffs - 0.46.1 → 0.46.2 - Mend

@nuasite/cms 0.46.1 → 0.46.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (4) hide show

package/dist/editor.js +1 -1
package/package.json +7 -7
package/src/source-finder/cache.ts +12 -0
package/src/source-finder/collection-finder.ts +231 -79

package/dist/editor.js CHANGED Viewed

@@ -386,7 +386,7 @@ function IC(t, e) {
 function _C(t, e) {
   return typeof e == "function" ? e(t) : e;
 }
-const u5 = "0.46.1", h5 = u5, ct = {
+const u5 = "0.46.2", h5 = u5, ct = {
   /** Highlight overlay for hovered elements */
   HIGHLIGHT: 2147483644,
   /** Hover outline for elements/components */

package/package.json CHANGED Viewed

@@ -14,7 +14,7 @@
     "directory": "packages/astro-cms"
   },
   "license": "Apache-2.0",
-  "version": "0.46.1",
+  "version": "0.46.2",
   "module": "src/index.ts",
   "types": "src/index.ts",
   "type": "module",
@@ -26,8 +26,8 @@
     }
   },
   "dependencies": {
-    "@nuasite/cms-core": "0.46.1",
-    "@nuasite/cms-types": "0.46.1",
+    "@nuasite/cms-core": "0.46.2",
+    "@nuasite/cms-types": "0.46.2",
     "@astrojs/compiler": "^3.0.1",
     "@babel/parser": "^7.29.2",
     "node-html-parser": "^7.1.0",
@@ -35,8 +35,8 @@
     "yaml": "^2.8.3"
   },
   "devDependencies": {
-    "@nuasite/cms-sidecar": "0.46.1",
-    "@nuasite/collections-admin": "0.46.1",
+    "@nuasite/cms-sidecar": "0.46.2",
+    "@nuasite/collections-admin": "0.46.2",
     "@babel/types": "^7.29.0",
     "@types/react": "^19.2.7",
     "@types/react-dom": "^19.2.3",
@@ -76,8 +76,8 @@
     "typescript": "^6.0.2",
     "vite": "^7.0.0",
     "@aws-sdk/client-s3": "^3.0.0",
-    "@nuasite/cms-sidecar": "0.46.1",
-    "@nuasite/collections-admin": "0.46.1",
+    "@nuasite/cms-sidecar": "0.46.2",
+    "@nuasite/collections-admin": "0.46.2",
     "react": "^19.0.0",
     "react-dom": "^19.0.0"
   },

package/src/source-finder/cache.ts CHANGED Viewed

@@ -21,6 +21,9 @@ let searchIndexInitialized = false
 /** Pre-built reverse index: normalizedText → SourceLocation[] (collection data files) */
 let collectionTextIndex: Map<string, SourceLocation[]> | null = null
+/** Per-collection-directory index: declared page URL → file abs path — used by the same-slug URL-disambiguation fallback */
+const declaredUrlIndexCache = new Map<string, Map<string, string>>()
 /** Lazy reverse index on i18n entries: translationKey → SearchIndexEntry[]. Rebuilt on demand after any mutation. */
 let translationKeyIndex: Map<string, SearchIndexEntry[]> | null = null
@@ -93,6 +96,10 @@ export function setCollectionTextIndex(index: Map<string, SourceLocation[]> | nu
 	collectionTextIndex = index
 }
+export function getDeclaredUrlIndexCache(): Map<string, Map<string, string>> {
+	return declaredUrlIndexCache // the live module-level Map (not a copy), so callers can populate it in place
+}
 // ============================================================================
 // Dirty File Tracking (incremental re-indexing)
 // ============================================================================
@@ -106,6 +113,10 @@ export function markFileDirty(absPath: string): void {
 	dirtyFiles.add(absPath)
 	// Also evict the parsed file cache so it's re-read from disk
 	parsedFileCache.delete(absPath)
+	// A changed file may add/remove/alter a declared URL anywhere in its
+	// collection directory — cheaper to drop the whole cache than track
+	// per-directory membership for a rarely-hit index.
+	declaredUrlIndexCache.clear()
 }
 export function getDirtyFiles(): Set<string> {
@@ -155,4 +166,5 @@ export function clearSourceFinderCache(): void {
 	searchIndexInitialized = false
 	collectionTextIndex = null
 	translationKeyIndex = null
+	declaredUrlIndexCache.clear()
 }

package/src/source-finder/collection-finder.ts CHANGED Viewed

@@ -4,7 +4,7 @@ import { isMap, isPair, isScalar, isSeq, LineCounter, parseDocument } from 'yaml
 import { getProjectRoot } from '../config'
 import type { CollectionDefinition } from '../types'
-import { getCollectionTextIndex, getMarkdownFileCache, setCollectionTextIndex } from './cache'
+import { getCollectionTextIndex, getDeclaredUrlIndexCache, getMarkdownFileCache, setCollectionTextIndex } from './cache'
 import { normalizeText } from './snippet-utils'
 import type { CollectionInfo, MarkdownContent, SourceLocation } from './types'
@@ -52,20 +52,10 @@ async function doBuildCollectionTextIndex(
 				} else {
 					// Markdown — index scalars from frontmatter only
 					const { lines } = cached
-					let fmStart = -1
-					let fmEnd = -1
-					for (let i = 0; i < lines.length; i++) {
-						if (lines[i]?.trim() === '---') {
-							if (fmStart === -1) fmStart = i
-							else {
-								fmEnd = i
-								break
-							}
-						}
-					}
-					if (fmEnd > 0) {
-						const yamlStr = lines.slice(fmStart + 1, fmEnd).join('\n')
-						collectScalarsFromYaml(yamlStr, fmStart + 1, lines, info, index)
+					const bounds = findFrontmatterBounds(lines)
+					if (bounds) {
+						const yamlStr = lines.slice(bounds.start + 1, bounds.end).join('\n')
+						collectScalarsFromYaml(yamlStr, bounds.start + 1, lines, info, index)
 					}
 				}
 			} catch {
@@ -187,6 +177,22 @@ export function lookupCollectionText(
 // Markdown File Cache
 // ============================================================================
+/**
+ * Locate the `---`-delimited frontmatter block in a markdown file's lines.
+ *
+ * A delimiter is any line that equals `---` once surrounding whitespace is
+ * trimmed. The first such line opens the block and the next one closes it;
+ * the opener is not required to be the first line of the file.
+ *
+ * @param lines - The file content, already split into lines.
+ * @returns The indexes of the opening (`start`) and closing (`end`) `---`
+ * lines, or undefined when fewer than two delimiter lines exist (no
+ * frontmatter at all, or a block that is never closed).
+ */
+function findFrontmatterBounds(lines: string[]): { start: number; end: number } | undefined {
+	let start = -1 // -1 means the opening delimiter has not been seen yet
+	for (let i = 0; i < lines.length; i++) {
+		if (lines[i]?.trim() === '---') {
+			if (start === -1) start = i
+			else return { start, end: i } // second delimiter closes the block; stop scanning
+		}
+	}
+	return undefined
+}
 /**
  * Get cached markdown file content
  */
@@ -210,6 +216,17 @@ async function getCachedMarkdownFile(filePath: string): Promise<{ content: strin
 // Collection Source Finding
 // ============================================================================
+/**
+ * Frontmatter fields, in preference order, that may declare an entry's own
+ * canonical page URL. Only site-absolute values (starting with `/`) are trusted
+ * — external `url: https://…` values and bare slugs are ignored. Deliberately
+ * excludes `canonical`/`canonicalUrl`: by SEO convention those declare the URL
+ * that should be indexed *instead of* the current page (duplicate-content
+ * consolidation), which can point at a different entry entirely — trusting it
+ * as self-identity could resolve an edit to the wrong file.
+ *
+ * Every name here must be lowercase: `readDeclaredPageUrl` lowercases each
+ * frontmatter key before checking it against this list, so a key spelled
+ * `urlPath` in a file matches the `urlpath` entry.
+ */
+const DECLARED_URL_FIELDS = ['urlpath', 'permalink', 'pathname', 'route', 'url']
 /**
  * Find markdown collection file for a given page path.
  *
@@ -217,6 +234,14 @@ async function getCachedMarkdownFile(filePath: string): Promise<{ content: strin
  * matching entry regardless of the URL prefix. This supports localized or
  * renamed routes (e.g. `/aktuality/my-article` with content in `src/content/news/`).
  *
+ * Filename matching alone cannot tell apart two entries that share a slug but
+ * live under different URL prefixes (e.g. the same article slug published under
+ * two topic prefixes, where one file carries a disambiguating filename suffix).
+ * When a filename match declares a canonical URL in its frontmatter that
+ * contradicts the requested path, we fall back to matching entries by that
+ * declared URL. Projects whose entries declare no URL field keep the exact
+ * previous (filename-only) behavior.
+ *
  * @param pagePath - The URL path of the page (e.g., '/services/3d-tisk')
  * @param contentDir - The content directory (default: 'src/content')
  * @returns Collection info if found, undefined otherwise
@@ -233,6 +258,7 @@ export async function findCollectionSource(
 		return undefined
 	}
+	const requestedUrl = normalizeSitePath(`/${cleanPath}`)
 	const contentPath = path.join(getProjectRoot(), contentDir)
 	try {
@@ -245,9 +271,12 @@ export async function findCollectionSource(
 	let collectionDirs: string[]
 	try {
 		const entries = await fs.readdir(contentPath, { withFileTypes: true })
+		// Sorted so match/resolution order is deterministic across runs and
+		// platforms, not dependent on readdir's unspecified enumeration order.
 		collectionDirs = entries
 			.filter(e => e.isDirectory() && !e.name.startsWith('_') && !e.name.startsWith('.'))
 			.map(e => e.name)
+			.sort()
 	} catch {
 		return undefined
 	}
@@ -266,6 +295,20 @@ export async function findCollectionSource(
 			}
 		}
+		if (matches.length === 0) continue
+		// Prefer the entry whose declared canonical URL equals the requested
+		// path. Only kicks in when an entry actually declares a URL, so
+		// URL-less projects fall through to the filename logic unchanged.
+		const byUrl = await resolveByDeclaredUrl(matches, requestedUrl, contentPath)
+		if (byUrl) {
+			// byUrl.file may differ from the file the filename match found
+			// (that's the whole point of this fallback) — its slug must be
+			// derived from the actual resolved file, not the URL-tail slug
+			// candidate, or downstream collectionSlug lookups break.
+			return { name: byUrl.name, slug: slugFromFilePath(byUrl.file), file: path.relative(getProjectRoot(), byUrl.file) }
+		}
 		if (matches.length === 1 && matches[0]) {
 			return {
 				name: matches[0].name,
@@ -291,6 +334,162 @@ export async function findCollectionSource(
 	return undefined
 }
+/**
+ * Normalize a site-absolute path so that two spellings of the same page
+ * compare equal: ensure a leading slash, drop the query/hash and one trailing
+ * slash.
+ *
+ * Only a single trailing `/` is removed, and the root path `/` is kept as is.
+ * Letter case and repeated slashes inside the path are left untouched.
+ *
+ * @param p - A URL path, optionally carrying a `?query` and/or `#hash`.
+ * @returns The path portion, starting with `/` and without a trailing `/`
+ * (except for the root).
+ */
+function normalizeSitePath(p: string): string {
+	let s = p.split('?')[0]?.split('#')[0] ?? p // keep what precedes the first `?`, then what precedes the first `#`
+	if (!s.startsWith('/')) s = `/${s}`
+	if (s.length > 1 && s.endsWith('/')) s = s.slice(0, -1) // length guard keeps the root `/` intact
+	return s
+}
+/**
+ * Derive a collection entry's slug from its file path, matching the same
+ * convention collection-scanner.ts uses: flat `<slug>.md(x)` files use the
+ * basename minus extension; Hugo-style `<slug>/index.md(x)` files use the
+ * parent directory name.
+ *
+ * @param fileAbsPath - Path of the entry file.
+ * @returns The slug. A basename that does not end in `.md` or `.mdx` is
+ * returned unchanged, because only those two extensions are stripped.
+ */
+function slugFromFilePath(fileAbsPath: string): string {
+	const base = path.basename(fileAbsPath)
+	if (base === 'index.md' || base === 'index.mdx') {
+		return path.basename(path.dirname(fileAbsPath)) // Hugo-style entry: the folder name is the slug
+	}
+	return base.replace(/\.mdx?$/, '')
+}
+/**
+ * Read an entry's declared canonical page URL from its frontmatter, if any.
+ *
+ * The file is obtained through `getCachedMarkdownFile`, its frontmatter is
+ * parsed as YAML, and only top-level pairs with a scalar key and a scalar
+ * value are inspected. Keys are compared case-insensitively against
+ * `DECLARED_URL_FIELDS`; a value counts only when it is a string starting
+ * with `/`. If the same field name appears more than once (including under
+ * different letter case), its first accepted value wins. When several
+ * different fields are present, the one listed earliest in
+ * `DECLARED_URL_FIELDS` is returned, regardless of their order in the file.
+ *
+ * NOTE(review): a protocol-relative value such as `//cdn.example.com/page`
+ * also starts with `/` and therefore passes the site-absolute check, although
+ * it points at an external host — confirm whether it should be rejected.
+ *
+ * @param fileAbsPath - Absolute path of the markdown entry file.
+ * @returns The normalized site-absolute path, or undefined when the file
+ * cannot be loaded, has no closed frontmatter block, its frontmatter is not a
+ * YAML mapping, or it declares no site-absolute URL field.
+ */
+async function readDeclaredPageUrl(fileAbsPath: string): Promise<string | undefined> {
+	const cached = await getCachedMarkdownFile(fileAbsPath)
+	if (!cached) return undefined
+	const bounds = findFrontmatterBounds(cached.lines)
+	if (!bounds) return undefined
+	let doc
+	try {
+		doc = parseDocument(cached.lines.slice(bounds.start + 1, bounds.end).join('\n')) // YAML between the two `---` lines, delimiters excluded
+	} catch {
+		return undefined
+	}
+	if (!isMap(doc.contents)) return undefined
+	const found: Record<string, string> = {} // lowercased field name → normalized URL
+	for (const pair of doc.contents.items) {
+		if (!isPair(pair) || !isScalar(pair.key) || !isScalar(pair.value)) continue
+		const key = String(pair.key.value).toLowerCase()
+		if (!DECLARED_URL_FIELDS.includes(key)) continue
+		const val = pair.value.value
+		if (typeof val === 'string' && val.startsWith('/')) {
+			found[key] ??= normalizeSitePath(val) // keep the first accepted value per field
+		}
+	}
+	for (const field of DECLARED_URL_FIELDS) {
+		if (found[field]) return found[field] // list order decides which field is preferred
+	}
+	return undefined
+}
+/**
+ * Resolve the correct entry for `requestedUrl` using declared canonical URLs.
+ *
+ * 1. If a filename candidate declares exactly `requestedUrl`, use it.
+ * 2. Otherwise, if any candidate declares *some* URL (so the collection is
+ *    URL-aware) but none matches, the filename match is for a same-slug sibling
+ *    under a different prefix — scan the candidate collection(s) for the file
+ *    whose declared URL is `requestedUrl`.
+ * 3. If no candidate declares any URL, return undefined so the caller keeps the
+ *    legacy filename behavior.
+ *
+ * @param matches - Filename-based candidates; `name` is the collection
+ * directory name and `file` is the path handed to `readDeclaredPageUrl`.
+ * @param requestedUrl - The requested page path; compared by strict equality
+ * with the normalized declared URLs, so it should be normalized the same way.
+ * @param contentPath - Content root; joined with a collection name to get the
+ * directory that is scanned in step 2.
+ * @returns The matching candidate (step 1), or a new `{ name, file }` found
+ * by the directory scan (step 2). Undefined in case 3, and also when the
+ * step 2 scan finds no entry declaring `requestedUrl`.
+ */
+async function resolveByDeclaredUrl(
+	matches: { name: string; file: string }[],
+	requestedUrl: string,
+	contentPath: string,
+): Promise<{ name: string; file: string } | undefined> {
+	let sawDeclaredUrl = false // becomes true once any candidate declares a URL, matching or not
+	for (const m of matches) {
+		const declared = await readDeclaredPageUrl(m.file)
+		if (declared === undefined) continue
+		sawDeclaredUrl = true
+		if (declared === requestedUrl) return m
+	}
+	if (!sawDeclaredUrl) return undefined
+	// Contradiction: the right entry is named differently from its slug. Scan
+	// the collection(s) that produced filename matches for a declared-URL hit.
+	// `matches` (and thus this Set) is built by iterating the sorted
+	// `collectionDirs`, so directory order here is deterministic.
+	for (const dir of new Set(matches.map(m => m.name))) {
+		const hit = await findFileByDeclaredUrl(path.join(contentPath, dir), requestedUrl)
+		if (hit) return { name: dir, file: hit } // first directory with a hit wins
+	}
+	return undefined
+}
+/**
+ * Find the file in a collection directory whose declared canonical URL
+ * matches, via a per-directory URL→file index that's built once and cached
+ * (see `getDeclaredUrlIndexCache`) — only the first request for an ambiguous
+ * slug in a given directory pays for the full scan.
+ *
+ * The cache is keyed by `collectionPathAbs`. An empty index is cached too, so
+ * a directory without declared URLs is not rescanned until the cache is
+ * cleared. Nothing here guards against two concurrent first calls for the
+ * same directory; each would build the index and the later `set` wins.
+ *
+ * @param collectionPathAbs - Absolute path of the collection directory.
+ * @param requestedUrl - Normalized site-absolute URL to look up.
+ * @returns The path of the entry file declaring that URL, or undefined.
+ */
+async function findFileByDeclaredUrl(collectionPathAbs: string, requestedUrl: string): Promise<string | undefined> {
+	const cache = getDeclaredUrlIndexCache()
+	let index = cache.get(collectionPathAbs)
+	if (!index) {
+		index = await buildDeclaredUrlIndex(collectionPathAbs) // cache miss: scan the directory once
+		cache.set(collectionPathAbs, index)
+	}
+	return index.get(requestedUrl)
+}
+/**
+ * Scan a collection directory (flat `*.md(x)` files and Hugo-style
+ * `<slug>/index.md(x)`) and index every entry by its declared canonical URL.
+ * Entries are visited in sorted order so that if two entries declare the same
+ * URL (a content bug), the winner is deterministic rather than readdir-order
+ * dependent.
+ *
+ * Flat files are indexed before sub-directories, and the first entry to claim
+ * a URL keeps it. Only direct children are considered: sub-directories are
+ * probed for `index.md` and then `index.mdx`, and are not descended into any
+ * further. Sub-directories whose name starts with `_` or `.` are skipped.
+ *
+ * Assumes `readDeclaredPageUrl` resolves to undefined (rather than throwing)
+ * for an index file that does not exist — TODO confirm against
+ * `getCachedMarkdownFile`.
+ *
+ * @param collectionPathAbs - Absolute path of the collection directory.
+ * @returns Map from normalized declared URL to entry file path; empty when
+ * the directory cannot be read.
+ */
+async function buildDeclaredUrlIndex(collectionPathAbs: string): Promise<Map<string, string>> {
+	const index = new Map<string, string>()
+	let dirEntries
+	try {
+		dirEntries = await fs.readdir(collectionPathAbs, { withFileTypes: true })
+	} catch {
+		return index // unreadable directory: report "nothing declared" instead of failing
+	}
+	const files = dirEntries
+		.filter(e => e.isFile() && /\.mdx?$/.test(e.name))
+		.map(e => e.name)
+		.sort()
+	for (const name of files) {
+		const file = path.join(collectionPathAbs, name)
+		const declared = await readDeclaredPageUrl(file)
+		if (declared && !index.has(declared)) index.set(declared, file) // first claimant of a URL wins
+	}
+	const subDirs = dirEntries
+		.filter(e => e.isDirectory() && !e.name.startsWith('_') && !e.name.startsWith('.'))
+		.map(e => e.name)
+		.sort()
+	for (const dir of subDirs) {
+		for (const idx of ['index.md', 'index.mdx']) {
+			const file = path.join(collectionPathAbs, dir, idx)
+			const declared = await readDeclaredPageUrl(file)
+			if (declared) {
+				if (!index.has(declared)) index.set(declared, file)
+				break // this folder has a declaring index file; do not also probe the other extension
+			}
+		}
+	}
+	return index
+}
 /**
  * Find a markdown file in a collection directory by slug
  */
@@ -370,23 +569,11 @@ export async function findMarkdownSourceLocation(
 		const { lines } = cached
 		const normalizedSearch = normalizeText(textContent)
-		// Find frontmatter boundaries
-		let frontmatterStart = -1
-		let frontmatterEnd = -1
-		for (let i = 0; i < lines.length; i++) {
-			if (lines[i]?.trim() === '---') {
-				if (frontmatterStart === -1) {
-					frontmatterStart = i
-				} else {
-					frontmatterEnd = i
-					break
-				}
-			}
-		}
-		if (frontmatterEnd <= 0) return undefined
+		const bounds = findFrontmatterBounds(lines)
+		if (!bounds) return undefined
-		const yamlStr = lines.slice(frontmatterStart + 1, frontmatterEnd).join('\n')
-		const lineOffset = frontmatterStart + 1
+		const yamlStr = lines.slice(bounds.start + 1, bounds.end).join('\n')
+		const lineOffset = bounds.start + 1
 		return findScalarInYamlAst(yamlStr, lineOffset, normalizedSearch, lines, collectionInfo)
 	} catch {
 		// Error reading file
@@ -550,20 +737,10 @@ export async function findFieldInCollectionEntry(
 		// For markdown, search inside frontmatter only
 		const { lines } = cached
-		let fmStart = -1
-		let fmEnd = -1
-		for (let i = 0; i < lines.length; i++) {
-			if (lines[i]?.trim() === '---') {
-				if (fmStart === -1) fmStart = i
-				else {
-					fmEnd = i
-					break
-				}
-			}
-		}
-		if (fmEnd <= 0) return undefined
-		const yamlStr = lines.slice(fmStart + 1, fmEnd).join('\n')
-		return findFieldByNameInYaml(yamlStr, fmStart + 1, fieldName, lines, info)
+		const bounds = findFrontmatterBounds(lines)
+		if (!bounds) return undefined
+		const yamlStr = lines.slice(bounds.start + 1, bounds.end).join('\n')
+		return findFieldByNameInYaml(yamlStr, bounds.start + 1, fieldName, lines, info)
 	} catch {
 		return undefined
 	}
@@ -598,20 +775,10 @@ export async function findFieldsInCollectionEntry(
 		// For markdown, search inside frontmatter only
 		const { lines } = cached
-		let fmStart = -1
-		let fmEnd = -1
-		for (let i = 0; i < lines.length; i++) {
-			if (lines[i]?.trim() === '---') {
-				if (fmStart === -1) fmStart = i
-				else {
-					fmEnd = i
-					break
-				}
-			}
-		}
-		if (fmEnd <= 0) return new Map()
-		const yamlStr = lines.slice(fmStart + 1, fmEnd).join('\n')
-		return findFieldsByNameInYaml(yamlStr, fmStart + 1, fieldNames, lines, info)
+		const bounds = findFrontmatterBounds(lines)
+		if (!bounds) return new Map()
+		const yamlStr = lines.slice(bounds.start + 1, bounds.end).join('\n')
+		return findFieldsByNameInYaml(yamlStr, bounds.start + 1, fieldNames, lines, info)
 	} catch {
 		return new Map()
 	}
@@ -695,27 +862,12 @@ export async function parseMarkdownContent(
 		const { lines } = cached
-		// Parse frontmatter
-		let frontmatterStart = -1
-		let frontmatterEnd = -1
-		for (let i = 0; i < lines.length; i++) {
-			const line = lines[i]?.trim()
-			if (line === '---') {
-				if (frontmatterStart === -1) {
-					frontmatterStart = i
-				} else {
-					frontmatterEnd = i
-					break
-				}
-			}
-		}
+		const bounds = findFrontmatterBounds(lines)
 		const frontmatter: Record<string, { value: string; line: number }> = {}
 		// Extract frontmatter fields using yaml parser
-		if (frontmatterEnd > 0) {
-			const yamlStr = lines.slice(frontmatterStart + 1, frontmatterEnd).join('\n')
+		if (bounds) {
+			const yamlStr = lines.slice(bounds.start + 1, bounds.end).join('\n')
 			const lineCounter = new LineCounter()
 			const doc = parseDocument(yamlStr, { lineCounter })
@@ -726,7 +878,7 @@ export async function parseMarkdownContent(
 						const value = isScalar(pair.value) ? String(pair.value.value) : ''
 						const keyRange = (pair.key as any).range
 						const yamlLine = keyRange ? lineCounter.linePos(keyRange[0]).line : 0
-						const fileLine = yamlLine + frontmatterStart + 1
+						const fileLine = yamlLine + bounds.start + 1
 						if (key && value) {
 							frontmatter[key] = { value, line: fileLine }
 						}
@@ -736,7 +888,7 @@ export async function parseMarkdownContent(
 		}
 		// Extract body (everything after frontmatter)
-		const bodyStartLine = frontmatterEnd > 0 ? frontmatterEnd + 1 : 0
+		const bodyStartLine = bounds ? bounds.end + 1 : 0
 		const bodyLines = lines.slice(bodyStartLine)
 		const body = bodyLines.join('\n').trim()