npm - @markuplint/html-parser - Versions diffs - 4.6.23 → 5.0.0-alpha.1 - Mend

@markuplint/html-parser 4.6.23 → 5.0.0-alpha.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (6)

package/ARCHITECTURE.md CHANGED Viewed

@@ -8,10 +8,9 @@
 ```
 src/
-├── index.ts                              — Re-exports HtmlParser, parser, getNamespace
+├── index.ts                              — Re-exports HtmlParser and parser
 ├── parser.ts                             — HtmlParser class extending Parser<Node, State>
 ├── types.ts                              — Re-exports parse5 types (Node, Element, etc.)
-├── get-namespace.ts                      — Namespace URI resolution (HTML/SVG/MathML)
 ├── is-document-fragment.ts               — Regex-based fragment vs document detection
 └── optimize-starts-head-or-body.ts       — Head/body tag placeholder optimization
 ```
@@ -28,7 +27,6 @@ flowchart TD
     subgraph pkg ["@markuplint/html-parser"]
         htmlParser["HtmlParser\nextends Parser‹Node, State›"]
-        getNs["getNamespace()\nNamespace resolution"]
         isFragment["isDocumentFragment()\nFragment detection"]
         optimize["optimizeStartsHeadTagOrBodyTag\nHead/body optimization"]
         types["types.ts\nparse5 type re-exports"]
@@ -44,11 +42,8 @@ flowchart TD
     mlAst -->|"AST types"| htmlParser
     parserUtils -->|"Parser base class"| htmlParser
     parse5 -->|"parse / parseFragment"| htmlParser
-    parse5 -->|"parseFragment"| getNs
     htmlParser --> isFragment
     htmlParser --> optimize
-    htmlParser --> getNs
     htmlParser -->|"extends / imports"| downstream
 ```
@@ -73,15 +68,15 @@ The parser maintains internal state through the `State` type:
 ### Override Methods
-| Method              | Purpose                                                                                                  |
-| ------------------- | -------------------------------------------------------------------------------------------------------- |
-| `tokenize()`        | Invokes parse5 `parse()` or `parseFragment()` based on fragment detection                                |
-| `beforeParse()`     | Sets up head/body optimization and offset tracking                                                       |
-| `afterParse()`      | Restores original head/body tag names from placeholders                                                  |
-| `nodeize()`         | Converts parse5 nodes to markuplint AST nodes, handling ghost elements, template content, and namespaces |
-| `afterNodeize()`    | Updates `afterPosition` state for ghost element positioning                                              |
-| `visitText()`       | Delegates to parent with `researchTags: true` and `invalidTagAsText: true`                               |
-| `visitSpreadAttr()` | Returns `null` (HTML does not support spread attributes)                                                 |
+| Method              | Purpose                                                                                     |
+| ------------------- | ------------------------------------------------------------------------------------------- |
+| `tokenize()`        | Invokes parse5 `parse()` or `parseFragment()` based on fragment detection                   |
+| `beforeParse()`     | Sets up head/body optimization and offset tracking                                          |
+| `afterParse()`      | Restores original head/body tag names from placeholders                                     |
+| `nodeize()`         | Converts parse5 nodes to markuplint AST nodes, handling ghost elements and template content |
+| `afterNodeize()`    | Updates `afterPosition` state for ghost element positioning                                 |
+| `visitText()`       | Delegates to parent with `researchTags: true` and `invalidTagAsText: true`                  |
+| `visitSpreadAttr()` | Returns `null` (HTML does not support spread attributes)                                    |
 ## Parse Pipeline
@@ -91,7 +86,7 @@ The HTML-specific pipeline extends the base `Parser` pipeline:
 flowchart LR
     A["beforeParse\n- super.beforeParse()\n- head/body optimization setup\n- offset tracking"]
     B["tokenize\n- isDocumentFragment() check\n- parse5 parse/parseFragment"]
-    C["nodeize\n- Ghost element handling\n- Doctype/text/comment/element dispatch\n- Template content extraction\n- Namespace resolution"]
+    C["nodeize\n- Ghost element handling\n- Doctype/text/comment/element dispatch\n- Template content extraction"]
     D["afterNodeize\n- Update afterPosition state"]
     E["afterParse\n- Restore head/body names"]
@@ -132,12 +127,7 @@ The optimization uses a placeholder replacement strategy:
 ## Namespace Resolution
-`getNamespace()` determines the namespace URI for an element:
-- **Default**: `http://www.w3.org/1999/xhtml` (HTML namespace)
-- **SVG context**: When the parent namespace is `http://www.w3.org/2000/svg`, wraps the tag in `<svg>` and parses to determine the resolved namespace
-- **MathML context**: When the parent namespace is `http://www.w3.org/1998/Math/MathML`, wraps in `<math>` and parses
-- **Fallback**: For tags that produce no nodes as fragments, falls back to `parse()` (full document mode)
+Namespace resolution is handled by `getNamespace()` in `@markuplint/parser-utils`. The HTML parser delegates namespace detection to the base `Parser` class, which automatically determines namespaces from tag names and parent node context.
 ## Fragment vs Document Detection

package/CHANGELOG.md CHANGED Viewed

@@ -3,6 +3,29 @@
 All notable changes to this project will be documented in this file.
 See [Conventional Commits](https://conventionalcommits.org) for commit guidelines.
+# [5.0.0-alpha.1](https://github.com/markuplint/markuplint/compare/v5.0.0-alpha.0...v5.0.0-alpha.1) (2026-02-22)
+**Note:** Version bump only for package @markuplint/html-parser
+# [5.0.0-alpha.0](https://github.com/markuplint/markuplint/compare/v4.14.1...v5.0.0-alpha.0) (2026-02-20)
+### Bug Fixes
+- **ml-core:** improve detection of namespace ([5b507ad](https://github.com/markuplint/markuplint/commit/5b507ad7c19c5015b8ce587845d901e31dfa6518))
+- refactor(html-parser)!: update for simplified AST token properties ([524ce5d](https://github.com/markuplint/markuplint/commit/524ce5d6fc23c8bff73583ed4ac42fdff1759938))
+### BREAKING CHANGES
+- Adapt to renamed MLASTToken properties.
+* Use getEndPosition() for ghost element position calculation
+* Update test assertions: startCol -> col, startOffset -> offset,
+  startLine -> line
+* Remove endOffset/endLine/endCol assertions from tests
+Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
 ## [4.6.23](https://github.com/markuplint/markuplint/compare/@markuplint/html-parser@4.6.22...@markuplint/html-parser@4.6.23) (2026-02-10)
 **Note:** Version bump only for package @markuplint/html-parser

package/lib/index.d.ts CHANGED Viewed

@@ -1,2 +1 @@
-export { getNamespace } from './get-namespace.js';
 export { parser, HtmlParser } from './parser.js';

package/lib/index.js CHANGED Viewed

@@ -1,2 +1 @@
-export { getNamespace } from './get-namespace.js';
 export { parser, HtmlParser } from './parser.js';

package/lib/parser.js CHANGED Viewed

@@ -2,6 +2,7 @@ import { Parser } from '@markuplint/parser-utils';
 import { parse, parseFragment } from 'parse5';
 import { isDocumentFragment } from './is-document-fragment.js';
 import { optimizeStartsHeadTagOrBodyTagResume, optimizeStartsHeadTagOrBodyTagSetup, } from './optimize-starts-head-or-body.js';
+import { getEndPosition } from '@markuplint/parser-utils/location';
 /**
  * Parser implementation for standard HTML, built on top of parse5.
  * Handles document and fragment parsing, ghost elements (omitted tags),
@@ -57,24 +58,26 @@ export class HtmlParser extends Parser {
     nodeize(
     // eslint-disable-next-line @typescript-eslint/prefer-readonly-parameter-types
     originNode, parentNode, depth) {
-        const namespace = 'namespaceURI' in originNode ? originNode.namespaceURI : '';
         const location = originNode.sourceCodeLocation;
         if (!location) {
             // Ghost element
-            const afterNode = this.state.afterPosition.depth === depth ? this.state.afterPosition : parentNode;
-            const startOffset = afterNode?.endOffset ?? 0;
-            const startLine = afterNode?.endLine ?? 0;
-            const startCol = afterNode?.endCol ?? 0;
+            const afterNode = this.state.afterPosition.depth === depth
+                ? this.state.afterPosition
+                : parentNode
+                    ? getEndPosition(parentNode.raw, parentNode.offset, parentNode.line, parentNode.col)
+                    : null;
+            const offset = afterNode?.endOffset ?? 0;
+            const line = afterNode?.endLine ?? 0;
+            const col = afterNode?.endCol ?? 0;
             const childNodes = 'childNodes' in originNode ? originNode.childNodes : [];
             return this.visitElement({
                 raw: '',
-                startOffset,
-                startLine,
-                startCol,
+                offset,
+                line,
+                col,
                 depth,
                 parentNode,
                 nodeName: originNode.nodeName,
-                namespace,
             }, childNodes);
         }
         const { startOffset, endOffset } = location;
@@ -122,7 +125,6 @@ export class HtmlParser extends Parser {
                     depth,
                     parentNode,
                     nodeName: originNode.nodeName,
-                    namespace,
                 }, childNodes, {
                     createEndTagToken: () => {
                         const endTagLoc = 'endTag' in location ? location.endTag : null;
@@ -145,10 +147,9 @@ export class HtmlParser extends Parser {
         const after = super.afterNodeize(siblings, parentNode, depth);
         const prevNode = after.siblings.at(-1) ?? after.ancestors.findLast(n => n.depth === depth);
         if (prevNode) {
+            const endPos = getEndPosition(prevNode.raw, prevNode.offset, prevNode.line, prevNode.col);
             this.state.afterPosition = {
-                endOffset: prevNode.endOffset,
-                endLine: prevNode.endLine,
-                endCol: prevNode.endCol,
+                ...endPos,
                 depth,
             };
         }

package/package.json CHANGED Viewed

@@ -1,10 +1,13 @@
 {
 	"name": "@markuplint/html-parser",
-	"version": "4.6.23",
+	"version": "5.0.0-alpha.1",
 	"description": "HTML parser for markuplint",
 	"repository": "git@github.com:markuplint/markuplint.git",
 	"author": "Yusuke Hirao <yusukehirao@me.com>",
 	"license": "MIT",
+	"engines": {
+		"node": ">=22"
+	},
 	"type": "module",
 	"exports": {
 		".": {
@@ -24,10 +27,10 @@
 		"clean": "tsc --build --clean tsconfig.build.json"
 	},
 	"dependencies": {
-		"@markuplint/ml-ast": "4.4.11",
-		"@markuplint/parser-utils": "4.8.11",
+		"@markuplint/ml-ast": "5.0.0-alpha.1",
+		"@markuplint/parser-utils": "5.0.0-alpha.1",
 		"parse5": "8.0.0",
-		"type-fest": "4.41.0"
+		"type-fest": "5.4.4"
 	},
-	"gitHead": "193ee7c1262bbed95424e38efdf1a8e56ff049f4"
+	"gitHead": "78a295e73a097a1ce09c777c06fa21ab68136387"
 }