@wdprlib/parser 3.1.2 → 4.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/index.cjs +10456 -8230
- package/dist/index.d.cts +313 -337
- package/dist/index.d.ts +313 -337
- package/dist/index.js +10460 -8234
- package/package.json +5 -3
- package/src/index.ts +170 -0
- package/src/lexer/anchor.ts +48 -0
- package/src/lexer/index.ts +21 -0
- package/src/lexer/lexer.ts +201 -0
- package/src/lexer/options.ts +19 -0
- package/src/lexer/punctuation.ts +70 -0
- package/src/lexer/quoted-string.ts +16 -0
- package/src/lexer/runs.ts +85 -0
- package/src/lexer/spacing-actions.ts +24 -0
- package/src/lexer/state.ts +103 -0
- package/src/lexer/syntax-actions.ts +80 -0
- package/src/lexer/text-actions.ts +41 -0
- package/src/lexer/token-actions.ts +136 -0
- package/src/lexer/token-factory.ts +62 -0
- package/src/lexer/tokenize.ts +18 -0
- package/src/lexer/tokens.ts +141 -0
- package/src/parser/constants.ts +175 -0
- package/src/parser/depth/index.ts +111 -0
- package/src/parser/depth/stack.ts +82 -0
- package/src/parser/index.ts +18 -0
- package/src/parser/parse/block.ts +42 -0
- package/src/parser/parse/context.ts +26 -0
- package/src/parser/parse/footnotes.ts +25 -0
- package/src/parser/parse/index.ts +42 -0
- package/src/parser/parse/options.ts +34 -0
- package/src/parser/parse/parser.ts +79 -0
- package/src/parser/parse/plain-non-ascii.ts +129 -0
- package/src/parser/parse/result.ts +57 -0
- package/src/parser/parse/source.ts +11 -0
- package/src/parser/postprocess/divAdjacentParagraph.ts +76 -0
- package/src/parser/postprocess/index.ts +15 -0
- package/src/parser/postprocess/spanStrip/clean-element.ts +168 -0
- package/src/parser/postprocess/spanStrip/cleanup.ts +25 -0
- package/src/parser/postprocess/spanStrip/empty-spans.ts +36 -0
- package/src/parser/postprocess/spanStrip/escaped.ts +78 -0
- package/src/parser/postprocess/spanStrip/factory.ts +23 -0
- package/src/parser/postprocess/spanStrip/index.ts +8 -0
- package/src/parser/postprocess/spanStrip/merge.ts +117 -0
- package/src/parser/postprocess/spanStrip/predicates.ts +59 -0
- package/src/parser/postprocess/spanStrip/split.ts +67 -0
- package/src/parser/preprocess/expr/chars.ts +15 -0
- package/src/parser/preprocess/expr/evaluate.ts +22 -0
- package/src/parser/preprocess/expr/index.ts +45 -0
- package/src/parser/preprocess/expr/kind.ts +19 -0
- package/src/parser/preprocess/expr/parse.ts +103 -0
- package/src/parser/preprocess/expr/scan.ts +34 -0
- package/src/parser/preprocess/expr/types.ts +14 -0
- package/src/parser/preprocess/index.ts +38 -0
- package/src/parser/preprocess/typography.ts +132 -0
- package/src/parser/preprocess/utils/bracket-depths.ts +98 -0
- package/src/parser/preprocess/utils/index.ts +13 -0
- package/src/parser/preprocess/utils/raw-regions.ts +153 -0
- package/src/parser/preprocess/whitespace/detection.ts +39 -0
- package/src/parser/preprocess/whitespace/index.ts +79 -0
- package/src/parser/preprocess/whitespace/leading-spaces.ts +11 -0
- package/src/parser/preprocess/whitespace/patterns.ts +23 -0
- package/src/parser/rules/block/align/body.ts +46 -0
- package/src/parser/rules/block/align/element.ts +13 -0
- package/src/parser/rules/block/align/index.ts +90 -0
- package/src/parser/rules/block/align/syntax.ts +113 -0
- package/src/parser/rules/block/bibliography/body.ts +81 -0
- package/src/parser/rules/block/bibliography/entries.ts +49 -0
- package/src/parser/rules/block/bibliography/entry-content.ts +73 -0
- package/src/parser/rules/block/bibliography/entry-key.ts +83 -0
- package/src/parser/rules/block/bibliography/index.ts +90 -0
- package/src/parser/rules/block/bibliography/open.ts +53 -0
- package/src/parser/rules/block/block-list/bare-content.ts +105 -0
- package/src/parser/rules/block/block-list/bare-paragraph.ts +60 -0
- package/src/parser/rules/block/block-list/index.ts +51 -0
- package/src/parser/rules/block/block-list/item-content.ts +132 -0
- package/src/parser/rules/block/block-list/li-content.ts +107 -0
- package/src/parser/rules/block/block-list/li-item.ts +77 -0
- package/src/parser/rules/block/block-list/list-block.ts +100 -0
- package/src/parser/rules/block/block-list/open.ts +51 -0
- package/src/parser/rules/block/block-list/tags.ts +50 -0
- package/src/parser/rules/block/blockquote/build.ts +62 -0
- package/src/parser/rules/block/blockquote/index.ts +80 -0
- package/src/parser/rules/block/blockquote/line.ts +79 -0
- package/src/parser/rules/block/blockquote/lines.ts +39 -0
- package/src/parser/rules/block/center/index.ts +72 -0
- package/src/parser/rules/block/center/open.ts +27 -0
- package/src/parser/rules/block/clear-float/index.ts +51 -0
- package/src/parser/rules/block/clear-float/syntax.ts +43 -0
- package/src/parser/rules/block/code/attributes.ts +30 -0
- package/src/parser/rules/block/code/content.ts +57 -0
- package/src/parser/rules/block/code/index.ts +100 -0
- package/src/parser/rules/block/collapsible/attributes.ts +95 -0
- package/src/parser/rules/block/collapsible/body.ts +69 -0
- package/src/parser/rules/block/collapsible/index.ts +117 -0
- package/src/parser/rules/block/collapsible/open.ts +51 -0
- package/src/parser/rules/block/collapsible/orphans.ts +31 -0
- package/src/parser/rules/block/collapsible/tags.ts +17 -0
- package/src/parser/rules/block/comment/consume.ts +37 -0
- package/src/parser/rules/block/comment/index.ts +47 -0
- package/src/parser/rules/block/content-separator/index.ts +49 -0
- package/src/parser/rules/block/content-separator/syntax.ts +33 -0
- package/src/parser/rules/block/definition-list/collect.ts +40 -0
- package/src/parser/rules/block/definition-list/index.ts +63 -0
- package/src/parser/rules/block/definition-list/item-key.ts +95 -0
- package/src/parser/rules/block/definition-list/item-value.ts +56 -0
- package/src/parser/rules/block/definition-list/items.ts +54 -0
- package/src/parser/rules/block/div/body.ts +41 -0
- package/src/parser/rules/block/div/close.ts +41 -0
- package/src/parser/rules/block/div/failed.ts +117 -0
- package/src/parser/rules/block/div/index.ts +112 -0
- package/src/parser/rules/block/div/nesting.ts +37 -0
- package/src/parser/rules/block/div/open.ts +59 -0
- package/src/parser/rules/block/div/paragraph-strip.ts +44 -0
- package/src/parser/rules/block/embed-block/content.ts +53 -0
- package/src/parser/rules/block/embed-block/index.ts +91 -0
- package/src/parser/rules/block/embed-block/open.ts +52 -0
- package/src/parser/rules/block/embed-block/tags.ts +5 -0
- package/src/parser/rules/block/footnoteblock/attributes.ts +73 -0
- package/src/parser/rules/block/footnoteblock/index.ts +82 -0
- package/src/parser/rules/block/footnoteblock/open.ts +53 -0
- package/src/parser/rules/block/heading/index.ts +87 -0
- package/src/parser/rules/block/heading/open.ts +50 -0
- package/src/parser/rules/block/heading/toc-text.ts +26 -0
- package/src/parser/rules/block/horizontal-rule/index.ts +44 -0
- package/src/parser/rules/block/horizontal-rule/syntax.ts +21 -0
- package/src/parser/rules/block/html/body.ts +114 -0
- package/src/parser/rules/block/html/diagnostics.ts +11 -0
- package/src/parser/rules/block/html/index.ts +95 -0
- package/src/parser/rules/block/html/open.ts +36 -0
- package/src/parser/rules/block/iframe/attributes.ts +106 -0
- package/src/parser/rules/block/iframe/index.ts +73 -0
- package/src/parser/rules/block/iframe/open.ts +58 -0
- package/src/parser/rules/block/iframe/source.ts +24 -0
- package/src/parser/rules/block/iframe/url.ts +38 -0
- package/src/parser/rules/block/iftags/body.ts +48 -0
- package/src/parser/rules/block/iftags/condition.ts +24 -0
- package/src/parser/rules/block/iftags/index.ts +108 -0
- package/src/parser/rules/block/include/arguments.ts +48 -0
- package/src/parser/rules/block/include/index.ts +75 -0
- package/src/parser/rules/block/include/location.ts +24 -0
- package/src/parser/rules/block/include/variables.ts +37 -0
- package/src/parser/rules/block/index.ts +127 -0
- package/src/parser/rules/block/list/index.ts +73 -0
- package/src/parser/rules/block/list/line.ts +77 -0
- package/src/parser/rules/block/list/native.ts +89 -0
- package/src/parser/rules/block/math/content.ts +54 -0
- package/src/parser/rules/block/math/index.ts +106 -0
- package/src/parser/rules/block/math/name.ts +35 -0
- package/src/parser/rules/block/module/backlinks/index.ts +31 -0
- package/src/parser/rules/block/module/backlinks/types.ts +21 -0
- package/src/parser/rules/block/module/body.ts +92 -0
- package/src/parser/rules/block/module/categories/index.ts +34 -0
- package/src/parser/rules/block/module/categories/types.ts +21 -0
- package/src/parser/rules/block/module/css/index.ts +37 -0
- package/src/parser/rules/block/module/element.ts +33 -0
- package/src/parser/rules/block/module/iftags/condition.ts +109 -0
- package/src/parser/rules/block/module/iftags/index.ts +26 -0
- package/src/parser/rules/block/module/iftags/preprocess.ts +140 -0
- package/src/parser/rules/block/module/iftags/resolve.ts +73 -0
- package/src/parser/rules/block/module/iftags/types.ts +63 -0
- package/src/parser/rules/block/module/include/directive.ts +91 -0
- package/src/parser/rules/block/module/include/index.ts +29 -0
- package/src/parser/rules/block/module/include/references.ts +42 -0
- package/src/parser/rules/block/module/include/resolve/cache.ts +44 -0
- package/src/parser/rules/block/module/include/resolve/index.ts +106 -0
- package/src/parser/rules/block/module/include/resolve/iterate.ts +202 -0
- package/src/parser/rules/block/module/include/resolve/replace.ts +31 -0
- package/src/parser/rules/block/module/include/resolve/types.ts +105 -0
- package/src/parser/rules/block/module/include/scanner.ts +121 -0
- package/src/parser/rules/block/module/index.ts +134 -0
- package/src/parser/rules/block/module/join/index.ts +34 -0
- package/src/parser/rules/block/module/join/types.ts +23 -0
- package/src/parser/rules/block/module/listpages/compiler.ts +73 -0
- package/src/parser/rules/block/module/listpages/extract.ts +76 -0
- package/src/parser/rules/block/module/listpages/extraction/listpages.ts +42 -0
- package/src/parser/rules/block/module/listpages/extraction/listusers.ts +30 -0
- package/src/parser/rules/block/module/listpages/extraction/query.ts +51 -0
- package/src/parser/rules/block/module/listpages/extraction/result.ts +18 -0
- package/src/parser/rules/block/module/listpages/extraction/template.ts +96 -0
- package/src/parser/rules/block/module/listpages/extraction/variables.ts +58 -0
- package/src/parser/rules/block/module/listpages/index.ts +83 -0
- package/src/parser/rules/block/module/listpages/normalization/date-selector.ts +53 -0
- package/src/parser/rules/block/module/listpages/normalization/numeric-selector.ts +32 -0
- package/src/parser/rules/block/module/listpages/normalization/order-parent.ts +82 -0
- package/src/parser/rules/block/module/listpages/normalization/selectors.ts +2 -0
- package/src/parser/rules/block/module/listpages/normalization/tags-category.ts +86 -0
- package/src/parser/rules/block/module/listpages/normalize.ts +74 -0
- package/src/parser/rules/block/module/listpages/parser.ts +106 -0
- package/src/parser/rules/block/module/listpages/resolution/items.ts +43 -0
- package/src/parser/rules/block/module/listpages/resolution/wrapper.ts +42 -0
- package/src/parser/rules/block/module/listpages/resolve.ts +60 -0
- package/src/parser/rules/block/module/listpages/template/format/content.ts +41 -0
- package/src/parser/rules/block/module/listpages/template/format/date.ts +116 -0
- package/src/parser/rules/block/module/listpages/template/format/index.ts +4 -0
- package/src/parser/rules/block/module/listpages/template/format/tags.ts +7 -0
- package/src/parser/rules/block/module/listpages/template/format/user.ts +9 -0
- package/src/parser/rules/block/module/listpages/template/getters/index.ts +36 -0
- package/src/parser/rules/block/module/listpages/template/getters/parameterized.ts +60 -0
- package/src/parser/rules/block/module/listpages/template/getters/simple.ts +65 -0
- package/src/parser/rules/block/module/listpages/template/getters/types.ts +3 -0
- package/src/parser/rules/block/module/listpages/template/syntax.ts +97 -0
- package/src/parser/rules/block/module/listpages/types/data-fetcher.ts +15 -0
- package/src/parser/rules/block/module/listpages/types/data-requirements.ts +52 -0
- package/src/parser/rules/block/module/listpages/types/external-data.ts +77 -0
- package/src/parser/rules/block/module/listpages/types/index.ts +17 -0
- package/src/parser/rules/block/module/listpages/types/normalized-query.ts +120 -0
- package/src/parser/rules/block/module/listpages/types/query.ts +67 -0
- package/src/parser/rules/block/module/listpages/types/template.ts +17 -0
- package/src/parser/rules/block/module/listpages/types/variables.ts +69 -0
- package/src/parser/rules/block/module/listpages/url-resolution/fields.ts +48 -0
- package/src/parser/rules/block/module/listpages/url-resolution/params.ts +19 -0
- package/src/parser/rules/block/module/listpages/url-resolution/query.ts +24 -0
- package/src/parser/rules/block/module/listpages/url-resolution/resolve.ts +53 -0
- package/src/parser/rules/block/module/listpages/url-resolution/value.ts +25 -0
- package/src/parser/rules/block/module/listpages/url-resolver.ts +29 -0
- package/src/parser/rules/block/module/listusers/compiler.ts +56 -0
- package/src/parser/rules/block/module/listusers/extract.ts +40 -0
- package/src/parser/rules/block/module/listusers/getters.ts +21 -0
- package/src/parser/rules/block/module/listusers/index.ts +36 -0
- package/src/parser/rules/block/module/listusers/parser.ts +54 -0
- package/src/parser/rules/block/module/listusers/resolve.ts +58 -0
- package/src/parser/rules/block/module/listusers/types.ts +93 -0
- package/src/parser/rules/block/module/listusers/variables.ts +15 -0
- package/src/parser/rules/block/module/mapping.ts +61 -0
- package/src/parser/rules/block/module/open.ts +57 -0
- package/src/parser/rules/block/module/page-tree/index.ts +38 -0
- package/src/parser/rules/block/module/page-tree/types.ts +29 -0
- package/src/parser/rules/block/module/rate/index.ts +28 -0
- package/src/parser/rules/block/module/rate/types.ts +19 -0
- package/src/parser/rules/block/module/resolution/contexts.ts +78 -0
- package/src/parser/rules/block/module/resolution/data-maps.ts +39 -0
- package/src/parser/rules/block/module/resolution/dynamic-modules.ts +93 -0
- package/src/parser/rules/block/module/resolution/styles.ts +53 -0
- package/src/parser/rules/block/module/resolution/walk-resolve.ts +107 -0
- package/src/parser/rules/block/module/resolve.ts +198 -0
- package/src/parser/rules/block/module/rule.ts +56 -0
- package/src/parser/rules/block/module/types-common.ts +70 -0
- package/src/parser/rules/block/module/types.ts +61 -0
- package/src/parser/rules/block/module/utils.ts +43 -0
- package/src/parser/rules/block/module/walk/children.ts +35 -0
- package/src/parser/rules/block/module/walk/index.ts +9 -0
- package/src/parser/rules/block/module/walk/map/index.ts +2 -0
- package/src/parser/rules/block/module/walk/map/stateful-definition-list.ts +25 -0
- package/src/parser/rules/block/module/walk/map/stateful-list.ts +40 -0
- package/src/parser/rules/block/module/walk/map/stateful-table.ts +23 -0
- package/src/parser/rules/block/module/walk/map/stateful-tabs.ts +19 -0
- package/src/parser/rules/block/module/walk/map/stateful.ts +71 -0
- package/src/parser/rules/block/module/walk/map/stateless-definition-list.ts +12 -0
- package/src/parser/rules/block/module/walk/map/stateless-list.ts +29 -0
- package/src/parser/rules/block/module/walk/map/stateless-table.ts +11 -0
- package/src/parser/rules/block/module/walk/map/stateless-tabs.ts +5 -0
- package/src/parser/rules/block/module/walk/map/stateless.ts +51 -0
- package/src/parser/rules/block/module/walk/map/types.ts +6 -0
- package/src/parser/rules/block/module/walk/traverse.ts +65 -0
- package/src/parser/rules/block/orphan-li/content.ts +60 -0
- package/src/parser/rules/block/orphan-li/index.ts +75 -0
- package/src/parser/rules/block/orphan-li/open.ts +25 -0
- package/src/parser/rules/block/orphan-li/tags.ts +40 -0
- package/src/parser/rules/block/paragraph/content.ts +12 -0
- package/src/parser/rules/block/paragraph/index.ts +60 -0
- package/src/parser/rules/block/paragraph/normalize.ts +52 -0
- package/src/parser/rules/block/paragraph/span-markers.ts +52 -0
- package/src/parser/rules/block/parsing/attributes/index.ts +32 -0
- package/src/parser/rules/block/parsing/attributes/names.ts +93 -0
- package/src/parser/rules/block/parsing/attributes/scanner.ts +75 -0
- package/src/parser/rules/block/parsing/attributes/values.ts +26 -0
- package/src/parser/rules/block/parsing/block-item.ts +29 -0
- package/src/parser/rules/block/parsing/content.ts +127 -0
- package/src/parser/rules/block/parsing/end-condition.ts +51 -0
- package/src/parser/rules/block/parsing/inline-content.ts +105 -0
- package/src/parser/rules/block/parsing/inline-newline.ts +41 -0
- package/src/parser/rules/block/parsing/non-boundary.ts +24 -0
- package/src/parser/rules/block/parsing/rule-dispatch.ts +44 -0
- package/src/parser/rules/block/table/index.ts +80 -0
- package/src/parser/rules/block/table/pipe/cell-start.ts +69 -0
- package/src/parser/rules/block/table/pipe/cell.ts +106 -0
- package/src/parser/rules/block/table/pipe/index.ts +2 -0
- package/src/parser/rules/block/table/pipe/row.ts +88 -0
- package/src/parser/rules/block/table/pipe/tokens.ts +14 -0
- package/src/parser/rules/block/table/pipe/trim.ts +50 -0
- package/src/parser/rules/block/table-block/body.ts +79 -0
- package/src/parser/rules/block/table-block/cell-attributes.ts +33 -0
- package/src/parser/rules/block/table-block/cell-boundary.ts +99 -0
- package/src/parser/rules/block/table-block/cell-content/index.ts +88 -0
- package/src/parser/rules/block/table-block/cell-content/segments.ts +134 -0
- package/src/parser/rules/block/table-block/cell-newline.ts +47 -0
- package/src/parser/rules/block/table-block/cell.ts +64 -0
- package/src/parser/rules/block/table-block/index.ts +113 -0
- package/src/parser/rules/block/table-block/row-boundary.ts +75 -0
- package/src/parser/rules/block/table-block/structure.ts +80 -0
- package/src/parser/rules/block/tabview/body.ts +64 -0
- package/src/parser/rules/block/tabview/index.ts +90 -0
- package/src/parser/rules/block/tabview/open.ts +50 -0
- package/src/parser/rules/block/tabview/tab.ts +92 -0
- package/src/parser/rules/block/tabview/tags.ts +30 -0
- package/src/parser/rules/block/toc/element.ts +11 -0
- package/src/parser/rules/block/toc/index.ts +44 -0
- package/src/parser/rules/block/toc/open.ts +84 -0
- package/src/parser/rules/block/utils.ts +15 -0
- package/src/parser/rules/common/attribute-safety.ts +109 -0
- package/src/parser/rules/common/block-name.ts +33 -0
- package/src/parser/rules/common/index.ts +2 -0
- package/src/parser/rules/contracts/index.ts +3 -0
- package/src/parser/rules/contracts/parse-context.ts +38 -0
- package/src/parser/rules/contracts/rule.ts +43 -0
- package/src/parser/rules/contracts/scope.ts +31 -0
- package/src/parser/rules/index.ts +49 -0
- package/src/parser/rules/inline/anchor/attributes.ts +54 -0
- package/src/parser/rules/inline/anchor/child.ts +26 -0
- package/src/parser/rules/inline/anchor/close.ts +34 -0
- package/src/parser/rules/inline/anchor/content.ts +59 -0
- package/src/parser/rules/inline/anchor/index.ts +103 -0
- package/src/parser/rules/inline/anchor/newline.ts +26 -0
- package/src/parser/rules/inline/anchor/open.ts +47 -0
- package/src/parser/rules/inline/anchor/paragraph-strip.ts +14 -0
- package/src/parser/rules/inline/anchor/syntax.ts +40 -0
- package/src/parser/rules/inline/anchor-name/index.ts +38 -0
- package/src/parser/rules/inline/anchor-name/name.ts +39 -0
- package/src/parser/rules/inline/anchor-name/syntax.ts +46 -0
- package/src/parser/rules/inline/bibcite/element.ts +14 -0
- package/src/parser/rules/inline/bibcite/index.ts +34 -0
- package/src/parser/rules/inline/bibcite/syntax.ts +64 -0
- package/src/parser/rules/inline/bold.ts +49 -0
- package/src/parser/rules/inline/color/index.ts +35 -0
- package/src/parser/rules/inline/color/syntax.ts +69 -0
- package/src/parser/rules/inline/comment/consume.ts +31 -0
- package/src/parser/rules/inline/comment/index.ts +64 -0
- package/src/parser/rules/inline/equation-ref/element.ts +8 -0
- package/src/parser/rules/inline/equation-ref/index.ts +34 -0
- package/src/parser/rules/inline/equation-ref/syntax.ts +45 -0
- package/src/parser/rules/inline/expr/branch.ts +104 -0
- package/src/parser/rules/inline/expr/conditional-branch.ts +27 -0
- package/src/parser/rules/inline/expr/conditional.ts +80 -0
- package/src/parser/rules/inline/expr/depth.ts +25 -0
- package/src/parser/rules/inline/expr/elements.ts +39 -0
- package/src/parser/rules/inline/expr/index.ts +84 -0
- package/src/parser/rules/inline/expr/syntax.ts +45 -0
- package/src/parser/rules/inline/footnote/child.ts +22 -0
- package/src/parser/rules/inline/footnote/close.ts +33 -0
- package/src/parser/rules/inline/footnote/content.ts +54 -0
- package/src/parser/rules/inline/footnote/elements.ts +38 -0
- package/src/parser/rules/inline/footnote/index.ts +54 -0
- package/src/parser/rules/inline/footnote/newline.ts +27 -0
- package/src/parser/rules/inline/footnote/open.ts +38 -0
- package/src/parser/rules/inline/formatting/container.ts +50 -0
- package/src/parser/rules/inline/guillemet/index.ts +56 -0
- package/src/parser/rules/inline/guillemet/text.ts +11 -0
- package/src/parser/rules/inline/html/gate.ts +64 -0
- package/src/parser/rules/inline/html/index.ts +81 -0
- package/src/parser/rules/inline/html/open.ts +37 -0
- package/src/parser/rules/inline/image/attributes.ts +22 -0
- package/src/parser/rules/inline/image/body.ts +36 -0
- package/src/parser/rules/inline/image/index.ts +89 -0
- package/src/parser/rules/inline/image/open.ts +56 -0
- package/src/parser/rules/inline/image/source.ts +62 -0
- package/src/parser/rules/inline/image/syntax.ts +76 -0
- package/src/parser/rules/inline/index.ts +150 -0
- package/src/parser/rules/inline/italic.ts +46 -0
- package/src/parser/rules/inline/line-break/backslash.ts +58 -0
- package/src/parser/rules/inline/line-break/elements.ts +9 -0
- package/src/parser/rules/inline/line-break/index.ts +3 -0
- package/src/parser/rules/inline/line-break/newline.ts +82 -0
- package/src/parser/rules/inline/line-break/underscore.ts +45 -0
- package/src/parser/rules/inline/link-anchor.ts +72 -0
- package/src/parser/rules/inline/link-bracket/anchor.ts +3 -0
- package/src/parser/rules/inline/link-bracket/direct-url.ts +5 -0
- package/src/parser/rules/inline/link-bracket/parsed.ts +81 -0
- package/src/parser/rules/inline/link-bracket/parts.ts +64 -0
- package/src/parser/rules/inline/link-bracket/prefix.ts +15 -0
- package/src/parser/rules/inline/link-single.ts +73 -0
- package/src/parser/rules/inline/link-star.ts +72 -0
- package/src/parser/rules/inline/link-triple/fallback.ts +10 -0
- package/src/parser/rules/inline/link-triple/index.ts +62 -0
- package/src/parser/rules/inline/link-triple/interwiki.ts +11 -0
- package/src/parser/rules/inline/link-triple/label.ts +35 -0
- package/src/parser/rules/inline/link-triple/syntax.ts +72 -0
- package/src/parser/rules/inline/link-triple/target.ts +36 -0
- package/src/parser/rules/inline/math-inline/index.ts +40 -0
- package/src/parser/rules/inline/math-inline/syntax.ts +55 -0
- package/src/parser/rules/inline/monospace.ts +50 -0
- package/src/parser/rules/inline/parsing/block-boundary.ts +42 -0
- package/src/parser/rules/inline/parsing/block-start-predicates.ts +117 -0
- package/src/parser/rules/inline/parsing/collect.ts +23 -0
- package/src/parser/rules/inline/parsing/inline-content.ts +115 -0
- package/src/parser/rules/inline/parsing/paragraph-boundary.ts +47 -0
- package/src/parser/rules/inline/parsing/plain-text.ts +69 -0
- package/src/parser/rules/inline/parsing/preserved-line-break.ts +11 -0
- package/src/parser/rules/inline/parsing/rules.ts +34 -0
- package/src/parser/rules/inline/parsing/simple-token.ts +26 -0
- package/src/parser/rules/inline/raw/angle.ts +40 -0
- package/src/parser/rules/inline/raw/double-at.ts +78 -0
- package/src/parser/rules/inline/raw/index.ts +26 -0
- package/src/parser/rules/inline/raw/result.ts +26 -0
- package/src/parser/rules/inline/size/content.ts +65 -0
- package/src/parser/rules/inline/size/index.ts +55 -0
- package/src/parser/rules/inline/size/open.ts +43 -0
- package/src/parser/rules/inline/size/value.ts +45 -0
- package/src/parser/rules/inline/span/content.ts +97 -0
- package/src/parser/rules/inline/span/elements.ts +108 -0
- package/src/parser/rules/inline/span/index.ts +79 -0
- package/src/parser/rules/inline/span/newline.ts +50 -0
- package/src/parser/rules/inline/span/syntax.ts +70 -0
- package/src/parser/rules/inline/strikethrough/index.ts +60 -0
- package/src/parser/rules/inline/strikethrough/parse.ts +14 -0
- package/src/parser/rules/inline/strikethrough/syntax.ts +24 -0
- package/src/parser/rules/inline/subscript.ts +47 -0
- package/src/parser/rules/inline/superscript.ts +49 -0
- package/src/parser/rules/inline/text/element.ts +5 -0
- package/src/parser/rules/inline/text/index.ts +85 -0
- package/src/parser/rules/inline/underline/child.ts +26 -0
- package/src/parser/rules/inline/underline/content.ts +29 -0
- package/src/parser/rules/inline/underline/index.ts +84 -0
- package/src/parser/rules/inline/user/element.ts +11 -0
- package/src/parser/rules/inline/user/index.ts +34 -0
- package/src/parser/rules/inline/user/syntax.ts +67 -0
- package/src/parser/rules/inline/utils.ts +4 -0
- package/src/parser/rules/tokens.ts +106 -0
- package/src/parser/rules/types.ts +9 -0
- package/src/parser/toc.ts +130 -0
|
@@ -0,0 +1,129 @@
|
|
|
1
|
+
import type { Element, ParseResult } from "@wdprlib/ast";
|
|
2
|
+
|
|
3
|
+
const LARGE_PLAIN_TEXT_MIN_LENGTH = 100_000;
|
|
4
|
+
|
|
5
|
+
export function parsePlainNonAsciiDocument(source: string): ParseResult | null {
|
|
6
|
+
if (!isPlainNonAsciiDocument(source)) {
|
|
7
|
+
return null;
|
|
8
|
+
}
|
|
9
|
+
|
|
10
|
+
const text = trimNewlineEdges(source);
|
|
11
|
+
const elements = text === "" ? [] : buildPlainParagraphs(text);
|
|
12
|
+
|
|
13
|
+
elements.push({
|
|
14
|
+
element: "footnote-block",
|
|
15
|
+
data: { title: null, hide: false },
|
|
16
|
+
});
|
|
17
|
+
|
|
18
|
+
return { ast: { elements }, diagnostics: [] };
|
|
19
|
+
}
|
|
20
|
+
|
|
21
|
+
function isPlainNonAsciiDocument(source: string): boolean {
|
|
22
|
+
for (let i = 0; i < source.length; i++) {
|
|
23
|
+
const code = source.charCodeAt(i);
|
|
24
|
+
if ((code >= 0x00 && code <= 0x09) || (code >= 0x0b && code <= 0x7f) || code === 0xe000) {
|
|
25
|
+
return false;
|
|
26
|
+
}
|
|
27
|
+
}
|
|
28
|
+
|
|
29
|
+
return true;
|
|
30
|
+
}
|
|
31
|
+
|
|
32
|
+
export function parseLargePlainTextDocument(source: string): ParseResult | null {
|
|
33
|
+
if (source.length < LARGE_PLAIN_TEXT_MIN_LENGTH || hasWikitextSyntaxCandidate(source)) {
|
|
34
|
+
return null;
|
|
35
|
+
}
|
|
36
|
+
|
|
37
|
+
const text = trimNewlineEdges(source);
|
|
38
|
+
const elements = text === "" ? [] : buildPlainParagraphs(text);
|
|
39
|
+
|
|
40
|
+
elements.push({
|
|
41
|
+
element: "footnote-block",
|
|
42
|
+
data: { title: null, hide: false },
|
|
43
|
+
});
|
|
44
|
+
|
|
45
|
+
return { ast: { elements }, diagnostics: [] };
|
|
46
|
+
}
|
|
47
|
+
|
|
48
|
+
function hasWikitextSyntaxCandidate(source: string): boolean {
|
|
49
|
+
for (let i = 0; i < source.length; i++) {
|
|
50
|
+
switch (source.charCodeAt(i)) {
|
|
51
|
+
case 42: // *
|
|
52
|
+
case 43: // +
|
|
53
|
+
case 47: // /
|
|
54
|
+
case 60: // <
|
|
55
|
+
case 61: // =
|
|
56
|
+
case 62: // >
|
|
57
|
+
case 64: // @
|
|
58
|
+
case 91: // [
|
|
59
|
+
case 92: // \
|
|
60
|
+
case 93: // ]
|
|
61
|
+
case 94: // ^
|
|
62
|
+
case 95: // _
|
|
63
|
+
case 124: // |
|
|
64
|
+
case 126: // ~
|
|
65
|
+
case 0xe000:
|
|
66
|
+
return true;
|
|
67
|
+
case 35: // #
|
|
68
|
+
if (isLineStart(source, i)) return true;
|
|
69
|
+
break;
|
|
70
|
+
case 45: // -
|
|
71
|
+
if (source.charCodeAt(i + 1) === 45) return true;
|
|
72
|
+
break;
|
|
73
|
+
case 44: // ,
|
|
74
|
+
if (source.charCodeAt(i + 1) === 44) return true;
|
|
75
|
+
break;
|
|
76
|
+
case 123: // {
|
|
77
|
+
if (source.charCodeAt(i + 1) === 123) return true;
|
|
78
|
+
break;
|
|
79
|
+
case 125: // }
|
|
80
|
+
if (source.charCodeAt(i + 1) === 125) return true;
|
|
81
|
+
break;
|
|
82
|
+
}
|
|
83
|
+
}
|
|
84
|
+
|
|
85
|
+
return false;
|
|
86
|
+
}
|
|
87
|
+
|
|
88
|
+
function isLineStart(source: string, index: number): boolean {
|
|
89
|
+
if (index === 0) return true;
|
|
90
|
+
const prev = source.charCodeAt(index - 1);
|
|
91
|
+
return prev === 10 || prev === 13;
|
|
92
|
+
}
|
|
93
|
+
|
|
94
|
+
function trimNewlineEdges(source: string): string {
|
|
95
|
+
let start = 0;
|
|
96
|
+
let end = source.length;
|
|
97
|
+
while (start < end && source.charCodeAt(start) === 10) start++;
|
|
98
|
+
while (end > start && source.charCodeAt(end - 1) === 10) end--;
|
|
99
|
+
return start === 0 && end === source.length ? source : source.slice(start, end);
|
|
100
|
+
}
|
|
101
|
+
|
|
102
|
+
function buildPlainParagraphs(text: string): Element[] {
|
|
103
|
+
const paragraphs =
|
|
104
|
+
text.indexOf("\n\n") === -1 ? [text] : text.split(/\n{2,}/).filter((part) => part !== "");
|
|
105
|
+
|
|
106
|
+
return paragraphs.map((paragraphText) => ({
|
|
107
|
+
element: "container",
|
|
108
|
+
data: {
|
|
109
|
+
type: "paragraph",
|
|
110
|
+
attributes: {},
|
|
111
|
+
elements: buildPlainParagraphElements(paragraphText),
|
|
112
|
+
},
|
|
113
|
+
}));
|
|
114
|
+
}
|
|
115
|
+
|
|
116
|
+
function buildPlainParagraphElements(text: string): Element[] {
|
|
117
|
+
const lines = text.split("\n");
|
|
118
|
+
const elements: Element[] = Array.from({ length: lines.length * 2 - 1 });
|
|
119
|
+
let out = 0;
|
|
120
|
+
|
|
121
|
+
for (let i = 0; i < lines.length; i++) {
|
|
122
|
+
elements[out++] = { element: "text", data: lines[i]! };
|
|
123
|
+
if (i !== lines.length - 1) {
|
|
124
|
+
elements[out++] = { element: "line-break" };
|
|
125
|
+
}
|
|
126
|
+
}
|
|
127
|
+
|
|
128
|
+
return elements;
|
|
129
|
+
}
|
|
@@ -0,0 +1,57 @@
|
|
|
1
|
+
import type { Element, ParseResult, SyntaxTree } from "@wdprlib/ast";
|
|
2
|
+
import type { ParseContext } from "../rules";
|
|
3
|
+
import {
|
|
4
|
+
cleanInternalFlags,
|
|
5
|
+
mergeSpanStripParagraphs,
|
|
6
|
+
suppressDivAdjacentParagraphs,
|
|
7
|
+
} from "../postprocess";
|
|
8
|
+
import { buildTableOfContents } from "../toc";
|
|
9
|
+
import { containsFootnoteBlock } from "./footnotes";
|
|
10
|
+
|
|
11
|
+
export function finalizeParseResult(ctx: ParseContext, children: Element[]): ParseResult {
|
|
12
|
+
const cleanedChildren = postprocessChildren(children);
|
|
13
|
+
appendImplicitFootnoteBlock(cleanedChildren);
|
|
14
|
+
|
|
15
|
+
return {
|
|
16
|
+
ast: buildSyntaxTree(ctx, cleanedChildren),
|
|
17
|
+
diagnostics: ctx.diagnostics,
|
|
18
|
+
};
|
|
19
|
+
}
|
|
20
|
+
|
|
21
|
+
function postprocessChildren(children: Element[]): Element[] {
|
|
22
|
+
const mergedChildren = mergeSpanStripParagraphs(children);
|
|
23
|
+
const divProcessed = suppressDivAdjacentParagraphs(mergedChildren);
|
|
24
|
+
return cleanInternalFlags(divProcessed);
|
|
25
|
+
}
|
|
26
|
+
|
|
27
|
+
function appendImplicitFootnoteBlock(elements: Element[]): void {
|
|
28
|
+
if (containsFootnoteBlock(elements)) return;
|
|
29
|
+
|
|
30
|
+
elements.push({
|
|
31
|
+
element: "footnote-block",
|
|
32
|
+
data: { title: null, hide: false },
|
|
33
|
+
});
|
|
34
|
+
}
|
|
35
|
+
|
|
36
|
+
function buildSyntaxTree(ctx: ParseContext, elements: Element[]): SyntaxTree {
|
|
37
|
+
const tableOfContents = buildTableOfContents(ctx.tocEntries);
|
|
38
|
+
const result: SyntaxTree = { elements };
|
|
39
|
+
|
|
40
|
+
if (tableOfContents.length > 0) {
|
|
41
|
+
result["table-of-contents"] = tableOfContents;
|
|
42
|
+
}
|
|
43
|
+
|
|
44
|
+
if (ctx.footnotes.length > 0) {
|
|
45
|
+
result.footnotes = ctx.footnotes;
|
|
46
|
+
}
|
|
47
|
+
|
|
48
|
+
if (ctx.codeBlocks.length > 0) {
|
|
49
|
+
result["code-blocks"] = ctx.codeBlocks;
|
|
50
|
+
}
|
|
51
|
+
|
|
52
|
+
if (ctx.htmlBlocks.length > 0) {
|
|
53
|
+
result["html-blocks"] = ctx.htmlBlocks;
|
|
54
|
+
}
|
|
55
|
+
|
|
56
|
+
return result;
|
|
57
|
+
}
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
import { preprocess } from "../preprocess";
|
|
2
|
+
import { preprocessExpr } from "../preprocess/expr";
|
|
3
|
+
import { preprocessIftags } from "../rules/block/module/iftags/preprocess";
|
|
4
|
+
import type { ParserOptions } from "./options";
|
|
5
|
+
|
|
6
|
+
export function prepareSourceForParse(source: string, options: ParserOptions | undefined): string {
|
|
7
|
+
const ifProcessed = preprocessExpr(source);
|
|
8
|
+
const iftagsProcessed =
|
|
9
|
+
options?.pageTags !== undefined ? preprocessIftags(ifProcessed, options.pageTags) : ifProcessed;
|
|
10
|
+
return preprocess(iftagsProcessed);
|
|
11
|
+
}
|
|
@@ -0,0 +1,76 @@
|
|
|
1
|
+
/**
|
|
2
|
+
*
|
|
3
|
+
* Post-processing pass: suppress paragraph wrapping adjacent to div containers.
|
|
4
|
+
*
|
|
5
|
+
* In Wikidot, when a paragraph is a direct sibling of a `<div>` block (no other
|
|
6
|
+
* block elements between them), the `<p>` wrapping is removed and the inner
|
|
7
|
+
* elements are promoted to the parent level.
|
|
8
|
+
*
|
|
9
|
+
* When the unwrapped paragraph follows a div, a line-break element is prepended
|
|
10
|
+
* to represent the newline between the closing `</div>` and the bare text.
|
|
11
|
+
*
|
|
12
|
+
* Examples:
|
|
13
|
+
* `[[div]]inline[[/div]]\n[[div]]\n[[/div]]` → no `<p>` (adjacent to div)
|
|
14
|
+
* `[[div]]inline[[/div]]\n> a\n[[div]]\n[[/div]]` → has `<p>` (blockquote between)
|
|
15
|
+
*
|
|
16
|
+
* @module
|
|
17
|
+
*/
|
|
18
|
+
import type { Element, ContainerData } from "@wdprlib/ast";
|
|
19
|
+
|
|
20
|
+
function isParagraphContainer(el: Element | undefined): boolean {
|
|
21
|
+
if (!el || el.element !== "container") return false;
|
|
22
|
+
return (el.data as ContainerData).type === "paragraph";
|
|
23
|
+
}
|
|
24
|
+
|
|
25
|
+
function isDivContainer(el: Element | undefined): boolean {
|
|
26
|
+
if (!el || el.element !== "container") return false;
|
|
27
|
+
return (el.data as ContainerData).type === "div";
|
|
28
|
+
}
|
|
29
|
+
|
|
30
|
+
/**
|
|
31
|
+
* At a single nesting level, unwrap paragraph containers that are directly
|
|
32
|
+
* adjacent to div containers. A line-break is prepended when the paragraph
|
|
33
|
+
* follows a div.
|
|
34
|
+
*/
|
|
35
|
+
function suppressAtLevel(elements: Element[]): Element[] {
|
|
36
|
+
if (elements.length <= 1) return elements;
|
|
37
|
+
|
|
38
|
+
const unwrap = Array.from({ length: elements.length }, () => false);
|
|
39
|
+
|
|
40
|
+
for (let i = 0; i < elements.length; i++) {
|
|
41
|
+
if (!isParagraphContainer(elements[i])) continue;
|
|
42
|
+
const prevIsDiv = i > 0 && isDivContainer(elements[i - 1]);
|
|
43
|
+
const nextIsDiv = i < elements.length - 1 && isDivContainer(elements[i + 1]);
|
|
44
|
+
if (prevIsDiv || nextIsDiv) {
|
|
45
|
+
unwrap[i] = true;
|
|
46
|
+
}
|
|
47
|
+
}
|
|
48
|
+
|
|
49
|
+
const result: Element[] = [];
|
|
50
|
+
for (let i = 0; i < elements.length; i++) {
|
|
51
|
+
const el = elements[i];
|
|
52
|
+
if (!el) continue;
|
|
53
|
+
|
|
54
|
+
if (unwrap[i] && el.element === "container") {
|
|
55
|
+
const inner = (el.data as ContainerData).elements;
|
|
56
|
+
if (i > 0 && isDivContainer(elements[i - 1])) {
|
|
57
|
+
result.push({ element: "line-break" });
|
|
58
|
+
}
|
|
59
|
+
result.push(...inner);
|
|
60
|
+
} else {
|
|
61
|
+
result.push(el);
|
|
62
|
+
}
|
|
63
|
+
}
|
|
64
|
+
|
|
65
|
+
return result;
|
|
66
|
+
}
|
|
67
|
+
|
|
68
|
+
/**
|
|
69
|
+
* Suppress paragraph wrapping adjacent to div containers.
|
|
70
|
+
*
|
|
71
|
+
* Applied only at the top level. Inside div containers, paragraphs adjacent
|
|
72
|
+
* to nested divs retain their `<p>` wrapping (matching Wikidot behavior).
|
|
73
|
+
*/
|
|
74
|
+
export function suppressDivAdjacentParagraphs(elements: Element[]): Element[] {
|
|
75
|
+
return suppressAtLevel(elements);
|
|
76
|
+
}
|
|
@@ -0,0 +1,15 @@
|
|
|
1
|
+
/**
|
|
2
|
+
*
|
|
3
|
+
* Post-processing pipeline for the parsed AST.
|
|
4
|
+
*
|
|
5
|
+
* After the main parser produces an initial AST, post-processing transforms handle
|
|
6
|
+
* behaviors that cannot be resolved during single-pass parsing. This includes merging
|
|
7
|
+
* paragraphs around `span_` (paragraph-strip) elements, splitting paragraphs at
|
|
8
|
+
* empty `[[#expr ]]` elements, and cleaning internal flags that were used as
|
|
9
|
+
* inter-pass communication markers.
|
|
10
|
+
*
|
|
11
|
+
* @module
|
|
12
|
+
*/
|
|
13
|
+
|
|
14
|
+
export { mergeSpanStripParagraphs, cleanInternalFlags } from "./spanStrip";
|
|
15
|
+
export { suppressDivAdjacentParagraphs } from "./divAdjacentParagraph";
|
|
@@ -0,0 +1,168 @@
|
|
|
1
|
+
import type { DefinitionListItem, Element, ListItem } from "@wdprlib/ast";
|
|
2
|
+
import type { InternalContainerData } from "./predicates";
|
|
3
|
+
|
|
4
|
+
type CleanElements = (elements: Element[]) => Element[];
|
|
5
|
+
|
|
6
|
+
export function cleanElement(el: Element, cleanElements: CleanElements): Element {
|
|
7
|
+
if (el.element === "line-break") {
|
|
8
|
+
return cleanLineBreak(el);
|
|
9
|
+
}
|
|
10
|
+
|
|
11
|
+
if (el.element === "container") {
|
|
12
|
+
return cleanContainer(el, cleanElements);
|
|
13
|
+
}
|
|
14
|
+
|
|
15
|
+
if (el.element === "collapsible") {
|
|
16
|
+
const elements = cleanElements(el.data.elements);
|
|
17
|
+
if (elements === el.data.elements) {
|
|
18
|
+
return el;
|
|
19
|
+
}
|
|
20
|
+
return {
|
|
21
|
+
element: "collapsible",
|
|
22
|
+
data: {
|
|
23
|
+
...el.data,
|
|
24
|
+
elements,
|
|
25
|
+
},
|
|
26
|
+
};
|
|
27
|
+
}
|
|
28
|
+
|
|
29
|
+
if (el.element === "color") {
|
|
30
|
+
const elements = cleanElements(el.data.elements);
|
|
31
|
+
if (elements === el.data.elements) {
|
|
32
|
+
return el;
|
|
33
|
+
}
|
|
34
|
+
return {
|
|
35
|
+
element: "color",
|
|
36
|
+
data: {
|
|
37
|
+
...el.data,
|
|
38
|
+
elements,
|
|
39
|
+
},
|
|
40
|
+
};
|
|
41
|
+
}
|
|
42
|
+
|
|
43
|
+
if (el.element === "list") {
|
|
44
|
+
let items: typeof el.data.items | null = null;
|
|
45
|
+
for (let i = 0; i < el.data.items.length; i++) {
|
|
46
|
+
const item = el.data.items[i]!;
|
|
47
|
+
const cleaned = cleanListItem(item, cleanElements);
|
|
48
|
+
if (items !== null) {
|
|
49
|
+
items.push(cleaned);
|
|
50
|
+
} else if (cleaned !== item) {
|
|
51
|
+
items = el.data.items.slice(0, i);
|
|
52
|
+
items.push(cleaned);
|
|
53
|
+
}
|
|
54
|
+
}
|
|
55
|
+
|
|
56
|
+
if (items === null) {
|
|
57
|
+
return el;
|
|
58
|
+
}
|
|
59
|
+
|
|
60
|
+
return {
|
|
61
|
+
element: "list",
|
|
62
|
+
data: {
|
|
63
|
+
...el.data,
|
|
64
|
+
items,
|
|
65
|
+
},
|
|
66
|
+
};
|
|
67
|
+
}
|
|
68
|
+
|
|
69
|
+
if (el.element === "definition-list") {
|
|
70
|
+
let items: typeof el.data | null = null;
|
|
71
|
+
for (let i = 0; i < el.data.length; i++) {
|
|
72
|
+
const item = el.data[i]!;
|
|
73
|
+
const cleaned = cleanDefinitionListItem(item, cleanElements);
|
|
74
|
+
if (items !== null) {
|
|
75
|
+
items.push(cleaned);
|
|
76
|
+
} else if (cleaned !== item) {
|
|
77
|
+
items = el.data.slice(0, i);
|
|
78
|
+
items.push(cleaned);
|
|
79
|
+
}
|
|
80
|
+
}
|
|
81
|
+
|
|
82
|
+
if (items === null) {
|
|
83
|
+
return el;
|
|
84
|
+
}
|
|
85
|
+
|
|
86
|
+
return {
|
|
87
|
+
element: "definition-list",
|
|
88
|
+
data: items,
|
|
89
|
+
};
|
|
90
|
+
}
|
|
91
|
+
|
|
92
|
+
return el;
|
|
93
|
+
}
|
|
94
|
+
|
|
95
|
+
function cleanLineBreak(el: Element): Element {
|
|
96
|
+
for (const key in el) {
|
|
97
|
+
if (key !== "element") {
|
|
98
|
+
return { element: "line-break" };
|
|
99
|
+
}
|
|
100
|
+
}
|
|
101
|
+
return el;
|
|
102
|
+
}
|
|
103
|
+
|
|
104
|
+
function cleanContainer(
|
|
105
|
+
el: Extract<Element, { element: "container" }>,
|
|
106
|
+
cleanElements: CleanElements,
|
|
107
|
+
): Element {
|
|
108
|
+
const data = el.data as InternalContainerData;
|
|
109
|
+
const elements = cleanElements(data.elements);
|
|
110
|
+
const hasInternalFlags =
|
|
111
|
+
data._paragraphStrip !== undefined ||
|
|
112
|
+
data._emptyParagraphStrip !== undefined ||
|
|
113
|
+
data._escapedFromParagraph !== undefined ||
|
|
114
|
+
data._splitByBlankLine !== undefined;
|
|
115
|
+
|
|
116
|
+
if (!hasInternalFlags && elements === data.elements) {
|
|
117
|
+
return el;
|
|
118
|
+
}
|
|
119
|
+
|
|
120
|
+
return {
|
|
121
|
+
element: "container",
|
|
122
|
+
data: {
|
|
123
|
+
type: data.type,
|
|
124
|
+
attributes: data.attributes,
|
|
125
|
+
elements,
|
|
126
|
+
},
|
|
127
|
+
};
|
|
128
|
+
}
|
|
129
|
+
|
|
130
|
+
function cleanListItem(item: ListItem, cleanElements: CleanElements): ListItem {
|
|
131
|
+
if (item["item-type"] === "elements") {
|
|
132
|
+
const elements = cleanElements(item.elements);
|
|
133
|
+
return elements === item.elements
|
|
134
|
+
? item
|
|
135
|
+
: {
|
|
136
|
+
...item,
|
|
137
|
+
elements,
|
|
138
|
+
};
|
|
139
|
+
}
|
|
140
|
+
|
|
141
|
+
if (item["item-type"] === "sub-list") {
|
|
142
|
+
const cleanedList = cleanElement({ element: "list", data: item.data }, cleanElements);
|
|
143
|
+
return cleanedList.element === "list" && cleanedList.data !== item.data
|
|
144
|
+
? {
|
|
145
|
+
"item-type": "sub-list",
|
|
146
|
+
element: "list",
|
|
147
|
+
data: cleanedList.data,
|
|
148
|
+
}
|
|
149
|
+
: item;
|
|
150
|
+
}
|
|
151
|
+
|
|
152
|
+
return item;
|
|
153
|
+
}
|
|
154
|
+
|
|
155
|
+
function cleanDefinitionListItem(
|
|
156
|
+
item: DefinitionListItem,
|
|
157
|
+
cleanElements: CleanElements,
|
|
158
|
+
): DefinitionListItem {
|
|
159
|
+
const key = cleanElements(item.key);
|
|
160
|
+
const value = cleanElements(item.value);
|
|
161
|
+
return key === item.key && value === item.value
|
|
162
|
+
? item
|
|
163
|
+
: {
|
|
164
|
+
...item,
|
|
165
|
+
key,
|
|
166
|
+
value,
|
|
167
|
+
};
|
|
168
|
+
}
|
|
@@ -0,0 +1,25 @@
|
|
|
1
|
+
import type { Element } from "@wdprlib/ast";
|
|
2
|
+
import { cleanElement } from "./clean-element";
|
|
3
|
+
import { removeEmptySpansAndAdjacentWhitespace } from "./empty-spans";
|
|
4
|
+
|
|
5
|
+
/**
|
|
6
|
+
* Recursively remove internal flags from AST elements and clean up empty spans.
|
|
7
|
+
*/
|
|
8
|
+
export function cleanInternalFlags(elements: Element[]): Element[] {
|
|
9
|
+
let cleaned: Element[] | null = null;
|
|
10
|
+
|
|
11
|
+
for (let i = 0; i < elements.length; i++) {
|
|
12
|
+
const el = elements[i];
|
|
13
|
+
if (!el) continue;
|
|
14
|
+
|
|
15
|
+
const next = cleanElement(el, cleanInternalFlags);
|
|
16
|
+
if (cleaned !== null) {
|
|
17
|
+
cleaned.push(next);
|
|
18
|
+
} else if (next !== el) {
|
|
19
|
+
cleaned = elements.slice(0, i);
|
|
20
|
+
cleaned.push(next);
|
|
21
|
+
}
|
|
22
|
+
}
|
|
23
|
+
|
|
24
|
+
return removeEmptySpansAndAdjacentWhitespace(cleaned ?? elements);
|
|
25
|
+
}
|
|
@@ -0,0 +1,36 @@
|
|
|
1
|
+
import type { Element } from "@wdprlib/ast";
|
|
2
|
+
import { isEmptySpan, isWhitespaceText } from "./predicates";
|
|
3
|
+
|
|
4
|
+
export function removeEmptySpansAndAdjacentWhitespace(elements: Element[]): Element[] {
|
|
5
|
+
let hasEmptySpan = false;
|
|
6
|
+
for (const el of elements) {
|
|
7
|
+
if (el && isEmptySpan(el)) {
|
|
8
|
+
hasEmptySpan = true;
|
|
9
|
+
break;
|
|
10
|
+
}
|
|
11
|
+
}
|
|
12
|
+
if (!hasEmptySpan) {
|
|
13
|
+
return elements;
|
|
14
|
+
}
|
|
15
|
+
|
|
16
|
+
const result: Element[] = [];
|
|
17
|
+
|
|
18
|
+
for (let i = 0; i < elements.length; i++) {
|
|
19
|
+
const el = elements[i];
|
|
20
|
+
if (!el) continue;
|
|
21
|
+
|
|
22
|
+
if (isEmptySpan(el)) {
|
|
23
|
+
if (result.length > 0 && isWhitespaceText(result[result.length - 1]!)) {
|
|
24
|
+
result.pop();
|
|
25
|
+
}
|
|
26
|
+
while (i + 1 < elements.length && elements[i + 1] && isWhitespaceText(elements[i + 1]!)) {
|
|
27
|
+
i++;
|
|
28
|
+
}
|
|
29
|
+
continue;
|
|
30
|
+
}
|
|
31
|
+
|
|
32
|
+
result.push(el);
|
|
33
|
+
}
|
|
34
|
+
|
|
35
|
+
return result;
|
|
36
|
+
}
|
|
@@ -0,0 +1,78 @@
|
|
|
1
|
+
import type { Element } from "@wdprlib/ast";
|
|
2
|
+
import { spanElement } from "./factory";
|
|
3
|
+
import {
|
|
4
|
+
getContainerData,
|
|
5
|
+
isEscapedSpan,
|
|
6
|
+
isSpanStripMarker,
|
|
7
|
+
type InternalContainerData,
|
|
8
|
+
} from "./predicates";
|
|
9
|
+
|
|
10
|
+
export function extractEscapedSpans(children: Element[]): Element[] {
|
|
11
|
+
const escaped: Element[] = [];
|
|
12
|
+
|
|
13
|
+
let firstEscapedIndex = -1;
|
|
14
|
+
for (let i = 0; i < children.length; i++) {
|
|
15
|
+
const child = children[i];
|
|
16
|
+
if (child && isEscapedSpan(child)) {
|
|
17
|
+
firstEscapedIndex = i;
|
|
18
|
+
break;
|
|
19
|
+
}
|
|
20
|
+
}
|
|
21
|
+
|
|
22
|
+
if (firstEscapedIndex === -1) {
|
|
23
|
+
return escaped;
|
|
24
|
+
}
|
|
25
|
+
|
|
26
|
+
let currentSpanChildren: Element[] = [];
|
|
27
|
+
|
|
28
|
+
for (let i = firstEscapedIndex; i < children.length; i++) {
|
|
29
|
+
const child = children[i];
|
|
30
|
+
if (!child) continue;
|
|
31
|
+
|
|
32
|
+
if (isEscapedSpan(child)) {
|
|
33
|
+
if (currentSpanChildren.length > 0) {
|
|
34
|
+
escaped.push(spanElement(currentSpanChildren));
|
|
35
|
+
currentSpanChildren = [];
|
|
36
|
+
}
|
|
37
|
+
escaped.push(child);
|
|
38
|
+
} else if (isSpanStripMarker(child)) {
|
|
39
|
+
const childData = getContainerData(child);
|
|
40
|
+
if (childData) {
|
|
41
|
+
escaped.push(spanElement(childData.elements, childData.attributes));
|
|
42
|
+
}
|
|
43
|
+
} else {
|
|
44
|
+
currentSpanChildren.push(child);
|
|
45
|
+
}
|
|
46
|
+
}
|
|
47
|
+
|
|
48
|
+
if (currentSpanChildren.length > 0) {
|
|
49
|
+
escaped.push(spanElement(currentSpanChildren));
|
|
50
|
+
}
|
|
51
|
+
|
|
52
|
+
children.splice(firstEscapedIndex);
|
|
53
|
+
|
|
54
|
+
return escaped;
|
|
55
|
+
}
|
|
56
|
+
|
|
57
|
+
export function removeLineBreaksAroundSpanStrip(children: Element[]): void {
|
|
58
|
+
for (let i = children.length - 1; i >= 0; i--) {
|
|
59
|
+
const child = children[i];
|
|
60
|
+
if (!child) continue;
|
|
61
|
+
|
|
62
|
+
if (child.element === "line-break") {
|
|
63
|
+
const prev = children[i - 1];
|
|
64
|
+
const next = children[i + 1];
|
|
65
|
+
if (isSpanStripMarker(prev) || isSpanStripMarker(next)) {
|
|
66
|
+
children.splice(i, 1);
|
|
67
|
+
continue;
|
|
68
|
+
}
|
|
69
|
+
}
|
|
70
|
+
|
|
71
|
+
if (child.element === "container") {
|
|
72
|
+
const data = child.data as InternalContainerData;
|
|
73
|
+
if (data.type === "span" && data._emptyParagraphStrip) {
|
|
74
|
+
children.splice(i, 1);
|
|
75
|
+
}
|
|
76
|
+
}
|
|
77
|
+
}
|
|
78
|
+
}
|
|
@@ -0,0 +1,23 @@
|
|
|
1
|
+
import type { Element } from "@wdprlib/ast";
|
|
2
|
+
|
|
3
|
+
export function paragraphElement(elements: Element[]): Element {
|
|
4
|
+
return {
|
|
5
|
+
element: "container",
|
|
6
|
+
data: {
|
|
7
|
+
type: "paragraph",
|
|
8
|
+
attributes: {},
|
|
9
|
+
elements,
|
|
10
|
+
},
|
|
11
|
+
};
|
|
12
|
+
}
|
|
13
|
+
|
|
14
|
+
export function spanElement(elements: Element[], attributes: Record<string, string> = {}): Element {
|
|
15
|
+
return {
|
|
16
|
+
element: "container",
|
|
17
|
+
data: {
|
|
18
|
+
type: "span",
|
|
19
|
+
attributes,
|
|
20
|
+
elements,
|
|
21
|
+
},
|
|
22
|
+
};
|
|
23
|
+
}
|