@wdprlib/parser 3.2.0 → 4.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/index.cjs +10451 -8402
- package/dist/index.d.cts +313 -337
- package/dist/index.d.ts +313 -337
- package/dist/index.js +10438 -8389
- package/package.json +1 -1
- package/src/index.ts +7 -0
- package/src/lexer/anchor.ts +48 -0
- package/src/lexer/index.ts +3 -2
- package/src/lexer/lexer.ts +73 -559
- package/src/lexer/options.ts +19 -0
- package/src/lexer/punctuation.ts +70 -0
- package/src/lexer/quoted-string.ts +16 -0
- package/src/lexer/runs.ts +85 -0
- package/src/lexer/spacing-actions.ts +24 -0
- package/src/lexer/state.ts +103 -0
- package/src/lexer/syntax-actions.ts +80 -0
- package/src/lexer/text-actions.ts +41 -0
- package/src/lexer/token-actions.ts +136 -0
- package/src/lexer/token-factory.ts +62 -0
- package/src/lexer/tokenize.ts +18 -0
- package/src/parser/constants.ts +2 -0
- package/src/parser/depth/index.ts +111 -0
- package/src/parser/depth/stack.ts +82 -0
- package/src/parser/parse/block.ts +42 -0
- package/src/parser/parse/context.ts +26 -0
- package/src/parser/parse/footnotes.ts +25 -0
- package/src/parser/parse/index.ts +42 -0
- package/src/parser/parse/options.ts +34 -0
- package/src/parser/parse/parser.ts +79 -0
- package/src/parser/parse/plain-non-ascii.ts +129 -0
- package/src/parser/parse/result.ts +57 -0
- package/src/parser/parse/source.ts +11 -0
- package/src/parser/postprocess/divAdjacentParagraph.ts +1 -1
- package/src/parser/postprocess/spanStrip/clean-element.ts +168 -0
- package/src/parser/postprocess/spanStrip/cleanup.ts +25 -0
- package/src/parser/postprocess/spanStrip/empty-spans.ts +36 -0
- package/src/parser/postprocess/spanStrip/escaped.ts +78 -0
- package/src/parser/postprocess/spanStrip/factory.ts +23 -0
- package/src/parser/postprocess/spanStrip/index.ts +8 -0
- package/src/parser/postprocess/spanStrip/merge.ts +117 -0
- package/src/parser/postprocess/spanStrip/predicates.ts +59 -0
- package/src/parser/postprocess/spanStrip/split.ts +67 -0
- package/src/parser/preprocess/expr/chars.ts +15 -0
- package/src/parser/preprocess/expr/evaluate.ts +22 -0
- package/src/parser/preprocess/expr/index.ts +45 -0
- package/src/parser/preprocess/expr/kind.ts +19 -0
- package/src/parser/preprocess/expr/parse.ts +103 -0
- package/src/parser/preprocess/expr/scan.ts +34 -0
- package/src/parser/preprocess/expr/types.ts +14 -0
- package/src/parser/preprocess/typography.ts +70 -5
- package/src/parser/preprocess/utils/bracket-depths.ts +98 -0
- package/src/parser/preprocess/utils/index.ts +13 -0
- package/src/parser/preprocess/utils/raw-regions.ts +153 -0
- package/src/parser/preprocess/whitespace/detection.ts +39 -0
- package/src/parser/preprocess/whitespace/index.ts +79 -0
- package/src/parser/preprocess/whitespace/leading-spaces.ts +11 -0
- package/src/parser/preprocess/whitespace/patterns.ts +23 -0
- package/src/parser/rules/block/align/body.ts +46 -0
- package/src/parser/rules/block/align/element.ts +13 -0
- package/src/parser/rules/block/align/index.ts +90 -0
- package/src/parser/rules/block/align/syntax.ts +113 -0
- package/src/parser/rules/block/bibliography/body.ts +81 -0
- package/src/parser/rules/block/bibliography/entries.ts +49 -0
- package/src/parser/rules/block/bibliography/entry-content.ts +73 -0
- package/src/parser/rules/block/bibliography/entry-key.ts +83 -0
- package/src/parser/rules/block/bibliography/index.ts +90 -0
- package/src/parser/rules/block/bibliography/open.ts +53 -0
- package/src/parser/rules/block/block-list/bare-content.ts +105 -0
- package/src/parser/rules/block/block-list/bare-paragraph.ts +60 -0
- package/src/parser/rules/block/block-list/index.ts +51 -0
- package/src/parser/rules/block/block-list/item-content.ts +132 -0
- package/src/parser/rules/block/block-list/li-content.ts +107 -0
- package/src/parser/rules/block/block-list/li-item.ts +77 -0
- package/src/parser/rules/block/block-list/list-block.ts +100 -0
- package/src/parser/rules/block/block-list/open.ts +51 -0
- package/src/parser/rules/block/block-list/tags.ts +50 -0
- package/src/parser/rules/block/blockquote/build.ts +62 -0
- package/src/parser/rules/block/blockquote/index.ts +80 -0
- package/src/parser/rules/block/blockquote/line.ts +79 -0
- package/src/parser/rules/block/blockquote/lines.ts +39 -0
- package/src/parser/rules/block/{center.ts → center/index.ts} +7 -22
- package/src/parser/rules/block/center/open.ts +27 -0
- package/src/parser/rules/block/{clear-float.ts → clear-float/index.ts} +6 -30
- package/src/parser/rules/block/clear-float/syntax.ts +43 -0
- package/src/parser/rules/block/code/attributes.ts +30 -0
- package/src/parser/rules/block/code/content.ts +57 -0
- package/src/parser/rules/block/code/index.ts +100 -0
- package/src/parser/rules/block/collapsible/attributes.ts +95 -0
- package/src/parser/rules/block/collapsible/body.ts +69 -0
- package/src/parser/rules/block/collapsible/index.ts +117 -0
- package/src/parser/rules/block/collapsible/open.ts +51 -0
- package/src/parser/rules/block/collapsible/orphans.ts +31 -0
- package/src/parser/rules/block/collapsible/tags.ts +17 -0
- package/src/parser/rules/block/comment/consume.ts +37 -0
- package/src/parser/rules/block/{comment.ts → comment/index.ts} +12 -38
- package/src/parser/rules/block/{content-separator.ts → content-separator/index.ts} +5 -35
- package/src/parser/rules/block/content-separator/syntax.ts +33 -0
- package/src/parser/rules/block/definition-list/collect.ts +40 -0
- package/src/parser/rules/block/definition-list/index.ts +63 -0
- package/src/parser/rules/block/definition-list/item-key.ts +95 -0
- package/src/parser/rules/block/definition-list/item-value.ts +56 -0
- package/src/parser/rules/block/definition-list/items.ts +54 -0
- package/src/parser/rules/block/div/body.ts +41 -0
- package/src/parser/rules/block/div/close.ts +41 -0
- package/src/parser/rules/block/div/failed.ts +117 -0
- package/src/parser/rules/block/div/index.ts +112 -0
- package/src/parser/rules/block/div/nesting.ts +37 -0
- package/src/parser/rules/block/div/open.ts +59 -0
- package/src/parser/rules/block/div/paragraph-strip.ts +44 -0
- package/src/parser/rules/block/embed-block/content.ts +53 -0
- package/src/parser/rules/block/embed-block/index.ts +91 -0
- package/src/parser/rules/block/embed-block/open.ts +52 -0
- package/src/parser/rules/block/embed-block/tags.ts +5 -0
- package/src/parser/rules/block/footnoteblock/attributes.ts +73 -0
- package/src/parser/rules/block/footnoteblock/index.ts +82 -0
- package/src/parser/rules/block/footnoteblock/open.ts +53 -0
- package/src/parser/rules/block/heading/index.ts +87 -0
- package/src/parser/rules/block/heading/open.ts +50 -0
- package/src/parser/rules/block/heading/toc-text.ts +26 -0
- package/src/parser/rules/block/{horizontal-rule.ts → horizontal-rule/index.ts} +4 -21
- package/src/parser/rules/block/horizontal-rule/syntax.ts +21 -0
- package/src/parser/rules/block/html/body.ts +114 -0
- package/src/parser/rules/block/html/diagnostics.ts +11 -0
- package/src/parser/rules/block/html/index.ts +95 -0
- package/src/parser/rules/block/html/open.ts +36 -0
- package/src/parser/rules/block/iframe/attributes.ts +106 -0
- package/src/parser/rules/block/iframe/index.ts +73 -0
- package/src/parser/rules/block/iframe/open.ts +58 -0
- package/src/parser/rules/block/iframe/source.ts +24 -0
- package/src/parser/rules/block/iframe/url.ts +38 -0
- package/src/parser/rules/block/iftags/body.ts +48 -0
- package/src/parser/rules/block/iftags/condition.ts +24 -0
- package/src/parser/rules/block/{iftags.ts → iftags/index.ts} +16 -58
- package/src/parser/rules/block/include/arguments.ts +48 -0
- package/src/parser/rules/block/include/index.ts +75 -0
- package/src/parser/rules/block/include/location.ts +24 -0
- package/src/parser/rules/block/include/variables.ts +37 -0
- package/src/parser/rules/block/list/index.ts +73 -0
- package/src/parser/rules/block/list/line.ts +77 -0
- package/src/parser/rules/block/list/native.ts +89 -0
- package/src/parser/rules/block/math/content.ts +54 -0
- package/src/parser/rules/block/math/index.ts +106 -0
- package/src/parser/rules/block/math/name.ts +35 -0
- package/src/parser/rules/block/module/body.ts +92 -0
- package/src/parser/rules/block/module/element.ts +33 -0
- package/src/parser/rules/block/module/include/directive.ts +91 -0
- package/src/parser/rules/block/module/include/index.ts +11 -2
- package/src/parser/rules/block/module/include/references.ts +42 -0
- package/src/parser/rules/block/module/include/resolve/cache.ts +44 -0
- package/src/parser/rules/block/module/include/resolve/index.ts +106 -0
- package/src/parser/rules/block/module/include/resolve/iterate.ts +202 -0
- package/src/parser/rules/block/module/include/resolve/replace.ts +31 -0
- package/src/parser/rules/block/module/include/resolve/types.ts +105 -0
- package/src/parser/rules/block/module/include/scanner.ts +121 -0
- package/src/parser/rules/block/module/index.ts +14 -2
- package/src/parser/rules/block/module/listpages/compiler.ts +12 -392
- package/src/parser/rules/block/module/listpages/extract.ts +25 -359
- package/src/parser/rules/block/module/listpages/extraction/listpages.ts +42 -0
- package/src/parser/rules/block/module/listpages/extraction/listusers.ts +30 -0
- package/src/parser/rules/block/module/listpages/extraction/query.ts +51 -0
- package/src/parser/rules/block/module/listpages/extraction/result.ts +18 -0
- package/src/parser/rules/block/module/listpages/extraction/template.ts +96 -0
- package/src/parser/rules/block/module/listpages/extraction/variables.ts +58 -0
- package/src/parser/rules/block/module/listpages/normalization/date-selector.ts +53 -0
- package/src/parser/rules/block/module/listpages/normalization/numeric-selector.ts +32 -0
- package/src/parser/rules/block/module/listpages/normalization/order-parent.ts +82 -0
- package/src/parser/rules/block/module/listpages/normalization/selectors.ts +2 -0
- package/src/parser/rules/block/module/listpages/normalization/tags-category.ts +86 -0
- package/src/parser/rules/block/module/listpages/normalize.ts +8 -324
- package/src/parser/rules/block/module/listpages/resolution/items.ts +43 -0
- package/src/parser/rules/block/module/listpages/resolution/wrapper.ts +42 -0
- package/src/parser/rules/block/module/listpages/resolve.ts +5 -75
- package/src/parser/rules/block/module/listpages/template/format/content.ts +41 -0
- package/src/parser/rules/block/module/listpages/template/format/date.ts +116 -0
- package/src/parser/rules/block/module/listpages/template/format/index.ts +4 -0
- package/src/parser/rules/block/module/listpages/template/format/tags.ts +7 -0
- package/src/parser/rules/block/module/listpages/template/format/user.ts +9 -0
- package/src/parser/rules/block/module/listpages/template/getters/index.ts +36 -0
- package/src/parser/rules/block/module/listpages/template/getters/parameterized.ts +60 -0
- package/src/parser/rules/block/module/listpages/template/getters/simple.ts +65 -0
- package/src/parser/rules/block/module/listpages/template/getters/types.ts +3 -0
- package/src/parser/rules/block/module/listpages/template/syntax.ts +97 -0
- package/src/parser/rules/block/module/listpages/types/data-fetcher.ts +15 -0
- package/src/parser/rules/block/module/listpages/types/data-requirements.ts +52 -0
- package/src/parser/rules/block/module/listpages/types/external-data.ts +77 -0
- package/src/parser/rules/block/module/listpages/types/index.ts +17 -0
- package/src/parser/rules/block/module/listpages/types/normalized-query.ts +120 -0
- package/src/parser/rules/block/module/listpages/types/query.ts +67 -0
- package/src/parser/rules/block/module/listpages/types/template.ts +17 -0
- package/src/parser/rules/block/module/listpages/types/variables.ts +69 -0
- package/src/parser/rules/block/module/listpages/url-resolution/fields.ts +48 -0
- package/src/parser/rules/block/module/listpages/url-resolution/params.ts +19 -0
- package/src/parser/rules/block/module/listpages/url-resolution/query.ts +24 -0
- package/src/parser/rules/block/module/listpages/url-resolution/resolve.ts +53 -0
- package/src/parser/rules/block/module/listpages/url-resolution/value.ts +25 -0
- package/src/parser/rules/block/module/listpages/url-resolver.ts +3 -160
- package/src/parser/rules/block/module/listusers/compiler.ts +4 -25
- package/src/parser/rules/block/module/listusers/extract.ts +4 -9
- package/src/parser/rules/block/module/listusers/getters.ts +21 -0
- package/src/parser/rules/block/module/listusers/variables.ts +15 -0
- package/src/parser/rules/block/module/open.ts +57 -0
- package/src/parser/rules/block/module/resolution/contexts.ts +78 -0
- package/src/parser/rules/block/module/resolution/data-maps.ts +39 -0
- package/src/parser/rules/block/module/resolution/dynamic-modules.ts +93 -0
- package/src/parser/rules/block/module/resolution/styles.ts +53 -0
- package/src/parser/rules/block/module/resolution/walk-resolve.ts +107 -0
- package/src/parser/rules/block/module/resolve.ts +79 -292
- package/src/parser/rules/block/module/rule.ts +56 -0
- package/src/parser/rules/block/module/types-common.ts +11 -0
- package/src/parser/rules/block/module/walk/children.ts +35 -0
- package/src/parser/rules/block/module/walk/index.ts +9 -0
- package/src/parser/rules/block/module/walk/map/index.ts +2 -0
- package/src/parser/rules/block/module/walk/map/stateful-definition-list.ts +25 -0
- package/src/parser/rules/block/module/walk/map/stateful-list.ts +40 -0
- package/src/parser/rules/block/module/walk/map/stateful-table.ts +23 -0
- package/src/parser/rules/block/module/walk/map/stateful-tabs.ts +19 -0
- package/src/parser/rules/block/module/walk/map/stateful.ts +71 -0
- package/src/parser/rules/block/module/walk/map/stateless-definition-list.ts +12 -0
- package/src/parser/rules/block/module/walk/map/stateless-list.ts +29 -0
- package/src/parser/rules/block/module/walk/map/stateless-table.ts +11 -0
- package/src/parser/rules/block/module/walk/map/stateless-tabs.ts +5 -0
- package/src/parser/rules/block/module/walk/map/stateless.ts +51 -0
- package/src/parser/rules/block/module/walk/map/types.ts +6 -0
- package/src/parser/rules/block/module/walk/traverse.ts +65 -0
- package/src/parser/rules/block/orphan-li/content.ts +60 -0
- package/src/parser/rules/block/orphan-li/index.ts +75 -0
- package/src/parser/rules/block/orphan-li/open.ts +25 -0
- package/src/parser/rules/block/orphan-li/tags.ts +40 -0
- package/src/parser/rules/block/paragraph/content.ts +12 -0
- package/src/parser/rules/block/paragraph/index.ts +60 -0
- package/src/parser/rules/block/paragraph/normalize.ts +52 -0
- package/src/parser/rules/block/paragraph/span-markers.ts +52 -0
- package/src/parser/rules/block/parsing/attributes/index.ts +32 -0
- package/src/parser/rules/block/parsing/attributes/names.ts +93 -0
- package/src/parser/rules/block/parsing/attributes/scanner.ts +75 -0
- package/src/parser/rules/block/parsing/attributes/values.ts +26 -0
- package/src/parser/rules/block/parsing/block-item.ts +29 -0
- package/src/parser/rules/block/parsing/content.ts +127 -0
- package/src/parser/rules/block/parsing/end-condition.ts +51 -0
- package/src/parser/rules/block/parsing/inline-content.ts +105 -0
- package/src/parser/rules/block/parsing/inline-newline.ts +41 -0
- package/src/parser/rules/block/parsing/non-boundary.ts +24 -0
- package/src/parser/rules/block/parsing/rule-dispatch.ts +44 -0
- package/src/parser/rules/block/table/index.ts +80 -0
- package/src/parser/rules/block/table/pipe/cell-start.ts +69 -0
- package/src/parser/rules/block/table/pipe/cell.ts +106 -0
- package/src/parser/rules/block/table/pipe/index.ts +2 -0
- package/src/parser/rules/block/table/pipe/row.ts +88 -0
- package/src/parser/rules/block/table/pipe/tokens.ts +14 -0
- package/src/parser/rules/block/table/pipe/trim.ts +50 -0
- package/src/parser/rules/block/table-block/body.ts +79 -0
- package/src/parser/rules/block/table-block/cell-attributes.ts +33 -0
- package/src/parser/rules/block/table-block/cell-boundary.ts +99 -0
- package/src/parser/rules/block/table-block/cell-content/index.ts +88 -0
- package/src/parser/rules/block/table-block/cell-content/segments.ts +134 -0
- package/src/parser/rules/block/table-block/cell-newline.ts +47 -0
- package/src/parser/rules/block/table-block/cell.ts +64 -0
- package/src/parser/rules/block/table-block/index.ts +113 -0
- package/src/parser/rules/block/table-block/row-boundary.ts +75 -0
- package/src/parser/rules/block/table-block/structure.ts +80 -0
- package/src/parser/rules/block/tabview/body.ts +64 -0
- package/src/parser/rules/block/tabview/index.ts +90 -0
- package/src/parser/rules/block/tabview/open.ts +50 -0
- package/src/parser/rules/block/tabview/tab.ts +92 -0
- package/src/parser/rules/block/tabview/tags.ts +30 -0
- package/src/parser/rules/block/toc/element.ts +11 -0
- package/src/parser/rules/block/toc/index.ts +44 -0
- package/src/parser/rules/block/toc/open.ts +84 -0
- package/src/parser/rules/block/utils.ts +10 -610
- package/src/parser/rules/{utils.ts → common/attribute-safety.ts} +3 -49
- package/src/parser/rules/common/block-name.ts +33 -0
- package/src/parser/rules/common/index.ts +2 -0
- package/src/parser/rules/contracts/index.ts +3 -0
- package/src/parser/rules/contracts/parse-context.ts +38 -0
- package/src/parser/rules/contracts/rule.ts +43 -0
- package/src/parser/rules/contracts/scope.ts +31 -0
- package/src/parser/rules/inline/anchor/attributes.ts +54 -0
- package/src/parser/rules/inline/anchor/child.ts +26 -0
- package/src/parser/rules/inline/anchor/close.ts +34 -0
- package/src/parser/rules/inline/anchor/content.ts +59 -0
- package/src/parser/rules/inline/anchor/index.ts +103 -0
- package/src/parser/rules/inline/anchor/newline.ts +26 -0
- package/src/parser/rules/inline/anchor/open.ts +47 -0
- package/src/parser/rules/inline/anchor/paragraph-strip.ts +14 -0
- package/src/parser/rules/inline/anchor/syntax.ts +40 -0
- package/src/parser/rules/inline/anchor-name/index.ts +38 -0
- package/src/parser/rules/inline/anchor-name/name.ts +39 -0
- package/src/parser/rules/inline/anchor-name/syntax.ts +46 -0
- package/src/parser/rules/inline/bibcite/element.ts +14 -0
- package/src/parser/rules/inline/bibcite/index.ts +34 -0
- package/src/parser/rules/inline/bibcite/syntax.ts +64 -0
- package/src/parser/rules/inline/bold.ts +2 -39
- package/src/parser/rules/inline/color/index.ts +35 -0
- package/src/parser/rules/inline/color/syntax.ts +69 -0
- package/src/parser/rules/inline/comment/consume.ts +31 -0
- package/src/parser/rules/inline/{comment.ts → comment/index.ts} +10 -36
- package/src/parser/rules/inline/equation-ref/element.ts +8 -0
- package/src/parser/rules/inline/equation-ref/index.ts +34 -0
- package/src/parser/rules/inline/equation-ref/syntax.ts +45 -0
- package/src/parser/rules/inline/expr/branch.ts +104 -0
- package/src/parser/rules/inline/expr/conditional-branch.ts +27 -0
- package/src/parser/rules/inline/expr/conditional.ts +80 -0
- package/src/parser/rules/inline/expr/depth.ts +25 -0
- package/src/parser/rules/inline/expr/elements.ts +39 -0
- package/src/parser/rules/inline/expr/index.ts +84 -0
- package/src/parser/rules/inline/expr/syntax.ts +45 -0
- package/src/parser/rules/inline/footnote/child.ts +22 -0
- package/src/parser/rules/inline/footnote/close.ts +33 -0
- package/src/parser/rules/inline/footnote/content.ts +54 -0
- package/src/parser/rules/inline/footnote/elements.ts +38 -0
- package/src/parser/rules/inline/footnote/index.ts +54 -0
- package/src/parser/rules/inline/footnote/newline.ts +27 -0
- package/src/parser/rules/inline/footnote/open.ts +38 -0
- package/src/parser/rules/inline/formatting/container.ts +50 -0
- package/src/parser/rules/inline/{guillemet.ts → guillemet/index.ts} +5 -13
- package/src/parser/rules/inline/guillemet/text.ts +11 -0
- package/src/parser/rules/inline/html/gate.ts +64 -0
- package/src/parser/rules/inline/{html.ts → html/index.ts} +9 -60
- package/src/parser/rules/inline/html/open.ts +37 -0
- package/src/parser/rules/inline/image/attributes.ts +22 -0
- package/src/parser/rules/inline/image/body.ts +36 -0
- package/src/parser/rules/inline/image/index.ts +89 -0
- package/src/parser/rules/inline/image/open.ts +56 -0
- package/src/parser/rules/inline/image/source.ts +62 -0
- package/src/parser/rules/inline/image/syntax.ts +76 -0
- package/src/parser/rules/inline/italic.ts +2 -30
- package/src/parser/rules/inline/line-break/backslash.ts +58 -0
- package/src/parser/rules/inline/line-break/elements.ts +9 -0
- package/src/parser/rules/inline/line-break/index.ts +3 -0
- package/src/parser/rules/inline/line-break/newline.ts +82 -0
- package/src/parser/rules/inline/line-break/underscore.ts +45 -0
- package/src/parser/rules/inline/link-anchor.ts +6 -81
- package/src/parser/rules/inline/link-bracket/anchor.ts +3 -0
- package/src/parser/rules/inline/link-bracket/direct-url.ts +5 -0
- package/src/parser/rules/inline/link-bracket/parsed.ts +81 -0
- package/src/parser/rules/inline/link-bracket/parts.ts +64 -0
- package/src/parser/rules/inline/link-bracket/prefix.ts +15 -0
- package/src/parser/rules/inline/link-single.ts +7 -98
- package/src/parser/rules/inline/link-star.ts +7 -69
- package/src/parser/rules/inline/link-triple/fallback.ts +10 -0
- package/src/parser/rules/inline/link-triple/index.ts +62 -0
- package/src/parser/rules/inline/link-triple/interwiki.ts +11 -0
- package/src/parser/rules/inline/link-triple/label.ts +35 -0
- package/src/parser/rules/inline/link-triple/syntax.ts +72 -0
- package/src/parser/rules/inline/link-triple/target.ts +36 -0
- package/src/parser/rules/inline/math-inline/index.ts +40 -0
- package/src/parser/rules/inline/math-inline/syntax.ts +55 -0
- package/src/parser/rules/inline/monospace.ts +2 -30
- package/src/parser/rules/inline/parsing/block-boundary.ts +42 -0
- package/src/parser/rules/inline/parsing/block-start-predicates.ts +117 -0
- package/src/parser/rules/inline/parsing/collect.ts +23 -0
- package/src/parser/rules/inline/parsing/inline-content.ts +115 -0
- package/src/parser/rules/inline/parsing/paragraph-boundary.ts +47 -0
- package/src/parser/rules/inline/parsing/plain-text.ts +69 -0
- package/src/parser/rules/inline/parsing/preserved-line-break.ts +11 -0
- package/src/parser/rules/inline/parsing/rules.ts +34 -0
- package/src/parser/rules/inline/parsing/simple-token.ts +26 -0
- package/src/parser/rules/inline/raw/angle.ts +40 -0
- package/src/parser/rules/inline/raw/double-at.ts +78 -0
- package/src/parser/rules/inline/raw/index.ts +26 -0
- package/src/parser/rules/inline/raw/result.ts +26 -0
- package/src/parser/rules/inline/size/content.ts +65 -0
- package/src/parser/rules/inline/size/index.ts +55 -0
- package/src/parser/rules/inline/size/open.ts +43 -0
- package/src/parser/rules/inline/size/value.ts +45 -0
- package/src/parser/rules/inline/span/content.ts +97 -0
- package/src/parser/rules/inline/span/elements.ts +108 -0
- package/src/parser/rules/inline/span/index.ts +79 -0
- package/src/parser/rules/inline/span/newline.ts +50 -0
- package/src/parser/rules/inline/span/syntax.ts +70 -0
- package/src/parser/rules/inline/{strikethrough.ts → strikethrough/index.ts} +5 -60
- package/src/parser/rules/inline/strikethrough/parse.ts +14 -0
- package/src/parser/rules/inline/strikethrough/syntax.ts +24 -0
- package/src/parser/rules/inline/subscript.ts +2 -39
- package/src/parser/rules/inline/superscript.ts +4 -39
- package/src/parser/rules/inline/text/element.ts +5 -0
- package/src/parser/rules/inline/{text.ts → text/index.ts} +5 -4
- package/src/parser/rules/inline/underline/child.ts +26 -0
- package/src/parser/rules/inline/underline/content.ts +29 -0
- package/src/parser/rules/inline/{underline.ts → underline/index.ts} +6 -49
- package/src/parser/rules/inline/user/element.ts +11 -0
- package/src/parser/rules/inline/user/index.ts +34 -0
- package/src/parser/rules/inline/user/syntax.ts +67 -0
- package/src/parser/rules/inline/utils.ts +4 -344
- package/src/parser/rules/tokens.ts +106 -0
- package/src/parser/rules/types.ts +9 -252
- package/src/parser/depth.ts +0 -251
- package/src/parser/parse.ts +0 -315
- package/src/parser/postprocess/spanStrip.ts +0 -697
- package/src/parser/preprocess/expr.ts +0 -265
- package/src/parser/preprocess/utils.ts +0 -250
- package/src/parser/preprocess/whitespace.ts +0 -111
- package/src/parser/rules/block/align.ts +0 -282
- package/src/parser/rules/block/bibliography.ts +0 -359
- package/src/parser/rules/block/block-list.ts +0 -689
- package/src/parser/rules/block/blockquote.ts +0 -238
- package/src/parser/rules/block/code.ts +0 -187
- package/src/parser/rules/block/collapsible.ts +0 -337
- package/src/parser/rules/block/definition-list.ts +0 -270
- package/src/parser/rules/block/div.ts +0 -400
- package/src/parser/rules/block/embed-block.ts +0 -153
- package/src/parser/rules/block/footnoteblock.ts +0 -200
- package/src/parser/rules/block/heading.ts +0 -142
- package/src/parser/rules/block/html.ts +0 -222
- package/src/parser/rules/block/iframe.ts +0 -239
- package/src/parser/rules/block/include.ts +0 -179
- package/src/parser/rules/block/list.ts +0 -244
- package/src/parser/rules/block/math.ts +0 -183
- package/src/parser/rules/block/module/include/resolve.ts +0 -556
- package/src/parser/rules/block/module/listpages/types.ts +0 -513
- package/src/parser/rules/block/module/walk.ts +0 -380
- package/src/parser/rules/block/module.ts +0 -164
- package/src/parser/rules/block/orphan-li.ts +0 -177
- package/src/parser/rules/block/paragraph.ts +0 -157
- package/src/parser/rules/block/table-block.ts +0 -726
- package/src/parser/rules/block/table.ts +0 -441
- package/src/parser/rules/block/tabview.ts +0 -331
- package/src/parser/rules/block/toc.ts +0 -129
- package/src/parser/rules/inline/anchor-name.ts +0 -154
- package/src/parser/rules/inline/anchor.ts +0 -327
- package/src/parser/rules/inline/bibcite.ts +0 -153
- package/src/parser/rules/inline/color.ts +0 -140
- package/src/parser/rules/inline/equation-ref.ts +0 -115
- package/src/parser/rules/inline/expr.ts +0 -526
- package/src/parser/rules/inline/footnote.ts +0 -223
- package/src/parser/rules/inline/image.ts +0 -328
- package/src/parser/rules/inline/line-break.ts +0 -326
- package/src/parser/rules/inline/link-triple.ts +0 -267
- package/src/parser/rules/inline/math-inline.ts +0 -126
- package/src/parser/rules/inline/raw.ts +0 -262
- package/src/parser/rules/inline/size.ts +0 -244
- package/src/parser/rules/inline/span.ts +0 -424
- package/src/parser/rules/inline/user.ts +0 -147
|
@@ -0,0 +1,62 @@
|
|
|
1
|
+
/**
|
|
2
|
+
*
|
|
3
|
+
* Parses the Wikidot triple-bracket link syntax: `[[[target | label]]]`.
|
|
4
|
+
*
|
|
5
|
+
* @module
|
|
6
|
+
*/
|
|
7
|
+
import type { Element } from "@wdprlib/ast";
|
|
8
|
+
import type { InlineRule, ParseContext, RuleResult } from "../../types";
|
|
9
|
+
import { currentToken } from "../../types";
|
|
10
|
+
import { literalOpenLink } from "./fallback";
|
|
11
|
+
import { buildTripleLinkLabel } from "./label";
|
|
12
|
+
import { collectTripleLinkParts, hasClosingLinkMarker } from "./syntax";
|
|
13
|
+
import {
|
|
14
|
+
determineLinkTypeAndLocation,
|
|
15
|
+
isInvalidTripleLinkTarget,
|
|
16
|
+
normalizeTripleLinkTarget,
|
|
17
|
+
} from "./target";
|
|
18
|
+
|
|
19
|
+
export const linkTripleRule: InlineRule = {
|
|
20
|
+
name: "linkTriple",
|
|
21
|
+
startTokens: ["LINK_OPEN"],
|
|
22
|
+
|
|
23
|
+
parse(ctx: ParseContext): RuleResult<Element> {
|
|
24
|
+
const startToken = currentToken(ctx);
|
|
25
|
+
|
|
26
|
+
if (!hasClosingLinkMarker(ctx, ctx.pos + 1)) {
|
|
27
|
+
return literalOpenLink(startToken.value);
|
|
28
|
+
}
|
|
29
|
+
|
|
30
|
+
const parts = collectTripleLinkParts(ctx, ctx.pos + 1);
|
|
31
|
+
const trimmedTarget = parts.target.trim();
|
|
32
|
+
if (isInvalidTripleLinkTarget(trimmedTarget, parts.foundPipe)) {
|
|
33
|
+
return literalOpenLink(startToken.value);
|
|
34
|
+
}
|
|
35
|
+
|
|
36
|
+
const normalized = normalizeTripleLinkTarget(trimmedTarget);
|
|
37
|
+
const { linkType, link } = determineLinkTypeAndLocation(normalized.target);
|
|
38
|
+
const label = buildTripleLinkLabel({
|
|
39
|
+
foundPipe: parts.foundPipe,
|
|
40
|
+
labelText: parts.labelText,
|
|
41
|
+
finalTarget: normalized.target,
|
|
42
|
+
originalTarget: trimmedTarget,
|
|
43
|
+
});
|
|
44
|
+
|
|
45
|
+
return {
|
|
46
|
+
success: true,
|
|
47
|
+
elements: [
|
|
48
|
+
{
|
|
49
|
+
element: "link",
|
|
50
|
+
data: {
|
|
51
|
+
type: linkType,
|
|
52
|
+
link,
|
|
53
|
+
extra: null,
|
|
54
|
+
label,
|
|
55
|
+
target: normalized.hasStar && linkType === "direct" ? "new-tab" : null,
|
|
56
|
+
},
|
|
57
|
+
},
|
|
58
|
+
],
|
|
59
|
+
consumed: parts.consumed,
|
|
60
|
+
};
|
|
61
|
+
},
|
|
62
|
+
};
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
const INTERWIKI_PREFIXES = new Set(["wikipedia", "google", "dictionary", "wikidot"]);
|
|
2
|
+
|
|
3
|
+
export function isInterwikiTarget(target: string): boolean {
|
|
4
|
+
const colonIdx = target.indexOf(":");
|
|
5
|
+
if (colonIdx <= 0 || target.includes("/")) {
|
|
6
|
+
return false;
|
|
7
|
+
}
|
|
8
|
+
|
|
9
|
+
const prefix = target.slice(0, colonIdx).toLowerCase();
|
|
10
|
+
return INTERWIKI_PREFIXES.has(prefix);
|
|
11
|
+
}
|
|
@@ -0,0 +1,35 @@
|
|
|
1
|
+
import type { LinkLabel } from "@wdprlib/ast";
|
|
2
|
+
|
|
3
|
+
export function buildTripleLinkLabel(args: {
|
|
4
|
+
foundPipe: boolean;
|
|
5
|
+
labelText: string;
|
|
6
|
+
finalTarget: string;
|
|
7
|
+
originalTarget: string;
|
|
8
|
+
}): LinkLabel {
|
|
9
|
+
return {
|
|
10
|
+
text: getTripleLinkDisplayText(args),
|
|
11
|
+
};
|
|
12
|
+
}
|
|
13
|
+
|
|
14
|
+
function getTripleLinkDisplayText(args: {
|
|
15
|
+
foundPipe: boolean;
|
|
16
|
+
labelText: string;
|
|
17
|
+
finalTarget: string;
|
|
18
|
+
originalTarget: string;
|
|
19
|
+
}): string {
|
|
20
|
+
const trimmedLabel = args.labelText.trim();
|
|
21
|
+
if (args.foundPipe) {
|
|
22
|
+
return trimmedLabel || args.finalTarget;
|
|
23
|
+
}
|
|
24
|
+
|
|
25
|
+
const colonIdx = args.originalTarget.indexOf(":");
|
|
26
|
+
if (
|
|
27
|
+
colonIdx !== -1 &&
|
|
28
|
+
!args.originalTarget.startsWith("http") &&
|
|
29
|
+
!args.originalTarget.startsWith("*")
|
|
30
|
+
) {
|
|
31
|
+
return args.originalTarget.slice(colonIdx + 1).trim();
|
|
32
|
+
}
|
|
33
|
+
|
|
34
|
+
return args.originalTarget;
|
|
35
|
+
}
|
|
@@ -0,0 +1,72 @@
|
|
|
1
|
+
import type { ParseContext } from "../../types";
|
|
2
|
+
|
|
3
|
+
export interface TripleLinkParts {
|
|
4
|
+
target: string;
|
|
5
|
+
labelText: string;
|
|
6
|
+
foundPipe: boolean;
|
|
7
|
+
consumed: number;
|
|
8
|
+
}
|
|
9
|
+
|
|
10
|
+
export function hasClosingLinkMarker(ctx: ParseContext, startPos: number): boolean {
|
|
11
|
+
let pos = startPos;
|
|
12
|
+
while (pos < ctx.tokens.length) {
|
|
13
|
+
const token = ctx.tokens[pos];
|
|
14
|
+
if (!token || token.type === "EOF") {
|
|
15
|
+
return false;
|
|
16
|
+
}
|
|
17
|
+
if (token.type === "LINK_CLOSE") {
|
|
18
|
+
return true;
|
|
19
|
+
}
|
|
20
|
+
if (token.type === "NEWLINE") {
|
|
21
|
+
const next = ctx.tokens[pos + 1];
|
|
22
|
+
if (next?.type === "NEWLINE" || next?.type === "LINK_CLOSE") {
|
|
23
|
+
return false;
|
|
24
|
+
}
|
|
25
|
+
}
|
|
26
|
+
pos++;
|
|
27
|
+
}
|
|
28
|
+
return false;
|
|
29
|
+
}
|
|
30
|
+
|
|
31
|
+
export function collectTripleLinkParts(ctx: ParseContext, startPos: number): TripleLinkParts {
|
|
32
|
+
let target = "";
|
|
33
|
+
let labelText = "";
|
|
34
|
+
let foundPipe = false;
|
|
35
|
+
let consumed = 1;
|
|
36
|
+
let pos = startPos;
|
|
37
|
+
|
|
38
|
+
while (pos < ctx.tokens.length) {
|
|
39
|
+
const token = ctx.tokens[pos];
|
|
40
|
+
if (!token || token.type === "LINK_CLOSE" || token.type === "EOF") {
|
|
41
|
+
break;
|
|
42
|
+
}
|
|
43
|
+
|
|
44
|
+
if (token.type === "NEWLINE") {
|
|
45
|
+
if (foundPipe) {
|
|
46
|
+
labelText += " ";
|
|
47
|
+
} else {
|
|
48
|
+
target += " ";
|
|
49
|
+
}
|
|
50
|
+
consumed++;
|
|
51
|
+
pos++;
|
|
52
|
+
continue;
|
|
53
|
+
}
|
|
54
|
+
|
|
55
|
+
if (token.type === "PIPE" && !foundPipe) {
|
|
56
|
+
foundPipe = true;
|
|
57
|
+
} else if (foundPipe) {
|
|
58
|
+
labelText += token.value;
|
|
59
|
+
} else {
|
|
60
|
+
target += token.value;
|
|
61
|
+
}
|
|
62
|
+
|
|
63
|
+
consumed++;
|
|
64
|
+
pos++;
|
|
65
|
+
}
|
|
66
|
+
|
|
67
|
+
if (ctx.tokens[pos]?.type === "LINK_CLOSE") {
|
|
68
|
+
consumed++;
|
|
69
|
+
}
|
|
70
|
+
|
|
71
|
+
return { target, labelText, foundPipe, consumed };
|
|
72
|
+
}
|
|
@@ -0,0 +1,36 @@
|
|
|
1
|
+
import type { LinkLocation, LinkType } from "@wdprlib/ast";
|
|
2
|
+
import { isInterwikiTarget } from "./interwiki";
|
|
3
|
+
|
|
4
|
+
export interface TripleLinkTarget {
|
|
5
|
+
target: string;
|
|
6
|
+
hasStar: boolean;
|
|
7
|
+
}
|
|
8
|
+
|
|
9
|
+
export function normalizeTripleLinkTarget(trimmedTarget: string): TripleLinkTarget {
|
|
10
|
+
if (trimmedTarget.startsWith("*")) {
|
|
11
|
+
return { target: trimmedTarget.slice(1), hasStar: true };
|
|
12
|
+
}
|
|
13
|
+
return { target: trimmedTarget, hasStar: false };
|
|
14
|
+
}
|
|
15
|
+
|
|
16
|
+
export function isInvalidTripleLinkTarget(trimmedTarget: string, foundPipe: boolean): boolean {
|
|
17
|
+
return (trimmedTarget === "" && foundPipe) || /#{2,}/.test(trimmedTarget);
|
|
18
|
+
}
|
|
19
|
+
|
|
20
|
+
export function determineLinkTypeAndLocation(target: string): {
|
|
21
|
+
linkType: LinkType;
|
|
22
|
+
link: LinkLocation;
|
|
23
|
+
} {
|
|
24
|
+
if (target.startsWith("#")) {
|
|
25
|
+
return { linkType: "anchor", link: target };
|
|
26
|
+
}
|
|
27
|
+
if (target.startsWith("http://") || target.startsWith("https://")) {
|
|
28
|
+
return { linkType: "direct", link: target };
|
|
29
|
+
}
|
|
30
|
+
|
|
31
|
+
if (isInterwikiTarget(target)) {
|
|
32
|
+
return { linkType: "interwiki", link: target };
|
|
33
|
+
}
|
|
34
|
+
|
|
35
|
+
return { linkType: "page", link: { site: null, page: target } };
|
|
36
|
+
}
|
|
@@ -0,0 +1,40 @@
|
|
|
1
|
+
/**
|
|
2
|
+
*
|
|
3
|
+
* Parses the Wikidot inline math syntax: `[[$ LaTeX $]]`.
|
|
4
|
+
*
|
|
5
|
+
* @module
|
|
6
|
+
*/
|
|
7
|
+
import type { Element } from "@wdprlib/ast";
|
|
8
|
+
import type { InlineRule, ParseContext, RuleResult } from "../../types";
|
|
9
|
+
import { currentToken } from "../../types";
|
|
10
|
+
import { parseInlineMathSource } from "./syntax";
|
|
11
|
+
|
|
12
|
+
export const mathInlineRule: InlineRule = {
|
|
13
|
+
name: "math-inline",
|
|
14
|
+
startTokens: ["BLOCK_OPEN"],
|
|
15
|
+
|
|
16
|
+
parse(ctx: ParseContext): RuleResult<Element> {
|
|
17
|
+
const openToken = currentToken(ctx);
|
|
18
|
+
if (openToken.type !== "BLOCK_OPEN") {
|
|
19
|
+
return { success: false };
|
|
20
|
+
}
|
|
21
|
+
|
|
22
|
+
const parsed = parseInlineMathSource(ctx, ctx.pos + 1);
|
|
23
|
+
if (!parsed) {
|
|
24
|
+
return { success: false };
|
|
25
|
+
}
|
|
26
|
+
|
|
27
|
+
return {
|
|
28
|
+
success: true,
|
|
29
|
+
elements: [
|
|
30
|
+
{
|
|
31
|
+
element: "math-inline",
|
|
32
|
+
data: {
|
|
33
|
+
"latex-source": parsed.latexSource,
|
|
34
|
+
},
|
|
35
|
+
},
|
|
36
|
+
],
|
|
37
|
+
consumed: 1 + parsed.consumed,
|
|
38
|
+
};
|
|
39
|
+
},
|
|
40
|
+
};
|
|
@@ -0,0 +1,55 @@
|
|
|
1
|
+
import type { ParseContext } from "../../types";
|
|
2
|
+
|
|
3
|
+
export function parseInlineMathSource(
|
|
4
|
+
ctx: ParseContext,
|
|
5
|
+
startPos: number,
|
|
6
|
+
): { latexSource: string; consumed: number } | null {
|
|
7
|
+
let pos = startPos;
|
|
8
|
+
let consumed = 0;
|
|
9
|
+
|
|
10
|
+
if (ctx.tokens[pos]?.type !== "TEXT" || ctx.tokens[pos]?.value !== "$") {
|
|
11
|
+
return null;
|
|
12
|
+
}
|
|
13
|
+
pos++;
|
|
14
|
+
consumed++;
|
|
15
|
+
|
|
16
|
+
while (ctx.tokens[pos]?.type === "WHITESPACE") {
|
|
17
|
+
pos++;
|
|
18
|
+
consumed++;
|
|
19
|
+
}
|
|
20
|
+
|
|
21
|
+
let latexSource = "";
|
|
22
|
+
while (pos < ctx.tokens.length) {
|
|
23
|
+
const token = ctx.tokens[pos];
|
|
24
|
+
if (!token || token.type === "NEWLINE") {
|
|
25
|
+
return null;
|
|
26
|
+
}
|
|
27
|
+
|
|
28
|
+
if (
|
|
29
|
+
token.type === "TEXT" &&
|
|
30
|
+
token.value === "$" &&
|
|
31
|
+
ctx.tokens[pos + 1]?.type === "BLOCK_CLOSE"
|
|
32
|
+
) {
|
|
33
|
+
break;
|
|
34
|
+
}
|
|
35
|
+
|
|
36
|
+
latexSource += token.value;
|
|
37
|
+
pos++;
|
|
38
|
+
consumed++;
|
|
39
|
+
}
|
|
40
|
+
|
|
41
|
+
if (ctx.tokens[pos]?.type !== "TEXT" || ctx.tokens[pos]?.value !== "$") {
|
|
42
|
+
return null;
|
|
43
|
+
}
|
|
44
|
+
pos++;
|
|
45
|
+
consumed++;
|
|
46
|
+
|
|
47
|
+
if (ctx.tokens[pos]?.type !== "BLOCK_CLOSE") {
|
|
48
|
+
return null;
|
|
49
|
+
}
|
|
50
|
+
|
|
51
|
+
return {
|
|
52
|
+
latexSource: latexSource.trim(),
|
|
53
|
+
consumed: consumed + 1,
|
|
54
|
+
};
|
|
55
|
+
}
|
|
@@ -21,8 +21,7 @@
|
|
|
21
21
|
*/
|
|
22
22
|
import type { Element } from "@wdprlib/ast";
|
|
23
23
|
import type { InlineRule, ParseContext, RuleResult } from "../types";
|
|
24
|
-
import {
|
|
25
|
-
import { parseInlineUntil } from "./utils";
|
|
24
|
+
import { parseSameLineDelimitedContainer } from "./formatting/container";
|
|
26
25
|
|
|
27
26
|
/**
|
|
28
27
|
* Inline rule for parsing `{{monospace}}` formatting.
|
|
@@ -46,33 +45,6 @@ export const monospaceRule: InlineRule = {
|
|
|
46
45
|
* with `type: "monospace"`, or a text fallback for unmatched markers
|
|
47
46
|
*/
|
|
48
47
|
parse(ctx: ParseContext): RuleResult<Element> {
|
|
49
|
-
|
|
50
|
-
|
|
51
|
-
// Check if closing marker exists
|
|
52
|
-
if (!hasClosingMarkerBeforeNewline({ ...ctx, pos: ctx.pos + 1 }, "MONO_CLOSE")) {
|
|
53
|
-
return {
|
|
54
|
-
success: true,
|
|
55
|
-
elements: [{ element: "text", data: startToken.value }],
|
|
56
|
-
consumed: 1,
|
|
57
|
-
};
|
|
58
|
-
}
|
|
59
|
-
|
|
60
|
-
// Parse content between markers
|
|
61
|
-
const result = parseInlineUntil({ ...ctx, pos: ctx.pos + 1 }, "MONO_CLOSE");
|
|
62
|
-
|
|
63
|
-
return {
|
|
64
|
-
success: true,
|
|
65
|
-
elements: [
|
|
66
|
-
{
|
|
67
|
-
element: "container",
|
|
68
|
-
data: {
|
|
69
|
-
type: "monospace",
|
|
70
|
-
attributes: {},
|
|
71
|
-
elements: result.elements,
|
|
72
|
-
},
|
|
73
|
-
},
|
|
74
|
-
],
|
|
75
|
-
consumed: 1 + result.consumed + 1, // open + content + close
|
|
76
|
-
};
|
|
48
|
+
return parseSameLineDelimitedContainer(ctx, "MONO_CLOSE", "monospace");
|
|
77
49
|
},
|
|
78
50
|
};
|
|
@@ -0,0 +1,42 @@
|
|
|
1
|
+
import type { ParseContext } from "../../types";
|
|
2
|
+
import { INDENT_ACCEPTING_BLOCK_NAMES, KNOWN_BLOCK_NAMES } from "../../../constants";
|
|
3
|
+
import { parseBlockName } from "../../common";
|
|
4
|
+
|
|
5
|
+
/**
|
|
6
|
+
* Checks whether the block token at `tokenPos` names a block in the excluded set.
|
|
7
|
+
*/
|
|
8
|
+
export function isExcludedBlockToken(ctx: ParseContext, tokenPos: number): boolean {
|
|
9
|
+
const excluded = ctx.scope.excludedBlockNames;
|
|
10
|
+
if (!excluded?.size) return false;
|
|
11
|
+
const token = ctx.tokens[tokenPos];
|
|
12
|
+
if (token?.type !== "BLOCK_OPEN" && token?.type !== "BLOCK_END_OPEN") return false;
|
|
13
|
+
const nameResult = parseBlockName(ctx, tokenPos + 1);
|
|
14
|
+
return nameResult !== null && excluded.has(nameResult.name);
|
|
15
|
+
}
|
|
16
|
+
|
|
17
|
+
/**
|
|
18
|
+
* Checks whether the block token at `tokenPos` names a block that no rule recognizes.
|
|
19
|
+
*/
|
|
20
|
+
export function isUnknownBlockToken(ctx: ParseContext, tokenPos: number): boolean {
|
|
21
|
+
const token = ctx.tokens[tokenPos];
|
|
22
|
+
if (token?.type !== "BLOCK_OPEN" && token?.type !== "BLOCK_END_OPEN") return false;
|
|
23
|
+
const nameResult = parseBlockName(ctx, tokenPos + 1);
|
|
24
|
+
if (nameResult === null) {
|
|
25
|
+
if (ctx.tokens[tokenPos + 1]?.type === "EQUALS") {
|
|
26
|
+
return false;
|
|
27
|
+
}
|
|
28
|
+
return true;
|
|
29
|
+
}
|
|
30
|
+
return !KNOWN_BLOCK_NAMES.has(nameResult.name);
|
|
31
|
+
}
|
|
32
|
+
|
|
33
|
+
/**
|
|
34
|
+
* Checks whether the block token at `tokenPos` names a block whose rule accepts indentation.
|
|
35
|
+
*/
|
|
36
|
+
export function isIndentAcceptingBlock(ctx: ParseContext, tokenPos: number): boolean {
|
|
37
|
+
const token = ctx.tokens[tokenPos];
|
|
38
|
+
if (token?.type !== "BLOCK_OPEN" && token?.type !== "BLOCK_END_OPEN") return false;
|
|
39
|
+
const nameResult = parseBlockName(ctx, tokenPos + 1);
|
|
40
|
+
if (nameResult === null) return false;
|
|
41
|
+
return INDENT_ACCEPTING_BLOCK_NAMES.has(nameResult.name);
|
|
42
|
+
}
|
|
@@ -0,0 +1,117 @@
|
|
|
1
|
+
import type { ParseContext } from "../../types";
|
|
2
|
+
import { BLOCK_START_TOKEN_SET } from "../../../constants";
|
|
3
|
+
import {
|
|
4
|
+
isExcludedBlockToken,
|
|
5
|
+
isIndentAcceptingBlock,
|
|
6
|
+
isUnknownBlockToken,
|
|
7
|
+
} from "./block-boundary";
|
|
8
|
+
|
|
9
|
+
export function isParagraphBreakingBlockStart(
|
|
10
|
+
ctx: ParseContext,
|
|
11
|
+
newlinePos: number,
|
|
12
|
+
lookAhead: number,
|
|
13
|
+
): boolean {
|
|
14
|
+
const nextPos = newlinePos + lookAhead;
|
|
15
|
+
const nextMeaningfulToken = ctx.tokens[nextPos];
|
|
16
|
+
if (!nextMeaningfulToken || !BLOCK_START_TOKEN_SET.has(nextMeaningfulToken.type)) {
|
|
17
|
+
return false;
|
|
18
|
+
}
|
|
19
|
+
|
|
20
|
+
const isIndentedBlockOpener =
|
|
21
|
+
(nextMeaningfulToken.type === "BLOCK_OPEN" || nextMeaningfulToken.type === "BLOCK_END_OPEN") &&
|
|
22
|
+
isIndentAcceptingBlock(ctx, nextPos);
|
|
23
|
+
|
|
24
|
+
if (!nextMeaningfulToken.lineStart && !isIndentedBlockOpener) {
|
|
25
|
+
return false;
|
|
26
|
+
}
|
|
27
|
+
|
|
28
|
+
return (
|
|
29
|
+
!isOrphanCloseSpan(ctx, nextPos) &&
|
|
30
|
+
!isAnchorName(ctx, nextPos) &&
|
|
31
|
+
!isInvalidBlockOpen(ctx, nextPos) &&
|
|
32
|
+
!isInvalidHeading(ctx, nextPos) &&
|
|
33
|
+
!isExcludedBlockStart(ctx, nextPos) &&
|
|
34
|
+
!isUnknownBlockStart(ctx, nextPos)
|
|
35
|
+
);
|
|
36
|
+
}
|
|
37
|
+
|
|
38
|
+
function isOrphanCloseSpan(ctx: ParseContext, blockEndOpenPos: number): boolean {
|
|
39
|
+
const token = ctx.tokens[blockEndOpenPos];
|
|
40
|
+
if (token?.type !== "BLOCK_END_OPEN") return false;
|
|
41
|
+
|
|
42
|
+
const namePos = skipWhitespace(ctx, blockEndOpenPos + 1);
|
|
43
|
+
const nameToken = ctx.tokens[namePos];
|
|
44
|
+
return nameToken?.type === "IDENTIFIER" && nameToken.value.toLowerCase() === "span";
|
|
45
|
+
}
|
|
46
|
+
|
|
47
|
+
function isAnchorName(ctx: ParseContext, blockOpenPos: number): boolean {
|
|
48
|
+
const token = ctx.tokens[blockOpenPos];
|
|
49
|
+
if (token?.type !== "BLOCK_OPEN") return false;
|
|
50
|
+
|
|
51
|
+
const hashPos = skipWhitespace(ctx, blockOpenPos + 1);
|
|
52
|
+
const hashToken = ctx.tokens[hashPos];
|
|
53
|
+
return hashToken?.type === "HASH" || (hashToken?.type === "TEXT" && hashToken.value === "#");
|
|
54
|
+
}
|
|
55
|
+
|
|
56
|
+
function isInvalidBlockOpen(ctx: ParseContext, blockOpenPos: number): boolean {
|
|
57
|
+
const token = ctx.tokens[blockOpenPos];
|
|
58
|
+
if (token?.type !== "BLOCK_OPEN") return false;
|
|
59
|
+
|
|
60
|
+
const firstAfter = ctx.tokens[blockOpenPos + 1];
|
|
61
|
+
if (firstAfter?.type === "TEXT" && (firstAfter.value === ">" || firstAfter.value === "<")) {
|
|
62
|
+
const secondAfter = ctx.tokens[blockOpenPos + 2];
|
|
63
|
+
if (secondAfter && secondAfter.type !== "BLOCK_CLOSE") {
|
|
64
|
+
return true;
|
|
65
|
+
}
|
|
66
|
+
}
|
|
67
|
+
|
|
68
|
+
const blockNamePos = skipWhitespace(ctx, blockOpenPos + 1);
|
|
69
|
+
const blockNameToken = ctx.tokens[blockNamePos];
|
|
70
|
+
return (
|
|
71
|
+
blockNameToken !== undefined &&
|
|
72
|
+
(blockNameToken.type === "TEXT" || blockNameToken.type === "IDENTIFIER") &&
|
|
73
|
+
blockNameToken.value.toLowerCase() === "footnoteblock" &&
|
|
74
|
+
Boolean(ctx.scope.footnoteBlockParsed)
|
|
75
|
+
);
|
|
76
|
+
}
|
|
77
|
+
|
|
78
|
+
function isInvalidHeading(ctx: ParseContext, markerPos: number): boolean {
|
|
79
|
+
const marker = ctx.tokens[markerPos];
|
|
80
|
+
if (marker?.type !== "HEADING_MARKER") return false;
|
|
81
|
+
|
|
82
|
+
const markerLen = marker.value.length;
|
|
83
|
+
const afterMarker = ctx.tokens[markerPos + 1];
|
|
84
|
+
if (markerLen > 6) {
|
|
85
|
+
return true;
|
|
86
|
+
}
|
|
87
|
+
|
|
88
|
+
if (afterMarker?.type === "STAR") {
|
|
89
|
+
return ctx.tokens[markerPos + 2]?.type !== "WHITESPACE";
|
|
90
|
+
}
|
|
91
|
+
|
|
92
|
+
return afterMarker?.type !== "WHITESPACE";
|
|
93
|
+
}
|
|
94
|
+
|
|
95
|
+
function isExcludedBlockStart(ctx: ParseContext, tokenPos: number): boolean {
|
|
96
|
+
const token = ctx.tokens[tokenPos];
|
|
97
|
+
return (
|
|
98
|
+
(token?.type === "BLOCK_OPEN" || token?.type === "BLOCK_END_OPEN") &&
|
|
99
|
+
isExcludedBlockToken(ctx, tokenPos)
|
|
100
|
+
);
|
|
101
|
+
}
|
|
102
|
+
|
|
103
|
+
function isUnknownBlockStart(ctx: ParseContext, tokenPos: number): boolean {
|
|
104
|
+
const token = ctx.tokens[tokenPos];
|
|
105
|
+
return (
|
|
106
|
+
(token?.type === "BLOCK_OPEN" || token?.type === "BLOCK_END_OPEN") &&
|
|
107
|
+
isUnknownBlockToken(ctx, tokenPos)
|
|
108
|
+
);
|
|
109
|
+
}
|
|
110
|
+
|
|
111
|
+
function skipWhitespace(ctx: ParseContext, startPos: number): number {
|
|
112
|
+
let pos = startPos;
|
|
113
|
+
while (ctx.tokens[pos]?.type === "WHITESPACE") {
|
|
114
|
+
pos++;
|
|
115
|
+
}
|
|
116
|
+
return pos;
|
|
117
|
+
}
|
|
@@ -0,0 +1,23 @@
|
|
|
1
|
+
import type { Token } from "../../../../lexer";
|
|
2
|
+
import type { ParseContext } from "../../types";
|
|
3
|
+
|
|
4
|
+
/**
|
|
5
|
+
* Collect tokens until newline or EOF.
|
|
6
|
+
*/
|
|
7
|
+
export function collectUntilNewline(ctx: ParseContext): { tokens: Token[]; consumed: number } {
|
|
8
|
+
const tokens: Token[] = [];
|
|
9
|
+
let consumed = 0;
|
|
10
|
+
let pos = ctx.pos;
|
|
11
|
+
|
|
12
|
+
while (pos < ctx.tokens.length) {
|
|
13
|
+
const token = ctx.tokens[pos];
|
|
14
|
+
if (!token || token.type === "NEWLINE" || token.type === "EOF") {
|
|
15
|
+
break;
|
|
16
|
+
}
|
|
17
|
+
tokens.push(token);
|
|
18
|
+
consumed++;
|
|
19
|
+
pos++;
|
|
20
|
+
}
|
|
21
|
+
|
|
22
|
+
return { tokens, consumed };
|
|
23
|
+
}
|
|
@@ -0,0 +1,115 @@
|
|
|
1
|
+
import type { Element } from "@wdprlib/ast";
|
|
2
|
+
import type { ParseContext } from "../../types";
|
|
3
|
+
import {
|
|
4
|
+
collectLongPlainTextRun,
|
|
5
|
+
MIN_INLINE_TEXT_RUN_DOCUMENT_TOKENS,
|
|
6
|
+
type InlineEndType,
|
|
7
|
+
} from "./plain-text";
|
|
8
|
+
import { getParagraphNewlineBoundary } from "./paragraph-boundary";
|
|
9
|
+
import { createPreservedTrailingLineBreak } from "./preserved-line-break";
|
|
10
|
+
import { getCandidateInlineRules } from "./rules";
|
|
11
|
+
import { parseSimpleInlineToken } from "./simple-token";
|
|
12
|
+
|
|
13
|
+
/**
|
|
14
|
+
* Result of parsing inline content.
|
|
15
|
+
*/
|
|
16
|
+
export interface InlineParseResult {
|
|
17
|
+
elements: Element[];
|
|
18
|
+
consumed: number;
|
|
19
|
+
}
|
|
20
|
+
|
|
21
|
+
/**
|
|
22
|
+
* Parse inline content until a specific token type.
|
|
23
|
+
*
|
|
24
|
+
* When endType is "PARAGRAPH_BREAK", handles NEWLINEs and stops at:
|
|
25
|
+
* - Double NEWLINE (paragraph break)
|
|
26
|
+
* - NEWLINE followed by block-start token
|
|
27
|
+
* - EOF
|
|
28
|
+
*/
|
|
29
|
+
export function parseInlineUntil(ctx: ParseContext, endType: InlineEndType): InlineParseResult {
|
|
30
|
+
const nodes: Element[] = [];
|
|
31
|
+
let consumed = 0;
|
|
32
|
+
let pos = ctx.pos;
|
|
33
|
+
|
|
34
|
+
const paragraphMode = endType === "PARAGRAPH_BREAK";
|
|
35
|
+
const { inlineRules } = ctx;
|
|
36
|
+
const inlineCtx: ParseContext = {
|
|
37
|
+
...ctx,
|
|
38
|
+
pos,
|
|
39
|
+
};
|
|
40
|
+
const canCollectLongPlainTextRuns = ctx.tokens.length >= MIN_INLINE_TEXT_RUN_DOCUMENT_TOKENS;
|
|
41
|
+
|
|
42
|
+
while (pos < ctx.tokens.length) {
|
|
43
|
+
const token = ctx.tokens[pos];
|
|
44
|
+
if (!token || token.type === "EOF") {
|
|
45
|
+
break;
|
|
46
|
+
}
|
|
47
|
+
|
|
48
|
+
if (paragraphMode && ctx.scope.blockCloseCondition) {
|
|
49
|
+
const checkCtx: ParseContext = { ...ctx, pos };
|
|
50
|
+
if (ctx.scope.blockCloseCondition(checkCtx)) {
|
|
51
|
+
break;
|
|
52
|
+
}
|
|
53
|
+
}
|
|
54
|
+
|
|
55
|
+
if (!paragraphMode && token.type === "NEWLINE") {
|
|
56
|
+
break;
|
|
57
|
+
}
|
|
58
|
+
|
|
59
|
+
if (paragraphMode && token.type === "NEWLINE") {
|
|
60
|
+
const boundary = getParagraphNewlineBoundary(ctx, pos, nodes.length > 0);
|
|
61
|
+
if (boundary.shouldBreak) {
|
|
62
|
+
if (boundary.preservePrecedingLineBreak) {
|
|
63
|
+
nodes.push(createPreservedTrailingLineBreak());
|
|
64
|
+
}
|
|
65
|
+
|
|
66
|
+
consumed += boundary.consumed;
|
|
67
|
+
break;
|
|
68
|
+
}
|
|
69
|
+
}
|
|
70
|
+
|
|
71
|
+
if (token.type === endType) {
|
|
72
|
+
break;
|
|
73
|
+
}
|
|
74
|
+
|
|
75
|
+
if (canCollectLongPlainTextRuns) {
|
|
76
|
+
const plainTextRun = collectLongPlainTextRun(ctx, pos, endType);
|
|
77
|
+
if (plainTextRun) {
|
|
78
|
+
nodes.push({ element: "text", data: plainTextRun.value });
|
|
79
|
+
consumed += plainTextRun.consumed;
|
|
80
|
+
pos += plainTextRun.consumed;
|
|
81
|
+
continue;
|
|
82
|
+
}
|
|
83
|
+
}
|
|
84
|
+
|
|
85
|
+
const simpleToken = parseSimpleInlineToken(token, ctx.tokens[pos + 1]);
|
|
86
|
+
if (simpleToken) {
|
|
87
|
+
nodes.push(simpleToken.element);
|
|
88
|
+
consumed += simpleToken.consumed;
|
|
89
|
+
pos += simpleToken.consumed;
|
|
90
|
+
continue;
|
|
91
|
+
}
|
|
92
|
+
|
|
93
|
+
inlineCtx.pos = pos;
|
|
94
|
+
|
|
95
|
+
let matched = false;
|
|
96
|
+
for (const rule of getCandidateInlineRules(inlineRules, token.type)) {
|
|
97
|
+
const result = rule.parse(inlineCtx);
|
|
98
|
+
if (result.success) {
|
|
99
|
+
nodes.push(...result.elements);
|
|
100
|
+
consumed += result.consumed;
|
|
101
|
+
pos += result.consumed;
|
|
102
|
+
matched = true;
|
|
103
|
+
break;
|
|
104
|
+
}
|
|
105
|
+
}
|
|
106
|
+
|
|
107
|
+
if (!matched) {
|
|
108
|
+
nodes.push({ element: "text", data: token.value });
|
|
109
|
+
consumed++;
|
|
110
|
+
pos++;
|
|
111
|
+
}
|
|
112
|
+
}
|
|
113
|
+
|
|
114
|
+
return { elements: nodes, consumed };
|
|
115
|
+
}
|