npm - simple-customize-markdown-converter - Versions diffs - 1.0.7 → 1.2.0 - Mend

simple-customize-markdown-converter 1.0.7 → 1.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (55)

package/README.md +74 -17
package/dist/core/lexer/handler.d.ts +23 -0
package/dist/core/lexer/handler.js +272 -0
package/dist/core/lexer/index.d.ts +42 -0
package/dist/core/lexer/index.js +177 -0
package/dist/core/lexer.d.ts +46 -0
package/dist/core/lexer.js +433 -0
package/dist/core/parser/handler.d.ts +19 -0
package/dist/core/parser/handler.js +254 -0
package/dist/core/parser/index.d.ts +33 -0
package/dist/core/parser/index.js +149 -0
package/dist/core/parser.d.ts +37 -0
package/dist/core/parser.js +346 -0
package/dist/core/renderer.d.ts +3 -0
package/dist/core/renderer.js +99 -0
package/dist/core/resolver/footnote-resolver.d.ts +15 -0
package/dist/core/resolver/footnote-resolver.js +36 -0
package/dist/core/resolver.d.ts +15 -0
package/dist/core/resolver.js +36 -0
package/dist/index.d.ts +6 -3
package/dist/index.js +10 -7
package/dist/react.d.ts +36 -0
package/dist/react.js +56 -0
package/dist/renderers/default/handler.d.ts +21 -0
package/dist/renderers/default/handler.js +114 -0
package/dist/renderers/default/index.d.ts +14 -0
package/dist/renderers/default/index.js +117 -0
package/dist/renderers/default.d.ts +26 -0
package/dist/renderers/default.js +105 -0
package/dist/renderers/index.d.ts +10 -0
package/dist/renderers/index.js +2 -0
package/dist/renderers/react/handler.d.ts +22 -0
package/dist/renderers/react/handler.js +123 -0
package/dist/renderers/react/index.d.ts +15 -0
package/dist/renderers/react/index.js +123 -0
package/dist/renderers/react.d.ts +26 -0
package/dist/renderers/react.js +123 -0
package/dist/types/options/converterOptions.d.ts +11 -0
package/dist/types/options/converterOptions.js +2 -0
package/dist/types/options/index.d.ts +10 -0
package/dist/types/options/index.js +2 -0
package/dist/types/options/reactRenderOptions.d.ts +50 -0
package/dist/types/options/reactRenderOptions.js +2 -0
package/dist/types/options/renderOptions.d.ts +86 -0
package/dist/types/options/renderOptions.js +2 -0
package/dist/types/parser.d.ts +132 -0
package/dist/types/parser.js +2 -0
package/dist/types/renderer.d.ts +12 -0
package/dist/types/renderer.js +2 -0
package/dist/types/token.d.ts +94 -74
package/dist/utilities/parser-utils.d.ts +5 -0
package/dist/utilities/parser-utils.js +65 -0
package/dist/utilities/tokenizer-utils.d.ts +11 -0
package/dist/utilities/tokenizer-utils.js +159 -0
package/package.json +24 -3

package/dist/core/lexer.js ADDED

@@ -0,0 +1,433 @@
+"use strict";
+Object.defineProperty(exports, "__esModule", { value: true });
+/**
+ * Character-driven Markdown lexer.
+ *
+ * `tokenize()` inspects the input at the cursor, runs the first matching handler and then
+ * ALWAYS advances the cursor by one. Every `handle*` method therefore has to finish with the
+ * cursor on the LAST character it consumed (not one past it); a handler that stops one
+ * character too far makes the following character disappear from the output.
+ */
+class Lexer {
+    /**
+     * @param input - Markdown source to tokenize.
+     */
+    constructor(input) {
+        // Index of the character currently under the cursor
+        this.pos = 0;
+        // Tokens emitted so far
+        this.listToken = [];
+        // Flag for handle special syntax: current list nesting depth (0 = not inside a list)
+        this.listLevelFlag = 0;
+        this.input = input;
+    }
+    //Reset input and other attribute so the same instance can tokenize another string
+    setInput(input) {
+        this.input = input;
+        this.pos = 0;
+        this.listLevelFlag = 0;
+        this.listToken = [];
+    }
+    /**
+     * Tokenize the markdown into a list of tokens.
+     * Handlers are tried in declaration order and the first match wins; characters no handler
+     * claims are accumulated into `Text` tokens. Lists still open at the end are closed.
+     * @param isEof - `True` when input is whole markdown, `False` if input is just a part of markdown.
+     * @returns List of tokens
+     */
+    tokenize(isEof = true) {
+        const TOKEN_HANDLER = [
+            //Handle escape character first. peek() reports end of input as null, so a trailing
+            //backslash (nothing left to escape) falls through and is kept as plain text.
+            {
+                match: (lex) => lex.peek() === "\\" && lex.peek(1) !== null,
+                emit: (lex) => {
+                    lex.next(1);
+                    lex.handleTextBlock();
+                }
+            },
+            //For HTML
+            //Comment: produces no token. Stop on the ">" of "-->" (2 characters in) so the
+            //main loop's next() lands on the first character after the comment.
+            {
+                match: (lex) => lex.startsWith("<!--"),
+                emit: (lex) => {
+                    lex.readUntilMatchString("-->");
+                    lex.next(2);
+                }
+            },
+            //Normal HTML
+            {
+                match: (lex) => lex.peek() === "<",
+                emit: (lex) => {
+                    //Decide between block-level and inline HTML from the tag name
+                    const line = lex.peekUntil(">");
+                    const blockRegex = /^<(h[1-6]|div|table|pre|blockquote|ul|ol|li|p|section|article|header|footer|nav|aside|hr|form|iframe)\b/i;
+                    if (blockRegex.test(line)) {
+                        lex.handleHtmlBlock();
+                    }
+                    else {
+                        lex.handleHtmlInline();
+                    }
+                }
+            },
+            {
+                //Regex: if line started with at least 3 characters: -, *, _
+                //Only recognised directly after a NewLine token.
+                match: (lex) => /^([-*_])\1{2,}$/.test(lex.peekUntil("\n").trim()) && lex.getLastToken()?.type === "NewLine",
+                emit: (lex) => lex.handleHorizontalLine()
+            },
+            { match: (lex) => lex.startsWith("```"), emit: (lex) => lex.handleCodeBlock() },
+            { match: (lex) => lex.startsWith("**"), emit: (lex) => lex.handleBold() },
+            { match: (lex) => lex.startsWith("~~"), emit: (lex) => lex.handleStrikethrough() },
+            // Footnote Definition
+            { match: (lex) => lex.isStartOfLine() && /^\[\^[^\]]+\]:/.test(lex.peekUntil("\n")), emit: (lex) => lex.handleFootnoteDef() },
+            // Footnote Reference
+            { match: (lex) => lex.startsWith("[^"), emit: (lex) => lex.handleFootnoteRef() },
+            //For List
+            {
+                //Task item: "- [ ] " / "- [x] " (must be tested before the plain bullet)
+                match: (lex) => lex.isStartOfLine() && /^(\s*)([-*+]) \[( |x|X)\] /.test(lex.peekUntil("\n")),
+                emit: (lex) => lex.handleList(false, true)
+            },
+            {
+                //Regex: if line started with zero or more spaces, then have - or + or * + 1 space
+                match: (lex) => lex.isStartOfLine() && /^(\s*)([-*+]) /.test(lex.peekUntil("\n")),
+                emit: (lex) => lex.handleList(false, false)
+            },
+            {
+                //Regex: if line started with zero or more spaces, then have number. character + 1 space
+                match: (lex) => lex.isStartOfLine() && /^(\s*)(\d+)\. /.test(lex.peekUntil("\n")),
+                emit: (lex) => lex.handleList(true, false)
+            },
+            {
+                //A line that is not a list item while a list is open: close every open list
+                match: (lex) => lex.listLevelFlag > 0 && lex.isStartOfLine() && !/^(\s*)([-+*]|\d+\.) /.test(lex.peekUntil("\n")),
+                emit: (lex) => {
+                    while (lex.listLevelFlag > 0) {
+                        lex.handleEndList();
+                    }
+                    //A blank line is swallowed as the list terminator. Anything else is real
+                    //content: step back so the main loop's next() returns to this character
+                    //and it is tokenized normally instead of being dropped.
+                    if (lex.peek() !== "\n")
+                        lex.pos--;
+                }
+            },
+            //For table
+            { match: (lex) => lex.isStartOfLine() && /^\s*\|.*\|\s*$/.test(lex.peekUntil("\n")), emit: (lex) => lex.handleTable() },
+            //For common syntax
+            { match: (lex) => lex.peek() === "`", emit: (lex) => lex.handleInlineBlock() },
+            { match: (lex) => lex.peek() === "#", emit: (lex) => lex.handleHeader() },
+            { match: (lex) => lex.peek() === "*" || lex.peek() === "_", emit: (lex) => lex.handleItalic() },
+            { match: (lex) => lex.peek() === ">", emit: (lex) => lex.handleQuoteBlock() },
+            { match: (lex) => lex.peek() === "[", emit: (lex) => lex.handleLink() },
+            { match: (lex) => lex.peek() === "!" && lex.peek(1) === "[", emit: (lex) => lex.handleImage() },
+            { match: (lex) => lex.peek() === "\n", emit: (lex) => lex.listToken.push({ type: "NewLine" }) },
+        ];
+        while (!this.isEndOfFile()) {
+            let matched = false;
+            for (const handler of TOKEN_HANDLER) {
+                if (handler.match(this)) {
+                    handler.emit(this);
+                    matched = true;
+                    break;
+                }
+            }
+            if (!matched) {
+                this.handleTextBlock();
+            }
+            //Unconditional step: handlers rely on it to move past their last character
+            this.next();
+        }
+        while (this.listLevelFlag > 0) {
+            this.handleEndList();
+        }
+        if (isEof)
+            this.listToken.push({ type: "EOF" });
+        return this.listToken;
+    }
+    //Get current character with offset; null when the index is outside the input
+    peek(offset = 0) {
+        const i = this.pos + offset;
+        return i >= 0 && i < this.input.length ? this.input[i] : null;
+    }
+    //Move cursor by amount
+    next(amount = 1) {
+        this.pos += amount;
+    }
+    //If current cursor startsWith given str
+    startsWith(str) {
+        return this.input.slice(this.pos, this.pos + str.length) === str;
+    }
+    //True once the cursor has moved past the last character
+    isEndOfFile() {
+        return this.pos >= this.input.length;
+    }
+    //Most recently emitted token, or undefined when nothing was emitted yet
+    getLastToken() {
+        return this.listToken[this.listToken.length - 1];
+    }
+    /**
+     * Tokenize a pipe table starting at the cursor (header row, alignment row, body rows).
+     * Cell contents are tokenized with a nested Lexer. When the second line is not a valid
+     * alignment row the consumed lines are emitted unchanged as one Text token.
+     * Leaves the cursor on the newline that ends the last consumed line, so the line after
+     * the table is tokenized by the main loop.
+     */
+    handleTable() {
+        //Strip the outer pipes of a row and split it into raw (untrimmed) cells
+        const splitRow = (row) => row.trim().replace(/^ *\|/, "").replace(/\| *$/, "").split("|");
+        const tokenizeResult = [];
+        const handler = new Lexer("");
+        const start = this.pos;
+        const header = this.readUntil("\n", true);
+        const headerDetails = splitRow(header);
+        const align = this.readUntil("\n", true);
+        //Trim so the usual "| --- | :---: |" spelling is accepted, not only "|---|:---:|"
+        const alignDetails = splitRow(align).map(cell => cell.trim());
+        if (alignDetails.length !== headerDetails.length || !alignDetails.every(c => /^:?-{3,}:?$/.test(c))) {
+            //Not a table: emit exactly what was consumed (no invented characters at end of input)
+            this.listToken.push({ type: "Text", value: this.input.slice(start, this.pos) });
+            this.pos--; //Back onto the consumed newline; the main loop steps to the next line
+            return;
+        }
+        //Handle alignment
+        const normalizeAlign = alignDetails.map(value => {
+            if (value.startsWith(":") && value.endsWith(":"))
+                return "center";
+            else if (value.endsWith(":"))
+                return "right";
+            else
+                return "left";
+        });
+        //Emit RowStart, one CellStart/.../CellEnd group per cell, then RowEnd
+        const pushRow = (cells, isHeader) => {
+            tokenizeResult.push({ type: "RowStart", isHeader: isHeader });
+            cells.forEach((cell, index) => {
+                tokenizeResult.push({ type: "CellStart", align: normalizeAlign[index] ?? "left" });
+                handler.setInput(cell.trim());
+                tokenizeResult.push(...handler.tokenize(false));
+                tokenizeResult.push({ type: "CellEnd" });
+            });
+            tokenizeResult.push({ type: "RowEnd" });
+        };
+        tokenizeResult.push({ type: "TableStart" });
+        //Handle header
+        pushRow(headerDetails, true);
+        //Handle body
+        while (!this.isEndOfFile()) {
+            //Look before consuming: the first line that is not a row belongs to the main loop
+            const line = this.peekUntil("\n").trim();
+            if (!line.startsWith("|") || !line.endsWith("|"))
+                break; //End of table
+            this.readUntil("\n", true);
+            pushRow(splitRow(line), false);
+        }
+        tokenizeResult.push({ type: "TableEnd" });
+        this.listToken.push(...tokenizeResult);
+        this.pos--; //Back onto the consumed newline; the main loop steps to the next line
+    }
+    /**
+     * Emit a Header token whose level is the number of consecutive "#" at the cursor.
+     * The separating space, when present, is left for the main loop to skip.
+     */
+    handleHeader() {
+        let level = 0;
+        while (this.peek() === "#") {
+            level++;
+            this.next();
+        }
+        //No space after the "#" run: step back onto the last "#" so the main loop's next()
+        //lands on the first content character instead of skipping it
+        if (this.peek() !== " ")
+            this.pos--;
+        this.listToken.push({ type: "Header", level });
+    }
+    /**
+     * Emit a CodeBlock token for a ``` fence: the rest of the opening line is the language,
+     * everything up to the closing fence (or end of input) is the content.
+     */
+    handleCodeBlock() {
+        let lang = "";
+        let content = "";
+        this.next(3); //Skip open block
+        while (!this.isEndOfFile() && this.peek() !== "\n") {
+            lang += this.peek();
+            this.next();
+        }
+        this.next(); //Skip \n
+        while (!this.isEndOfFile() && !this.startsWith("```")) {
+            content += this.peek();
+            this.next();
+        }
+        this.next(2); //Skip close block (due to next() after each tokenize iteration)
+        this.listToken.push({ "type": "CodeBlock", lang: lang.trim(), content: content.trimEnd() });
+    }
+    //Append the current character to the trailing Text token, or start a new Text token
+    handleTextBlock() {
+        const currentChar = this.peek();
+        if (currentChar === null)
+            return;
+        const lastToken = this.getLastToken();
+        if (lastToken?.type === "Text")
+            lastToken.value += currentChar;
+        else
+            this.listToken.push({ type: "Text", value: currentChar });
+    }
+    //Emit an Italic marker for a single * or _
+    handleItalic() {
+        this.listToken.push({ type: "Italic" });
+    }
+    //Emit a Bold marker for **
+    handleBold() {
+        this.listToken.push({ type: "Bold" });
+        this.next(); //Skip remain *
+    }
+    //Emit a Strikethrough marker for ~~
+    handleStrikethrough() {
+        this.listToken.push({ type: "Strikethrough" });
+        this.next(); //Skip remain ~
+    }
+    //Emit an InlineCode token with everything up to the closing backtick (or end of input)
+    handleInlineBlock() {
+        let content = "";
+        this.next(); //Skip open block
+        while (!this.isEndOfFile() && !this.startsWith("`")) {
+            content += this.peek();
+            this.next();
+        }
+        this.listToken.push({ "type": "InlineCode", content: content });
+    }
+    //Emit a Quote marker for >
+    handleQuoteBlock() {
+        this.listToken.push({ type: "Quote" });
+    }
+    /**
+     * Handle one list line: open or close list levels to match its indentation (two spaces
+     * per level), then emit the item token.
+     * @param isOrdered - `True` for "1. " style markers.
+     * @param isTask - `True` for "- [ ] " / "- [x] " task items (always unordered).
+     */
+    handleList(isOrdered, isTask) {
+        const line = this.peekUntil("\n");
+        //Prefix-only patterns, identical to the matchers in tokenize(). Anchoring on the rest
+        //of the line with "(.*)$" fails when the line ends in "\r" and made CRLF input throw.
+        //Group 1: indentation, group 2: marker, group 3 (task only): checkbox character
+        let pattern;
+        if (isTask)
+            pattern = /^(\s*)([-*+]) \[( |x|X)\] /;
+        else if (isOrdered)
+            pattern = /^(\s*)(\d+)\. /;
+        else
+            pattern = /^(\s*)([-*+]) /;
+        const m = line.match(pattern);
+        if (!m) {
+            //Only reachable when called on a non-list line: keep the character as text
+            this.handleTextBlock();
+            return;
+        }
+        const indent = Math.floor(m[1].length / 2) + 1; //m[1] to get the spaces in group 1
+        const ordered = isTask ? false : isOrdered;
+        while (this.listLevelFlag < indent)
+            this.handleStartList(ordered);
+        while (this.listLevelFlag > indent)
+            this.handleEndList();
+        if (isTask) {
+            this.next(m[1].length + 4); //Indent + "- [x", cursor is now on "]"
+            this.handleTaskItem(m[3].toLowerCase() === "x");
+        }
+        else {
+            //Unordered: stop on the bullet. Ordered: skip every digit and stop on the "."
+            this.next(m[1].length + (isOrdered ? m[2].length : 0));
+            this.handleListItem();
+        }
+    }
+    //Open one more list level and emit ListStart for it
+    handleStartList(isOrder) {
+        this.listLevelFlag++;
+        this.listToken.push({ type: "ListStart", level: this.listLevelFlag, ordered: isOrder });
+    }
+    handleListItem() {
+        this.next(); // Skip space between - and text
+        this.listToken.push({ type: "ListItem" });
+    }
+    handleTaskItem(isChecked) {
+        this.next(); // Skip space between last ] and text
+        this.listToken.push({ type: "TaskItem", checked: isChecked });
+    }
+    //Close one list level (never below 0) and emit ListEnd
+    handleEndList() {
+        if (this.listLevelFlag > 0)
+            this.listLevelFlag--;
+        this.listToken.push({ type: "ListEnd" });
+    }
+    /**
+     * Emit a Link token for "[text](href)". A bracket that is not followed by "(" is emitted
+     * as the literal text that was read; nothing after it is consumed.
+     */
+    handleLink() {
+        this.next(); //Skip [
+        const text = this.readUntil("]");
+        const isClosed = this.peek() === "]";
+        if (isClosed && this.peek(1) === "(") {
+            this.next(2); //Skip ](
+            const url = this.readUntil(")");
+            //Don't skip ) due to auto skip on while loop
+            this.listToken.push({ type: "Link", text: text, href: url });
+        }
+        else {
+            //Cursor stays on "]" (or at end of input) so the next character is not lost
+            this.listToken.push({ type: "Text", value: isClosed ? `[${text}]` : `[${text}` });
+        }
+    }
+    /**
+     * Emit an Image token for "![alt](src)". Without the "(src)" part the consumed characters
+     * are emitted as literal text; nothing after them is consumed.
+     */
+    handleImage() {
+        if (this.peek(1) !== "[") {
+            //Not an image after all: keep the "!" as text
+            this.handleTextBlock();
+            return;
+        }
+        this.next(2); //Skip ![
+        const alt = this.readUntil("]");
+        const isClosed = this.peek() === "]";
+        if (isClosed && this.peek(1) === "(") {
+            this.next(2); //Skip ](
+            const src = this.readUntil(")");
+            //Don't skip ) due to auto skip on while loop (same convention as handleLink)
+            this.listToken.push({ type: "Image", alt: alt, src: src });
+        }
+        else {
+            this.listToken.push({ type: "Text", value: isClosed ? `![${alt}]` : `![${alt}` });
+        }
+    }
+    //Emit HorizontalLine and consume the whole rule line, whatever its length
+    handleHorizontalLine() {
+        const line = this.peekUntil("\n");
+        //Stop on the last character of the line; the main loop steps onto the newline
+        this.next(Math.max(line.length - 1, 2));
+        this.listToken.push({ type: "HorizontalLine" });
+    }
+    //True for "<tag ... />" and for the tags this lexer treats as having no closing tag
+    isSelfClosingTag(openTag, tagName) {
+        return openTag.endsWith("/>") || ["hr", "img", "br", "input", "meta", "link"].includes(tagName.toLowerCase());
+    }
+    /**
+     * Emit an HTMLBlock token holding the opening tag, everything up to the matching closing
+     * tag (matched case-insensitively) and the closing tag itself.
+     */
+    handleHtmlBlock() {
+        const openTag = this.peekUntil(">") + ">";
+        const matchTagName = /^<\s*([a-zA-Z0-9]+)/.exec(openTag);
+        const tagName = matchTagName ? matchTagName[1] : null;
+        //Tagname is not valid: keep "<" as text and consume nothing else
+        if (!tagName) {
+            this.listToken.push({ type: "Text", value: "<" });
+            return;
+        }
+        //If it's self-closing tag
+        if (this.isSelfClosingTag(openTag, tagName)) {
+            this.next(openTag.length - 1); //Stop on ">"
+            this.listToken.push({ type: "HTMLBlock", value: openTag });
+            return;
+        }
+        this.next(openTag.length); //Skip opening tag
+        const closeTag = `</${tagName}>`;
+        const closeTagLower = closeTag.toLowerCase();
+        let content = "";
+        while (!this.isEndOfFile()) {
+            //Lower-case both sides so "<DIV>" is closed by "</DIV>" as well as "</div>"
+            if (this.peekUntilByOffset(closeTag.length).toLowerCase() === closeTagLower) {
+                break;
+            }
+            content += this.peek();
+            this.next();
+        }
+        this.next(closeTag.length - 1); //Skip closing tag
+        this.listToken.push({ type: "HTMLBlock", value: openTag + content + closeTag });
+    }
+    /**
+     * Emit an HTMLInline token. Void / self-closing tags (e.g. <br>, <img ...>) produce a token
+     * with the tag alone; other tags run up to their closing tag.
+     */
+    handleHtmlInline() {
+        const openTag = this.peekUntil(">") + ">";
+        const matchTagName = /^<\s*([a-zA-Z0-9]+)/.exec(openTag);
+        const tagName = matchTagName ? matchTagName[1] : null;
+        //Tagname is not valid: keep "<" as text and consume nothing else
+        if (!tagName) {
+            this.listToken.push({ type: "Text", value: "<" });
+            return;
+        }
+        //Without this a void tag would search for a closing tag that never comes and
+        //swallow the rest of the input
+        if (this.isSelfClosingTag(openTag, tagName)) {
+            this.next(openTag.length - 1); //Stop on ">"
+            this.listToken.push({ type: "HTMLInline", value: openTag });
+            return;
+        }
+        this.next(openTag.length); //Skip opening tag
+        const closeTag = `</${tagName}>`;
+        const content = this.readUntilMatchString(closeTag);
+        this.next(closeTag.length - 1); //Skip closing tag
+        this.listToken.push({ type: "HTMLInline", value: openTag + content + closeTag });
+    }
+    //Emit FootnoteDef for a "[^id]: content" line; the cursor stops on the line's newline
+    handleFootnoteDef() {
+        const line = this.readUntil("\n");
+        const match = line.match(/^\[\^([^\]]+)\]:\s*(.*)$/);
+        if (match) {
+            const id = match[1];
+            const content = match[2];
+            this.listToken.push({ type: "FootnoteDef", id, content });
+        }
+    }
+    //Emit FootnoteRef for "[^id]"; the cursor stops on the closing "]"
+    handleFootnoteRef() {
+        this.next(2); //Skip [^
+        const id = this.readUntil("]");
+        this.listToken.push({ type: "FootnoteRef", id });
+    }
+    //Utilities function
+    /**
+     * Read and consume characters up to (not including) `char` or the end of input.
+     * @param char - Stop character.
+     * @param isConsumeChar - When `True` the cursor is also moved past the stop character.
+     * @returns The characters read; an empty string when already at the end of input.
+     */
+    readUntil(char, isConsumeChar = false) {
+        let result = "";
+        //Check for end of input first: peek() is null there and must not be appended
+        while (!this.isEndOfFile() && this.peek() !== char) {
+            result += this.peek();
+            this.next();
+        }
+        if (isConsumeChar)
+            this.next(char.length); //Make cursor skip the char
+        return result;
+    }
+    //Like readUntil, but without moving the cursor
+    peekUntil(char) {
+        let result = "";
+        let i = 0;
+        while (true) {
+            const current = this.peek(i++);
+            if (current == null)
+                break;
+            if (current == char)
+                break;
+            result += current;
+        }
+        return result;
+    }
+    //Return up to `offset` characters starting at the cursor, without moving it
+    peekUntilByOffset(offset) {
+        let result = "";
+        let i = 0;
+        while (i !== offset) {
+            const current = this.peek(i++);
+            if (current == null)
+                break;
+            result += current;
+        }
+        return result;
+    }
+    //True at the very beginning of the input or directly after a newline
+    isStartOfLine() {
+        return this.pos === 0 || this.peek(-1) === "\n";
+    }
+    /**
+     * Read and consume characters until the input at the cursor starts with `str`.
+     * @param str - Terminator to look for.
+     * @param isConsume - When `True` the cursor is also moved past the terminator.
+     * @returns The characters read before the terminator (everything left when it never occurs).
+     */
+    readUntilMatchString(str, isConsume = false) {
+        let result = "";
+        while (!this.isEndOfFile()) {
+            if (this.peekUntilByOffset(str.length) === str) {
+                if (isConsume)
+                    this.next(str.length);
+                break;
+            }
+            result += this.peek();
+            this.next();
+        }
+        return result;
+    }
+}
+exports.default = Lexer;

package/dist/core/parser/handler.d.ts ADDED

@@ -0,0 +1,19 @@
+import { ParsingStrategy } from "../../types/parser";
+/**
+ * Type declarations for the parser handlers exported by this module.
+ * Every handler is declared with the same `ParsingStrategy` type (imported from
+ * "../../types/parser"); the implementations are not part of this declaration file.
+ * NOTE(review): presumably each handler parses the token kind its name refers to —
+ * confirm against the accompanying handler.js.
+ */
+declare const CodeBlockHandler: ParsingStrategy;
+declare const HeaderHandler: ParsingStrategy;
+declare const BoldHandler: ParsingStrategy;
+declare const ItalicHandler: ParsingStrategy;
+declare const StrikethroughHandler: ParsingStrategy;
+declare const InlineHandler: ParsingStrategy;
+declare const QuoteHandler: ParsingStrategy;
+declare const ListHandler: ParsingStrategy;
+declare const LinkHandler: ParsingStrategy;
+declare const ImageHandler: ParsingStrategy;
+declare const TableHandler: ParsingStrategy;
+declare const HtmlBlockHandler: ParsingStrategy;
+declare const HtmlInlineHandler: ParsingStrategy;
+declare const HorizontalLineHandler: ParsingStrategy;
+declare const FootnoteDefHandler: ParsingStrategy;
+declare const FootnoteRefHandler: ParsingStrategy;
+declare const NewLineHandler: ParsingStrategy;
+export { BoldHandler, CodeBlockHandler, FootnoteDefHandler, FootnoteRefHandler, HeaderHandler, HorizontalLineHandler, HtmlBlockHandler, HtmlInlineHandler, ImageHandler, InlineHandler, ItalicHandler, LinkHandler, ListHandler, NewLineHandler, QuoteHandler, StrikethroughHandler, TableHandler, };