npm - @cj-tech-master/excelts - Versions diffs - 7.6.0 → 8.0.0 - Mend

@cj-tech-master/excelts 7.6.0 → 8.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (79) hide show

package/README.md +99 -577
package/README_zh.md +101 -577
package/dist/browser/index.browser.d.ts +3 -0
package/dist/browser/index.browser.js +2 -0
package/dist/browser/index.d.ts +3 -0
package/dist/browser/index.js +2 -0
package/dist/browser/modules/archive/compression/compress.browser.js +4 -4
package/dist/browser/modules/archive/compression/deflate-fallback.d.ts +24 -22
package/dist/browser/modules/archive/compression/deflate-fallback.js +664 -360
package/dist/browser/modules/archive/compression/streaming-compress.browser.d.ts +7 -0
package/dist/browser/modules/archive/compression/streaming-compress.browser.js +15 -3
package/dist/browser/modules/archive/compression/streaming-compress.d.ts +5 -0
package/dist/browser/modules/archive/compression/streaming-compress.js +7 -0
package/dist/browser/modules/archive/zip/stream.js +27 -3
package/dist/browser/modules/excel/workbook.browser.d.ts +72 -0
package/dist/browser/modules/excel/workbook.browser.js +226 -0
package/dist/browser/modules/excel/workbook.d.ts +32 -1
package/dist/browser/modules/excel/workbook.js +47 -2
package/dist/browser/modules/excel/xlsx/xlsx.browser.js +42 -4
package/dist/browser/modules/markdown/constants.d.ts +30 -0
package/dist/browser/modules/markdown/constants.js +30 -0
package/dist/browser/modules/markdown/errors.d.ts +21 -0
package/dist/browser/modules/markdown/errors.js +23 -0
package/dist/browser/modules/markdown/format/index.d.ts +54 -0
package/dist/browser/modules/markdown/format/index.js +307 -0
package/dist/browser/modules/markdown/index.d.ts +15 -0
package/dist/browser/modules/markdown/index.js +22 -0
package/dist/browser/modules/markdown/parse/index.d.ts +70 -0
package/dist/browser/modules/markdown/parse/index.js +428 -0
package/dist/browser/modules/markdown/types.d.ts +130 -0
package/dist/browser/modules/markdown/types.js +6 -0
package/dist/cjs/index.js +5 -1
package/dist/cjs/modules/archive/compression/compress.browser.js +4 -4
package/dist/cjs/modules/archive/compression/deflate-fallback.js +664 -360
package/dist/cjs/modules/archive/compression/streaming-compress.browser.js +15 -2
package/dist/cjs/modules/archive/compression/streaming-compress.js +8 -0
package/dist/cjs/modules/archive/zip/stream.js +26 -2
package/dist/cjs/modules/excel/workbook.browser.js +226 -0
package/dist/cjs/modules/excel/workbook.js +46 -1
package/dist/cjs/modules/excel/xlsx/xlsx.browser.js +42 -4
package/dist/cjs/modules/markdown/constants.js +33 -0
package/dist/cjs/modules/markdown/errors.js +28 -0
package/dist/cjs/modules/markdown/format/index.js +310 -0
package/dist/cjs/modules/markdown/index.js +30 -0
package/dist/cjs/modules/markdown/parse/index.js +432 -0
package/dist/cjs/modules/markdown/types.js +7 -0
package/dist/esm/index.browser.js +2 -0
package/dist/esm/index.js +2 -0
package/dist/esm/modules/archive/compression/compress.browser.js +4 -4
package/dist/esm/modules/archive/compression/deflate-fallback.js +664 -360
package/dist/esm/modules/archive/compression/streaming-compress.browser.js +15 -3
package/dist/esm/modules/archive/compression/streaming-compress.js +7 -0
package/dist/esm/modules/archive/zip/stream.js +27 -3
package/dist/esm/modules/excel/workbook.browser.js +226 -0
package/dist/esm/modules/excel/workbook.js +47 -2
package/dist/esm/modules/excel/xlsx/xlsx.browser.js +42 -4
package/dist/esm/modules/markdown/constants.js +30 -0
package/dist/esm/modules/markdown/errors.js +23 -0
package/dist/esm/modules/markdown/format/index.js +307 -0
package/dist/esm/modules/markdown/index.js +22 -0
package/dist/esm/modules/markdown/parse/index.js +428 -0
package/dist/esm/modules/markdown/types.js +6 -0
package/dist/iife/excelts.iife.js +1342 -283
package/dist/iife/excelts.iife.js.map +1 -1
package/dist/iife/excelts.iife.min.js +38 -34
package/dist/types/index.browser.d.ts +3 -0
package/dist/types/index.d.ts +3 -0
package/dist/types/modules/archive/compression/deflate-fallback.d.ts +24 -22
package/dist/types/modules/archive/compression/streaming-compress.browser.d.ts +7 -0
package/dist/types/modules/archive/compression/streaming-compress.d.ts +5 -0
package/dist/types/modules/excel/workbook.browser.d.ts +72 -0
package/dist/types/modules/excel/workbook.d.ts +32 -1
package/dist/types/modules/markdown/constants.d.ts +30 -0
package/dist/types/modules/markdown/errors.d.ts +21 -0
package/dist/types/modules/markdown/format/index.d.ts +54 -0
package/dist/types/modules/markdown/index.d.ts +15 -0
package/dist/types/modules/markdown/parse/index.d.ts +70 -0
package/dist/types/modules/markdown/types.d.ts +130 -0
package/package.json +56 -32

package/dist/esm/modules/markdown/parse/index.js ADDED Viewed

@@ -0,0 +1,428 @@
+/**
+ * Markdown Table Parser
+ *
+ * Parses Markdown tables into structured data.
+ *
+ * Supports:
+ * - Standard GFM (GitHub Flavored Markdown) table syntax
+ * - Column alignment detection via separator row
+ * - Escaped pipes (`\|`) in cell content
+ * - Tables with or without leading/trailing pipes
+ * - Tolerant parsing (mismatched column counts, extra whitespace)
+ * - Multiline cell content via `<br>` / `<br/>` / `<br />` tags
+ *
+ * @example
+ * ```ts
+ * const result = parseMarkdown("| Name | Age |\n| --- | --- |\n| Alice | 30 |");
+ * // result.headers = ["Name", "Age"]
+ * // result.rows = [["Alice", "30"]]
+ * // result.alignments = ["none", "none"]
+ * ```
+ */
+import { BR_TAG_REGEX, LINEBREAK_REGEX, UNESCAPE_REGEX } from "../constants.js";
+import { MarkdownParseError } from "../errors.js";
// =============================================================================
// Character Codes
//
// UTF-16 code units of the characters the scanners below compare against via
// `charCodeAt()`. Naming them keeps bare numeric literals out of the loops.
// =============================================================================
const CH_PIPE = 124; // "|"
const CH_BACKSLASH = 92; // "\"
const CH_COLON = 58; // ":"
const CH_DASH = 45; // "-"
const CH_SPACE = 32; // " "
const CH_TAB = 9; // "\t"
/**
 * Normalize caller-supplied parse options into the internal option record.
 *
 * Defaults: `trim`, `unescape` and `skipEmpty` are on unless the caller passes
 * exactly `false`; `convertBr` is off unless the caller passes exactly `true`.
 *
 * @param options - User options object; `null` and `undefined` are treated as `{}`
 * @returns Record with `trim`, `unescape`, `skipEmpty`, `maxRows`, `convertBr`
 */
function resolveParseOpts(options) {
    // A default parameter (`options = {}`) only covers `undefined`, so an
    // explicit `null` would otherwise throw on the first property read.
    const source = options == null ? {} : options;
    return {
        trim: source.trim !== false,
        unescape: source.unescape !== false,
        // Public name is `skipEmptyRows`; the internal record calls it `skipEmpty`.
        skipEmpty: source.skipEmptyRows !== false,
        // Normalize `null` to `undefined` ("no limit"). The row loop tests
        // `maxRows !== undefined && rows.length >= maxRows`, and `0 >= null` is
        // true in JavaScript, so a `null` limit would silently drop every row.
        maxRows: source.maxRows == null ? undefined : source.maxRows,
        convertBr: source.convertBr === true
    };
}
// =============================================================================
// Internal Helpers
// =============================================================================
/**
 * Break one table row into its raw cell strings.
 *
 * A single leading pipe and a single unescaped trailing pipe are treated as
 * row borders and dropped. Every other unescaped pipe is a cell boundary.
 * A backslash followed by another character inside the scanned range forms an
 * escape pair that is skipped as a unit, so `\|` never splits a cell. Escape
 * pairs are copied into the cell verbatim; nothing is unescaped or trimmed here.
 *
 * Each cell is taken with one `slice()` between boundary indexes, so the scan
 * is a single pass over the line.
 *
 * @param line - Row text (callers pass an already-trimmed line)
 * @returns Array of raw cell strings; always contains at least one element
 */
function splitRow(line) {
    const length = line.length;
    // Decide where scanning stops. A final pipe is a border only when it is
    // preceded by an even number of backslashes (0, 2, 4, ...): with an odd
    // count the last backslash escapes the pipe, which then belongs to the cell.
    let stop = length;
    if (length > 1 && line.charCodeAt(length - 1) === CH_PIPE) {
        let probe = length - 2;
        while (probe >= 0 && line.charCodeAt(probe) === CH_BACKSLASH) {
            probe--;
        }
        const precedingBackslashes = length - 2 - probe;
        if (precedingBackslashes % 2 === 0) {
            stop = length - 1;
        }
    }
    // Step over the leading border pipe, if present.
    let pos = length > 0 && line.charCodeAt(0) === CH_PIPE ? 1 : 0;
    let cellStart = pos;
    const cells = [];
    while (pos < stop) {
        const code = line.charCodeAt(pos);
        if (code === CH_BACKSLASH && pos + 1 < stop) {
            // Escape pair: consume both characters so an escaped pipe is not a boundary.
            pos += 2;
            continue;
        }
        if (code === CH_PIPE) {
            cells.push(line.slice(cellStart, pos));
            cellStart = pos + 1;
        }
        pos++;
    }
    // Whatever follows the last boundary is the final cell (possibly empty).
    cells.push(line.slice(cellStart, stop));
    return cells;
}
/**
 * Derive a column's alignment from its separator cell.
 *
 * Only the first and last characters of the trimmed cell are inspected:
 *
 * - colon on both ends → "center"
 * - colon at the start only → "left"
 * - colon at the end only → "right"
 * - no colon, or an empty cell → "none"
 *
 * @param cell - Raw separator cell text
 * @returns One of "left", "center", "right", "none"
 */
function parseAlignment(cell) {
    const marker = cell.trim();
    if (marker.length === 0) {
        return "none";
    }
    const startsWithColon = marker.charCodeAt(0) === CH_COLON;
    const endsWithColon = marker.charCodeAt(marker.length - 1) === CH_COLON;
    if (startsWithColon) {
        return endsWithColon ? "center" : "left";
    }
    return endsWithColon ? "right" : "none";
}
/**
 * Decide whether a cell is a valid separator cell.
 *
 * Accepted shape: optional spaces/tabs, an optional colon, one or more dashes,
 * an optional colon, optional spaces/tabs. The check is done with character
 * code comparisons rather than a regular expression.
 *
 * @param cell - Raw cell text from the candidate separator row
 * @returns `true` when the cell matches the separator shape
 */
function isSeparatorCell(cell) {
    const isBlank = (code) => code === CH_SPACE || code === CH_TAB;
    let lo = 0;
    let hi = cell.length;
    // Shrink the window past surrounding spaces/tabs.
    while (lo < hi && isBlank(cell.charCodeAt(lo))) {
        lo++;
    }
    while (hi > lo && isBlank(cell.charCodeAt(hi - 1))) {
        hi--;
    }
    // Peel at most one alignment colon off each end.
    if (lo < hi && cell.charCodeAt(lo) === CH_COLON) {
        lo++;
    }
    if (hi > lo && cell.charCodeAt(hi - 1) === CH_COLON) {
        hi--;
    }
    // What remains must be a non-empty run made only of dashes.
    if (lo === hi) {
        return false;
    }
    for (let k = lo; k < hi; k++) {
        if (cell.charCodeAt(k) !== CH_DASH) {
            return false;
        }
    }
    return true;
}
/**
 * Decide whether a list of cells forms a separator row.
 *
 * The row qualifies when it has at least one cell and every cell passes
 * `isSeparatorCell`.
 *
 * @param cells - Cells produced by splitting the candidate separator line
 * @returns `true` when all cells are separator cells
 */
function isSeparatorRow(cells) {
    if (cells.length === 0) {
        return false;
    }
    for (const cell of cells) {
        if (!isSeparatorCell(cell)) {
            return false;
        }
    }
    return true;
}
/**
 * Turn a raw cell string into its final value.
 *
 * Steps run in this order, each only when its option is enabled:
 * 1. `trim` — strip surrounding whitespace
 * 2. `unescape` — replace every `UNESCAPE_REGEX` match with its first capture group
 * 3. `convertBr` — replace every `BR_TAG_REGEX` match with a newline
 *
 * @param value - Raw cell text
 * @param opts - Resolved parse options
 * @returns The processed cell text
 */
function processCell(value, opts) {
    const { trim, unescape, convertBr } = opts;
    let text = value;
    if (trim) {
        text = text.trim();
    }
    if (unescape) {
        text = text.replace(UNESCAPE_REGEX, "$1");
    }
    if (convertBr) {
        text = text.replace(BR_TAG_REGEX, "\n");
    }
    return text;
}
/**
 * Fit a row to the table's column count.
 *
 * Cells that exist are run through `processCell`; cells beyond `columnCount`
 * are discarded, and missing cells are filled with empty strings.
 *
 * @param cells - Raw cells of one data row
 * @param columnCount - Number of columns the result must have
 * @param opts - Resolved parse options forwarded to `processCell`
 * @returns Array of exactly `columnCount` processed cell strings
 */
function normalizeRow(cells, columnCount, opts) {
    const normalized = [];
    const available = Math.min(cells.length, columnCount);
    for (let col = 0; col < available; col++) {
        normalized.push(processCell(cells[col], opts));
    }
    // Pad short rows so every row has the same width as the header.
    while (normalized.length < columnCount) {
        normalized.push("");
    }
    return normalized;
}
/**
 * Report whether every cell in a row is the empty string.
 *
 * @param row - Processed row
 * @returns `true` when no cell differs from `""` (also for a zero-length row)
 */
function isEmptyRow(row) {
    for (const cell of row) {
        if (cell !== "") {
            return false;
        }
    }
    return true;
}
/**
 * Report whether a line contains a pipe character anywhere, which is the
 * minimum requirement for it to be treated as a table line.
 *
 * @param line - Line text
 * @returns `true` when the line contains `|`
 */
function isTableLine(line) {
    return line.includes("|");
}
/**
 * Report whether the first character after any leading spaces/tabs is a pipe.
 * The table parser uses this to tell "piped" rows from bare ones.
 *
 * @param line - Line text
 * @returns `true` when the first non-blank character is `|`; `false` for a
 *          blank or empty line
 */
function startsWithPipe(line) {
    const length = line.length;
    let pos = 0;
    while (pos < length) {
        const code = line.charCodeAt(pos);
        if (code !== CH_SPACE && code !== CH_TAB) {
            break;
        }
        pos++;
    }
    return pos < length && line.charCodeAt(pos) === CH_PIPE;
}
/**
 * Report whether a line contains a dash anywhere, a cheap pre-check before
 * the line is split and validated as a separator row.
 *
 * @param line - Line text
 * @returns `true` when the line contains `-`
 */
function hasDash(line) {
    return line.includes("-");
}
// =============================================================================
// Core Table Parser (shared between parseMarkdown and parseMarkdownAll)
// =============================================================================
/**
 * Try to read a table whose header row is `lines[startLine]`.
 *
 * A table is recognized when the trimmed header line contains a pipe and the
 * trimmed next line contains a dash and splits into separator cells only.
 * The column count is the number of header cells; separator cells beyond or
 * short of that count are tolerated (missing ones yield alignment "none").
 *
 * @param lines - All lines of the input
 * @param startLine - Index of the candidate header line
 * @param lineCount - Number of lines in `lines`
 * @param opts - Resolved parse options
 * @returns `{ result: { headers, rows, alignments }, endLine }` where `endLine`
 *          is the index of the first line after the table, or `null` when no
 *          table starts at `startLine`
 */
function parseTableAt(lines, startLine, lineCount, opts) {
    // A table needs at least a header line and a separator line.
    if (startLine >= lineCount - 1) {
        return null;
    }
    const headerLine = lines[startLine].trim();
    if (headerLine === "" || !isTableLine(headerLine)) {
        return null;
    }
    const headerCells = splitRow(headerLine);
    if (headerCells.length < 1) {
        return null;
    }
    const separatorLine = lines[startLine + 1].trim();
    if (separatorLine === "" || !hasDash(separatorLine)) {
        return null;
    }
    const separatorCells = splitRow(separatorLine);
    if (!isSeparatorRow(separatorCells)) {
        return null;
    }
    // Header and separator are valid: collect header text and alignments.
    const columnCount = headerCells.length;
    const headers = [];
    const alignments = [];
    headerCells.forEach((cell, col) => {
        headers.push(processCell(cell, opts));
        alignments.push(col < separatorCells.length ? parseAlignment(separatorCells[col]) : "none");
    });
    // When the header begins with `|`, data rows must too. This keeps prose
    // such as "This has a | pipe" from being absorbed as a data row.
    const piped = startsWithPipe(headerLine);
    const belongsToTable = (text) => text !== "" && isTableLine(text) && (!piped || startsWithPipe(text));
    const rows = [];
    let cursor = startLine + 2;
    while (cursor < lineCount) {
        const dataLine = lines[cursor].trim();
        // A blank line or a line that is not a table row ends the table.
        if (!belongsToTable(dataLine)) {
            break;
        }
        if (opts.maxRows !== undefined && rows.length >= opts.maxRows) {
            // Row limit reached: step over the rest of this table without
            // parsing it so `endLine` still points past the whole table.
            do {
                cursor++;
            } while (cursor < lineCount && belongsToTable(lines[cursor].trim()));
            break;
        }
        const row = normalizeRow(splitRow(dataLine), columnCount, opts);
        if (!(opts.skipEmpty && isEmptyRow(row))) {
            rows.push(row);
        }
        cursor++;
    }
    return { result: { headers, rows, alignments }, endLine: cursor };
}
// =============================================================================
// Main Parser
// =============================================================================
/**
 * Parse the first Markdown table found in a string.
 *
 * The input is split into lines with `LINEBREAK_REGEX`, then each line in turn
 * is tried as a header row until one is followed by a valid separator row:
 * 1. header row (pipe-delimited cells)
 * 2. separator row (dashes, optional colons for alignment)
 * 3. zero or more data rows
 *
 * Text before and after that table is ignored.
 *
 * @param input - Markdown string containing a table
 * @param options - Parse options
 * @returns Parsed table with `headers`, `rows` and `alignments`
 *
 * @throws {MarkdownParseError} When no valid table is found; the line count
 *         (at least 1) is passed as the error's second argument
 *
 * @example
 * ```ts
 * // Basic table
 * const basic = parseMarkdown("| Name | Age |\n| --- | --- |\n| Alice | 30 |");
 *
 * // Alignment markers
 * const aligned = parseMarkdown("| Left | Center | Right |\n|:---|:---:|---:|\n|a|b|c|");
 * // aligned.alignments = ["left", "center", "right"]
 *
 * // Options
 * const limited = parseMarkdown(input, { trim: false, maxRows: 100 });
 * ```
 */
export function parseMarkdown(input, options = {}) {
    const opts = resolveParseOpts(options);
    const lines = input.split(LINEBREAK_REGEX);
    const lineCount = lines.length;
    let candidate = 0;
    // The last line can never be a header because no separator can follow it.
    while (candidate < lineCount - 1) {
        const parsed = parseTableAt(lines, candidate, lineCount, opts);
        if (parsed) {
            return parsed.result;
        }
        candidate++;
    }
    throw new MarkdownParseError("No valid Markdown table found in input", Math.max(lineCount, 1));
}
/**
 * Parse every Markdown table found in a document.
 *
 * Lines are scanned top to bottom. When a table is recognized, scanning
 * resumes at the first line after it; otherwise it moves on by one line.
 * Unlike `parseMarkdown`, finding no table is not an error.
 *
 * @param input - Markdown string containing zero or more tables
 * @param options - Parse options (`maxRows` applies to each table separately)
 * @returns Array of parsed tables in document order; empty when none are found
 *
 * @example
 * ```ts
 * const tables = parseMarkdownAll(markdownDoc);
 * console.log(`Found ${tables.length} tables`);
 * tables.forEach((t, i) => console.log(`Table ${i}: ${t.headers.join(", ")}`));
 * ```
 */
export function parseMarkdownAll(input, options = {}) {
    const opts = resolveParseOpts(options);
    const lines = input.split(LINEBREAK_REGEX);
    const lineCount = lines.length;
    const tables = [];
    for (let cursor = 0; cursor < lineCount - 1;) {
        const parsed = parseTableAt(lines, cursor, lineCount, opts);
        if (!parsed) {
            cursor++;
            continue;
        }
        tables.push(parsed.result);
        // Jump past the table that was just consumed.
        cursor = parsed.endLine;
    }
    return tables;
}

package/dist/esm/modules/markdown/types.js ADDED Viewed

@@ -0,0 +1,6 @@
+/**
+ * Markdown Types
+ *
+ * Centralized type definitions for the Markdown module.
+ */
+export {};