npm - @js-ak/excel-toolbox - Versions diffs - 1.6.0 → 1.7.0 - Mend

@js-ak/excel-toolbox 1.6.0 → 1.7.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (33) hide show

package/build/cjs/lib/merge-sheets-to-base-file-process-sync.js ADDED Viewed

@@ -0,0 +1,105 @@
+"use strict";
+var __createBinding = (this && this.__createBinding) || (Object.create ? (function(o, m, k, k2) {
+    if (k2 === undefined) k2 = k;
+    var desc = Object.getOwnPropertyDescriptor(m, k);
+    if (!desc || ("get" in desc ? !m.__esModule : desc.writable || desc.configurable)) {
+      desc = { enumerable: true, get: function() { return m[k]; } };
+    }
+    Object.defineProperty(o, k2, desc);
+}) : (function(o, m, k, k2) {
+    if (k2 === undefined) k2 = k;
+    o[k2] = m[k];
+}));
+var __setModuleDefault = (this && this.__setModuleDefault) || (Object.create ? (function(o, v) {
+    Object.defineProperty(o, "default", { enumerable: true, value: v });
+}) : function(o, v) {
+    o["default"] = v;
+});
+var __importStar = (this && this.__importStar) || (function () {
+    var ownKeys = function(o) {
+        ownKeys = Object.getOwnPropertyNames || function (o) {
+            var ar = [];
+            for (var k in o) if (Object.prototype.hasOwnProperty.call(o, k)) ar[ar.length] = k;
+            return ar;
+        };
+        return ownKeys(o);
+    };
+    return function (mod) {
+        if (mod && mod.__esModule) return mod;
+        var result = {};
+        if (mod != null) for (var k = ownKeys(mod), i = 0; i < k.length; i++) if (k[i] !== "default") __createBinding(result, mod, k[i]);
+        __setModuleDefault(result, mod);
+        return result;
+    };
+})();
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.mergeSheetsToBaseFileProcessSync = mergeSheetsToBaseFileProcessSync;
+const Utils = __importStar(require("./utils/index.js"));
+const Xml = __importStar(require("./xml/index.js"));
+/**
+ * Merges rows from other Excel files into a base Excel file.
+ *
+ * This is the synchronous variant of mergeSheetsToBaseFileProcess (it uses Xml.extractRowsFromSheetSync).
+ * It takes a single object with the following properties:
+ * - additions: An array of objects with two properties:
+ *   - files: A dictionary of file paths to their corresponding sheet content (handed to Xml.extractRowsFromSheetSync)
+ *   - sheetIndexes: The 1-based indexes of the sheets to extract rows from
+ * - baseFiles: A dictionary of file paths to their corresponding content; it is modified in place
+ * - baseSheetIndex: The 1-based index of the sheet in the base file to add rows to
+ * - gap: The number of empty rows to insert between each added section
+ * - sheetNamesToRemove: The names of sheets to remove from the output file
+ * - sheetsToRemove: The 1-based indices of sheets to remove from the output file
+ *
+ * The function returns nothing (baseFiles is updated in place) and throws an Error if the base sheet or an addition sheet is missing.
+ */
+function mergeSheetsToBaseFileProcessSync(data) {
+    const { additions, baseFiles, baseSheetIndex, gap, sheetNamesToRemove, sheetsToRemove, } = data;
+    const basePath = `xl/worksheets/sheet${baseSheetIndex}.xml`;
+    if (!baseFiles[basePath]) {
+        throw new Error(`Base file does not contain ${basePath}`);
+    }
+    const { lastRowNumber, mergeCells: baseMergeCells, rows: baseRows, xml, } = Xml.extractRowsFromSheetSync(baseFiles[basePath]);
+    const allRows = [...baseRows];
+    const allMergeCells = [...baseMergeCells];
+    let currentRowOffset = lastRowNumber + gap; // offset handed to Xml.shiftRowIndices / Utils.shiftCellRef for the next appended sheet
+    for (const { files, sheetIndexes } of additions) {
+        for (const sheetIndex of sheetIndexes) {
+            const sheetPath = `xl/worksheets/sheet${sheetIndex}.xml`;
+            if (!files[sheetPath]) {
+                throw new Error(`File does not contain ${sheetPath}`);
+            }
+            const { mergeCells, rows } = Xml.extractRowsFromSheetSync(files[sheetPath]);
+            const shiftedRows = Xml.shiftRowIndices(rows, currentRowOffset);
+            const shiftedMergeCells = mergeCells.map(cell => {
+                const [start, end] = cell.ref.split(":");
+                if (!start || !end) { // ref is not a "start:end" pair, so the cell is kept unshifted
+                    return cell;
+                }
+                const shiftedStart = Utils.shiftCellRef(start, currentRowOffset);
+                const shiftedEnd = Utils.shiftCellRef(end, currentRowOffset);
+                return { ...cell, ref: `${shiftedStart}:${shiftedEnd}` };
+            });
+            allRows.push(...shiftedRows);
+            allMergeCells.push(...shiftedMergeCells);
+            currentRowOffset += Utils.getMaxRowNumber(rows) + gap; // advance the offset for the next sheet; computed from the unshifted rows
+        }
+    }
+    const mergedXml = Xml.buildMergedSheet(xml, allRows, allMergeCells);
+    baseFiles[basePath] = mergedXml; // overwrite the base sheet entry in place
+    for (const sheetIndex of sheetsToRemove) {
+        const sheetPath = `xl/worksheets/sheet${sheetIndex}.xml`;
+        delete baseFiles[sheetPath];
+        if (baseFiles["xl/workbook.xml"]) {
+            baseFiles["xl/workbook.xml"] = Buffer.from(Utils.removeSheetFromWorkbook(baseFiles["xl/workbook.xml"].toString(), sheetIndex));
+        }
+        if (baseFiles["xl/_rels/workbook.xml.rels"]) {
+            baseFiles["xl/_rels/workbook.xml.rels"] = Buffer.from(Utils.removeSheetFromRels(baseFiles["xl/_rels/workbook.xml.rels"].toString(), sheetIndex));
+        }
+        if (baseFiles["[Content_Types].xml"]) {
+            baseFiles["[Content_Types].xml"] = Buffer.from(Utils.removeSheetFromContentTypes(baseFiles["[Content_Types].xml"].toString(), sheetIndex));
+        }
+    }
+    for (const sheetName of sheetNamesToRemove) {
+        Utils.removeSheetByName(baseFiles, sheetName);
+    }
+}

package/build/cjs/lib/merge-sheets-to-base-file-process.js CHANGED Viewed

@@ -52,13 +52,13 @@ const Xml = __importStar(require("./xml/index.js"));
  *
  * The function returns a dictionary of file paths to their corresponding XML content.
  */
-function mergeSheetsToBaseFileProcess(data) {
+async function mergeSheetsToBaseFileProcess(data) {
     const { additions, baseFiles, baseSheetIndex, gap, sheetNamesToRemove, sheetsToRemove, } = data;
     const basePath = `xl/worksheets/sheet${baseSheetIndex}.xml`;
     if (!baseFiles[basePath]) {
         throw new Error(`Base file does not contain ${basePath}`);
     }
-    const { lastRowNumber, mergeCells: baseMergeCells, rows: baseRows, xml, } = Xml.extractRowsFromSheet(baseFiles[basePath]);
+    const { lastRowNumber, mergeCells: baseMergeCells, rows: baseRows, xml, } = await Xml.extractRowsFromSheet(baseFiles[basePath]);
     const allRows = [...baseRows];
     const allMergeCells = [...baseMergeCells];
     let currentRowOffset = lastRowNumber + gap;
@@ -68,7 +68,7 @@ function mergeSheetsToBaseFileProcess(data) {
             if (!files[sheetPath]) {
                 throw new Error(`File does not contain ${sheetPath}`);
             }
-            const { mergeCells, rows } = Xml.extractRowsFromSheet(files[sheetPath]);
+            const { mergeCells, rows } = await Xml.extractRowsFromSheet(files[sheetPath]);
             const shiftedRows = Xml.shiftRowIndices(rows, currentRowOffset);
             const shiftedMergeCells = mergeCells.map(cell => {
                 const [start, end] = cell.ref.split(":");

package/build/cjs/lib/merge-sheets-to-base-file-sync.js CHANGED Viewed

@@ -36,7 +36,7 @@ Object.defineProperty(exports, "__esModule", { value: true });
 exports.mergeSheetsToBaseFileSync = mergeSheetsToBaseFileSync;
 const Utils = __importStar(require("./utils/index.js"));
 const Zip = __importStar(require("./zip/index.js"));
-const merge_sheets_to_base_file_process_js_1 = require("./merge-sheets-to-base-file-process.js");
+const merge_sheets_to_base_file_process_sync_js_1 = require("./merge-sheets-to-base-file-process-sync.js");
 /**
  * Merge rows from other Excel files into a base Excel file.
  * The output is a new Excel file with the merged content.
@@ -65,7 +65,7 @@ function mergeSheetsToBaseFileSync(data) {
             sheetIndexes,
         });
     }
-    (0, merge_sheets_to_base_file_process_js_1.mergeSheetsToBaseFileProcess)({
+    (0, merge_sheets_to_base_file_process_sync_js_1.mergeSheetsToBaseFileProcessSync)({
         additions: additionsUpdated,
         baseFiles,
         baseSheetIndex,

package/build/cjs/lib/merge-sheets-to-base-file.js CHANGED Viewed

@@ -65,7 +65,7 @@ async function mergeSheetsToBaseFile(data) {
             sheetIndexes,
         });
     }
-    (0, merge_sheets_to_base_file_process_js_1.mergeSheetsToBaseFileProcess)({
+    await (0, merge_sheets_to_base_file_process_js_1.mergeSheetsToBaseFileProcess)({
         additions: additionsUpdated,
         baseFiles,
         baseSheetIndex,

package/build/cjs/lib/template/template-fs.js CHANGED Viewed

@@ -165,13 +165,13 @@ class TemplateFs {
      */
     async #getSheetPathByName(sheetName) {
         // Read XML workbook to find sheet name and path
-        const workbookXml = Xml.extractXmlFromSheet(await this.#readFile(this.#excelKeys.workbook));
+        const workbookXml = await Xml.extractXmlFromSheet(await this.#readFile(this.#excelKeys.workbook));
         const sheetMatch = workbookXml.match(Utils.sheetMatch(sheetName));
         if (!sheetMatch || !sheetMatch[1]) {
             throw new Error(`Sheet "${sheetName}" not found`);
         }
         const rId = sheetMatch[1];
-        const relsXml = Xml.extractXmlFromSheet(await this.#readFile(this.#excelKeys.workbookRels));
+        const relsXml = await Xml.extractXmlFromSheet(await this.#readFile(this.#excelKeys.workbookRels));
         const relMatch = relsXml.match(Utils.relationshipMatch(rId));
         if (!relMatch || !relMatch[1]) {
             throw new Error(`Relationship "${rId}" not found`);
@@ -230,10 +230,10 @@ class TemplateFs {
         let sharedStringsContent = "";
         let sheetContent = "";
         if (this.fileKeys.has(sharedStringsPath)) {
-            sharedStringsContent = Xml.extractXmlFromSheet(await this.#readFile(sharedStringsPath));
+            sharedStringsContent = await Xml.extractXmlFromSheet(await this.#readFile(sharedStringsPath));
         }
         if (this.fileKeys.has(sheetPath)) {
-            sheetContent = Xml.extractXmlFromSheet(await this.#readFile(sheetPath));
+            sheetContent = await Xml.extractXmlFromSheet(await this.#readFile(sheetPath));
             const TABLE_REGEX = /\$\{table:([a-zA-Z0-9_]+)\.([a-zA-Z0-9_]+)\}/g;
             const hasTablePlaceholders = TABLE_REGEX.test(sharedStringsContent) || TABLE_REGEX.test(sheetContent);
             if (hasTablePlaceholders) {
@@ -290,7 +290,7 @@ class TemplateFs {
             }
             // Read workbook.xml and find the source sheet
             const workbookXmlPath = this.#excelKeys.workbook;
-            const workbookXml = Xml.extractXmlFromSheet(await this.#readFile(workbookXmlPath));
+            const workbookXml = await Xml.extractXmlFromSheet(await this.#readFile(workbookXmlPath));
             // Find the source sheet
             const sheetMatch = workbookXml.match(Utils.sheetMatch(sourceName));
             if (!sheetMatch || !sheetMatch[1]) {
@@ -304,7 +304,7 @@ class TemplateFs {
             // Find the source sheet path by rId
             const rId = sheetMatch[1];
             const relsXmlPath = this.#excelKeys.workbookRels;
-            const relsXml = Xml.extractXmlFromSheet(await this.#readFile(relsXmlPath));
+            const relsXml = await Xml.extractXmlFromSheet(await this.#readFile(relsXmlPath));
             const relMatch = relsXml.match(Utils.relationshipMatch(rId));
             if (!relMatch || !relMatch[1]) {
                 throw new Error(`Relationship "${rId}" not found`);
@@ -339,7 +339,7 @@ class TemplateFs {
             // Read [Content_Types].xml
             // Update [Content_Types].xml
             const contentTypesPath = this.#excelKeys.contentTypes;
-            const contentTypesXml = Xml.extractXmlFromSheet(await this.#readFile(contentTypesPath));
+            const contentTypesXml = await Xml.extractXmlFromSheet(await this.#readFile(contentTypesPath));
             const overrideTag = `<Override PartName="/xl/worksheets/${newSheetFilename}" ContentType="application/vnd.openxmlformats-officedocument.spreadsheetml.worksheet+xml"/>`;
             const updatedContentTypesXml = contentTypesXml.replace("</Types>", overrideTag + "</Types>");
             await this.#set(contentTypesPath, updatedContentTypesXml);
@@ -398,7 +398,7 @@ class TemplateFs {
             // Find the sheet
             const sheetPath = await this.#getSheetPathByName(sheetName);
             const sheetXmlRaw = await this.#readFile(sheetPath);
-            const sheetXml = Xml.extractXmlFromSheet(sheetXmlRaw);
+            const sheetXml = await Xml.extractXmlFromSheet(sheetXmlRaw);
             let nextRow = 0;
             if (!startRowNumber) {
                 // Find the last row

package/build/cjs/lib/template/template-memory.js CHANGED Viewed

@@ -140,7 +140,7 @@ class TemplateMemory {
      * @throws {Error} If the file key is not found.
      * @experimental This API is experimental and might change in future versions.
      */
-    #extractXmlFromSheet(fileKey) {
+    async #extractXmlFromSheet(fileKey) {
         if (!this.files[fileKey]) {
             throw new Error(`${fileKey} not found`);
         }
@@ -158,7 +158,7 @@ class TemplateMemory {
      * @throws {Error} If the file key is not found
      * @experimental This API is experimental and might change in future versions.
      */
-    #extractRowsFromSheet(fileKey) {
+    async #extractRowsFromSheet(fileKey) {
         if (!this.files[fileKey]) {
             throw new Error(`${fileKey} not found`);
         }
@@ -172,15 +172,15 @@ class TemplateMemory {
      * @throws {Error} If the sheet with the given name does not exist.
      * @experimental This API is experimental and might change in future versions.
      */
-    #getSheetPathByName(sheetName) {
+    async #getSheetPathByName(sheetName) {
         // Find the sheet
-        const workbookXml = this.#extractXmlFromSheet(this.#excelKeys.workbook);
+        const workbookXml = await this.#extractXmlFromSheet(this.#excelKeys.workbook);
         const sheetMatch = workbookXml.match(Utils.sheetMatch(sheetName));
         if (!sheetMatch || !sheetMatch[1]) {
             throw new Error(`Sheet "${sheetName}" not found`);
         }
         const rId = sheetMatch[1];
-        const relsXml = this.#extractXmlFromSheet(this.#excelKeys.workbookRels);
+        const relsXml = await this.#extractXmlFromSheet(this.#excelKeys.workbookRels);
         const relMatch = relsXml.match(Utils.relationshipMatch(rId));
         if (!relMatch || !relMatch[1]) {
             throw new Error(`Relationship "${rId}" not found`);
@@ -233,11 +233,11 @@ class TemplateMemory {
         let sharedStringsContent = "";
         let sheetContent = "";
         if (this.files[sharedStringsPath]) {
-            sharedStringsContent = this.#extractXmlFromSheet(sharedStringsPath);
+            sharedStringsContent = await this.#extractXmlFromSheet(sharedStringsPath);
         }
-        const sheetPath = this.#getSheetPathByName(sheetName);
+        const sheetPath = await this.#getSheetPathByName(sheetName);
         if (this.files[sheetPath]) {
-            sheetContent = this.#extractXmlFromSheet(sheetPath);
+            sheetContent = await this.#extractXmlFromSheet(sheetPath);
             const TABLE_REGEX = /\$\{table:([a-zA-Z0-9_]+)\.([a-zA-Z0-9_]+)\}/g;
             const hasTablePlaceholders = TABLE_REGEX.test(sharedStringsContent) || TABLE_REGEX.test(sheetContent);
             if (hasTablePlaceholders) {
@@ -272,11 +272,11 @@ class TemplateMemory {
      * @throws {Error} If no sheets are found to merge.
      * @experimental This API is experimental and might change in future versions.
      */
-    #mergeSheets(data) {
+    async #mergeSheets(data) {
         const { additions, baseSheetIndex = 1, baseSheetName, gap = 0, } = data;
         let fileKey = "";
         if (baseSheetName) {
-            fileKey = this.#getSheetPathByName(baseSheetName);
+            fileKey = await this.#getSheetPathByName(baseSheetName);
         }
         if (baseSheetIndex && !fileKey) {
             if (baseSheetIndex < 1) {
@@ -287,16 +287,16 @@ class TemplateMemory {
         if (!fileKey) {
             throw new Error("Base sheet not found");
         }
-        const { lastRowNumber, mergeCells: baseMergeCells, rows: baseRows, xml, } = this.#extractRowsFromSheet(fileKey);
+        const { lastRowNumber, mergeCells: baseMergeCells, rows: baseRows, xml, } = await this.#extractRowsFromSheet(fileKey);
         const allRows = [...baseRows];
         const allMergeCells = [...baseMergeCells];
         let currentRowOffset = lastRowNumber + gap;
         const sheetPaths = [];
         if (additions.sheetIndexes) {
-            sheetPaths.push(...(additions.sheetIndexes).map(e => this.#getSheetPathById(e)));
+            sheetPaths.push(...(await Promise.all(additions.sheetIndexes.map(e => this.#getSheetPathById(e)))));
         }
         if (additions.sheetNames) {
-            sheetPaths.push(...(additions.sheetNames).map(e => this.#getSheetPathByName(e)));
+            sheetPaths.push(...(await Promise.all(additions.sheetNames.map(e => this.#getSheetPathByName(e)))));
         }
         if (sheetPaths.length === 0) {
             throw new Error("No sheets found to merge");
@@ -305,7 +305,7 @@ class TemplateMemory {
             if (!this.files[sheetPath]) {
                 throw new Error(`Sheet "${sheetPath}" not found`);
             }
-            const { mergeCells, rows } = Xml.extractRowsFromSheet(this.files[sheetPath]);
+            const { mergeCells, rows } = await Xml.extractRowsFromSheet(this.files[sheetPath]);
             const shiftedRows = Xml.shiftRowIndices(rows, currentRowOffset);
             const shiftedMergeCells = mergeCells.map(cell => {
                 const [start, end] = cell.ref.split(":");
@@ -377,7 +377,7 @@ class TemplateMemory {
             }
             // Read workbook.xml and find the source sheet
             const workbookXmlPath = this.#excelKeys.workbook;
-            const workbookXml = this.#extractXmlFromSheet(this.#excelKeys.workbook);
+            const workbookXml = await this.#extractXmlFromSheet(this.#excelKeys.workbook);
             // Find the source sheet
             const sheetMatch = workbookXml.match(Utils.sheetMatch(sourceName));
             if (!sheetMatch || !sheetMatch[1]) {
@@ -391,7 +391,7 @@ class TemplateMemory {
             // Find the source sheet path by rId
             const rId = sheetMatch[1];
             const relsXmlPath = this.#excelKeys.workbookRels;
-            const relsXml = this.#extractXmlFromSheet(this.#excelKeys.workbookRels);
+            const relsXml = await this.#extractXmlFromSheet(this.#excelKeys.workbookRels);
             const relMatch = relsXml.match(Utils.relationshipMatch(rId));
             if (!relMatch || !relMatch[1]) {
                 throw new Error(`Relationship "${rId}" not found`);
@@ -433,7 +433,7 @@ class TemplateMemory {
             // Read [Content_Types].xml
             // Update [Content_Types].xml
             const contentTypesPath = "[Content_Types].xml";
-            const contentTypesXml = this.#extractXmlFromSheet(contentTypesPath);
+            const contentTypesXml = await this.#extractXmlFromSheet(contentTypesPath);
             const overrideTag = `<Override PartName="/xl/worksheets/${newSheetFilename}" ContentType="application/vnd.openxmlformats-officedocument.spreadsheetml.worksheet+xml"/>`;
             const updatedContentTypesXml = contentTypesXml.replace("</Types>", overrideTag + "</Types>");
             await this.#set(contentTypesPath, Buffer.from(updatedContentTypesXml));
@@ -490,8 +490,8 @@ class TemplateMemory {
             Utils.checkStartRow(startRowNumber);
             Utils.checkRows(preparedRows);
             // Find the sheet
-            const sheetPath = this.#getSheetPathByName(sheetName);
-            const sheetXml = this.#extractXmlFromSheet(sheetPath);
+            const sheetPath = await this.#getSheetPathByName(sheetName);
+            const sheetXml = await this.#extractXmlFromSheet(sheetPath);
             let nextRow = 0;
             if (!startRowNumber) {
                 // Find the last row
@@ -554,8 +554,8 @@ class TemplateMemory {
             if (!sheetName)
                 throw new Error("Sheet name is required");
             // Read XML workbook to find sheet name and path
-            const sheetPath = this.#getSheetPathByName(sheetName);
-            const sheetXml = this.#extractXmlFromSheet(sheetPath);
+            const sheetPath = await this.#getSheetPathByName(sheetName);
+            const sheetXml = await this.#extractXmlFromSheet(sheetPath);
             const output = new memory_write_stream_js_1.MemoryWriteStream();
             let inserted = false;
             // --- Case 1: <sheetData>...</sheetData> on one line ---

package/build/cjs/lib/xml/extract-rows-from-sheet-sync.js ADDED Viewed

@@ -0,0 +1,67 @@
+"use strict";
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.extractRowsFromSheetSync = extractRowsFromSheetSync;
+const extract_xml_from_sheet_sync_js_1 = require("./extract-xml-from-sheet-sync.js");
+/**
+ * Parses a worksheet (either as Buffer or string) to extract row data,
+ * last row number, and merge cell information from Excel XML format.
+ *
+ * This function is particularly useful for processing Excel files in
+ * Open XML Spreadsheet format (.xlsx).
+ *
+ * @param {Buffer|string} sheet - The worksheet content to parse, either as:
+ *                               - Buffer (converted to XML via extractXmlFromSheetSync)
+ *                               - string (raw XML content, used as-is)
+ * @returns {{
+ *   rows: string[],
+ *   lastRowNumber: number,
+ *   mergeCells: {ref: string}[], xml: string
+ * }} An object containing:
+ *   - rows: Array of raw XML strings for each <row> element inside <sheetData>
+ *   - lastRowNumber: Highest r="..." row number found among the rows (0 when no row has one)
+ *   - mergeCells: Array of merged cell ranges (e.g., [{ref: "A1:B2"}]); xml: the worksheet XML string that was parsed
+ * @throws {Error} If the sheetData section is not found in the XML
+ */
+function extractRowsFromSheetSync(sheet) {
+    // Strings are used as-is; anything else is converted to XML text first
+    const xml = typeof sheet === "string"
+        ? sheet
+        : (0, extract_xml_from_sheet_sync_js_1.extractXmlFromSheetSync)(sheet);
+    // Extract the sheetData section containing all rows
+    const sheetDataMatch = xml.match(/<sheetData[^>]*>([\s\S]*?)<\/sheetData>/);
+    if (!sheetDataMatch) {
+        throw new Error("sheetData not found in worksheet XML");
+    }
+    const sheetDataContent = sheetDataMatch[1] || "";
+    // Extract all <row> elements (self-closing or with content) using regex
+    const rowMatches = [...sheetDataContent.matchAll(/<row\b[^>]*\/>|<row\b[^>]*>[\s\S]*?<\/row>/g)];
+    const rows = rowMatches.map(match => match[0]);
+    // Calculate the highest row number present in the sheet
+    const lastRowNumber = rowMatches
+        .map(match => {
+        // Take the first r="<digits>" occurrence in the row's XML; null when there is none
+        const rowNumMatch = match[0].match(/r="(\d+)"/);
+        return rowNumMatch?.[1] ? parseInt(rowNumMatch[1], 10) : null;
+    })
+        .filter((row) => row !== null) // Drop rows for which no number was found
+        .reduce((max, current) => Math.max(max, current), 0); // Find maximum row number (0 if the list is empty)
+    // Extract all merged cell ranges from the worksheet
+    const mergeCells = [];
+    const mergeCellsMatch = xml.match(/<mergeCells[^>]*>([\s\S]*?)<\/mergeCells>/);
+    if (mergeCellsMatch) {
+        // Find all mergeCell entries with ref attributes
+        const mergeCellMatches = mergeCellsMatch[1]?.match(/<mergeCell[^>]+ref="([^"]+)"[^>]*>/g) || [];
+        mergeCellMatches.forEach(match => {
+            const refMatch = match.match(/ref="([^"]+)"/);
+            if (refMatch?.[1]) {
+                mergeCells.push({ ref: refMatch[1] }); // Store the cell range (e.g., "A1:B2")
+            }
+        });
+    }
+    return {
+        lastRowNumber,
+        mergeCells,
+        rows,
+        xml,
+    };
+}

package/build/cjs/lib/xml/extract-rows-from-sheet.js CHANGED Viewed

@@ -22,9 +22,11 @@ const extract_xml_from_sheet_js_1 = require("./extract-xml-from-sheet.js");
  *   - mergeCells: Array of merged cell ranges (e.g., [{ref: "A1:B2"}])
  * @throws {Error} If the sheetData section is not found in the XML
  */
-function extractRowsFromSheet(sheet) {
+async function extractRowsFromSheet(sheet) {
     // Convert Buffer input to XML string if needed
-    const xml = typeof sheet === "string" ? sheet : (0, extract_xml_from_sheet_js_1.extractXmlFromSheet)(sheet);
+    const xml = typeof sheet === "string"
+        ? sheet
+        : await (0, extract_xml_from_sheet_js_1.extractXmlFromSheet)(sheet);
     // Extract the sheetData section containing all rows
     const sheetDataMatch = xml.match(/<sheetData[^>]*>([\s\S]*?)<\/sheetData>/);
     if (!sheetDataMatch) {

package/build/cjs/lib/xml/extract-xml-from-sheet-sync.js ADDED Viewed

@@ -0,0 +1,43 @@
+"use strict";
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.extractXmlFromSheetSync = extractXmlFromSheetSync;
+const node_zlib_1 = require("node:zlib");
+/**
+ * Extracts XML text from an Excel worksheet file (e.g., xl/worksheets/sheet1.xml).
+ * Handles both compressed (raw deflate) and uncompressed (plain XML) formats.
+ *
+ * This function is designed to work with Excel Open XML (.xlsx) worksheet files,
+ * which may be stored in either compressed or uncompressed format within the ZIP container.
+ *
+ * @param {Buffer} buffer - The file content to process, which may be:
+ *                         - Raw XML text (only recognized when it begins with an <?xml declaration)
+ *                         - Deflate-compressed XML data (without zlib headers)
+ * @returns {string} - The extracted XML content as a UTF-8 string, with control characters removed
+ * @throws {Error} - If the buffer is empty or raw-deflate decompression fails
+ */
+function extractXmlFromSheetSync(buffer) {
+    if (!buffer || buffer.length === 0) {
+        throw new Error("Empty buffer provided");
+    }
+    let xml;
+    // Plain-XML detection: the first 1024 bytes (control chars stripped, trimmed) must start with <?xml and contain an opening tag
+    const head = buffer.subarray(0, 1024).toString("utf8").replace(/[\x00-\x08\x0B\x0C\x0E-\x1F]/g, "").trim();
+    const isXml = /^<\?xml[\s\S]+<\w+[\s>]/.test(head);
+    if (isXml) {
+        // Case 1: Already uncompressed XML - convert directly to string
+        xml = buffer.toString("utf8");
+    }
+    else {
+        // Case 2: Anything else (including XML without a declaration) is treated as raw deflate data
+        try {
+            xml = (0, node_zlib_1.inflateRawSync)(buffer).toString("utf8");
+        }
+        catch (err) {
+            throw new Error("Failed to decompress sheet XML: " + (err instanceof Error ? err.message : String(err)));
+        }
+    }
+    // Sanitize XML by removing control characters (except tab, newline, carriage return)
+    // This handles potential corruption from binary data or encoding issues
+    xml = xml.replace(/[\x00-\x08\x0B\x0C\x0E-\x1F]/g, "");
+    return xml;
+}

package/build/cjs/lib/xml/extract-xml-from-sheet.js CHANGED Viewed

@@ -1,7 +1,12 @@
 "use strict";
+var __importDefault = (this && this.__importDefault) || function (mod) {
+    return (mod && mod.__esModule) ? mod : { "default": mod };
+};
 Object.defineProperty(exports, "__esModule", { value: true });
 exports.extractXmlFromSheet = extractXmlFromSheet;
-const pako_1 = require("pako");
+const node_util_1 = __importDefault(require("node:util"));
+const node_zlib_1 = __importDefault(require("node:zlib"));
+const inflateRaw = node_util_1.default.promisify(node_zlib_1.default.inflateRaw);
 /**
  * Extracts and parses XML content from an Excel worksheet file (e.g., xl/worksheets/sheet1.xml).
  * Handles both compressed (raw deflate) and uncompressed (plain XML) formats.
@@ -12,35 +17,30 @@ const pako_1 = require("pako");
  * @param {Buffer} buffer - The file content to process, which may be:
  *                         - Raw XML text
  *                         - Deflate-compressed XML data (without zlib headers)
- * @returns {string} - The extracted XML content as a UTF-8 string
+ * @returns {Promise<string>} - The extracted XML content as a UTF-8 string
  * @throws {Error} - If the buffer is empty or cannot be processed
  */
-function extractXmlFromSheet(buffer) {
+async function extractXmlFromSheet(buffer) {
     if (!buffer || buffer.length === 0) {
         throw new Error("Empty buffer provided");
     }
     let xml;
     // Check if the buffer starts with an XML declaration (<?xml)
-    const startsWithXml = buffer.subarray(0, 5).toString("utf8").trim().startsWith("<?xml");
-    if (startsWithXml) {
+    const head = buffer.subarray(0, 1024).toString("utf8").replace(/[\x00-\x08\x0B\x0C\x0E-\x1F]/g, "").trim();
+    const isXml = /^<\?xml[\s\S]+<\w+[\s>]/.test(head);
+    if (isXml) {
         // Case 1: Already uncompressed XML - convert directly to string
         xml = buffer.toString("utf8");
     }
     else {
         // Case 2: Attempt to decompress as raw deflate data
-        const inflated = (0, pako_1.inflateRaw)(buffer, { to: "string" });
-        // Validate the decompressed content contains worksheet data
-        if (inflated && inflated.includes("<sheetData")) {
-            xml = inflated;
+        try {
+            xml = (await inflateRaw(buffer)).toString("utf8");
         }
-        else {
-            throw new Error("Decompressed data does not contain sheetData");
+        catch (err) {
+            throw new Error("Failed to decompress sheet XML: " + (err instanceof Error ? err.message : String(err)));
         }
     }
-    // Fallback: If no XML obtained yet, try direct UTF-8 conversion
-    if (!xml) {
-        xml = buffer.toString("utf8");
-    }
     // Sanitize XML by removing control characters (except tab, newline, carriage return)
     // This handles potential corruption from binary data or encoding issues
     xml = xml.replace(/[\x00-\x08\x0B\x0C\x0E-\x1F]/g, "");

package/build/cjs/lib/xml/index.js CHANGED Viewed

@@ -15,7 +15,8 @@ var __exportStar = (this && this.__exportStar) || function(m, exports) {
 };
 Object.defineProperty(exports, "__esModule", { value: true });
 __exportStar(require("./build-merged-sheet.js"), exports);
+__exportStar(require("./extract-rows-from-sheet-sync.js"), exports);
 __exportStar(require("./extract-rows-from-sheet.js"), exports);
+__exportStar(require("./extract-xml-from-sheet-sync.js"), exports);
 __exportStar(require("./extract-xml-from-sheet.js"), exports);
-__exportStar(require("./extract-xml-from-system-content.js"), exports);
 __exportStar(require("./shift-row-indices.js"), exports);

package/build/esm/lib/merge-sheets-to-base-file-process-sync.js ADDED Viewed

@@ -0,0 +1,69 @@
+import * as Utils from "./utils/index.js";
+import * as Xml from "./xml/index.js";
+/**
+ * Merges rows from other Excel files into a base Excel file.
+ *
+ * This is the synchronous variant of mergeSheetsToBaseFileProcess (it uses Xml.extractRowsFromSheetSync).
+ * It takes a single object with the following properties:
+ * - additions: An array of objects with two properties:
+ *   - files: A dictionary of file paths to their corresponding sheet content (handed to Xml.extractRowsFromSheetSync)
+ *   - sheetIndexes: The 1-based indexes of the sheets to extract rows from
+ * - baseFiles: A dictionary of file paths to their corresponding content; it is modified in place
+ * - baseSheetIndex: The 1-based index of the sheet in the base file to add rows to
+ * - gap: The number of empty rows to insert between each added section
+ * - sheetNamesToRemove: The names of sheets to remove from the output file
+ * - sheetsToRemove: The 1-based indices of sheets to remove from the output file
+ *
+ * The function returns nothing (baseFiles is updated in place) and throws an Error if the base sheet or an addition sheet is missing.
+ */
+export function mergeSheetsToBaseFileProcessSync(data) {
+    const { additions, baseFiles, baseSheetIndex, gap, sheetNamesToRemove, sheetsToRemove, } = data;
+    const basePath = `xl/worksheets/sheet${baseSheetIndex}.xml`;
+    if (!baseFiles[basePath]) {
+        throw new Error(`Base file does not contain ${basePath}`);
+    }
+    const { lastRowNumber, mergeCells: baseMergeCells, rows: baseRows, xml, } = Xml.extractRowsFromSheetSync(baseFiles[basePath]);
+    const allRows = [...baseRows];
+    const allMergeCells = [...baseMergeCells];
+    let currentRowOffset = lastRowNumber + gap; // offset handed to Xml.shiftRowIndices / Utils.shiftCellRef for the next appended sheet
+    for (const { files, sheetIndexes } of additions) {
+        for (const sheetIndex of sheetIndexes) {
+            const sheetPath = `xl/worksheets/sheet${sheetIndex}.xml`;
+            if (!files[sheetPath]) {
+                throw new Error(`File does not contain ${sheetPath}`);
+            }
+            const { mergeCells, rows } = Xml.extractRowsFromSheetSync(files[sheetPath]);
+            const shiftedRows = Xml.shiftRowIndices(rows, currentRowOffset);
+            const shiftedMergeCells = mergeCells.map(cell => {
+                const [start, end] = cell.ref.split(":");
+                if (!start || !end) { // ref is not a "start:end" pair, so the cell is kept unshifted
+                    return cell;
+                }
+                const shiftedStart = Utils.shiftCellRef(start, currentRowOffset);
+                const shiftedEnd = Utils.shiftCellRef(end, currentRowOffset);
+                return { ...cell, ref: `${shiftedStart}:${shiftedEnd}` };
+            });
+            allRows.push(...shiftedRows);
+            allMergeCells.push(...shiftedMergeCells);
+            currentRowOffset += Utils.getMaxRowNumber(rows) + gap; // advance the offset for the next sheet; computed from the unshifted rows
+        }
+    }
+    const mergedXml = Xml.buildMergedSheet(xml, allRows, allMergeCells);
+    baseFiles[basePath] = mergedXml; // overwrite the base sheet entry in place
+    for (const sheetIndex of sheetsToRemove) {
+        const sheetPath = `xl/worksheets/sheet${sheetIndex}.xml`;
+        delete baseFiles[sheetPath];
+        if (baseFiles["xl/workbook.xml"]) {
+            baseFiles["xl/workbook.xml"] = Buffer.from(Utils.removeSheetFromWorkbook(baseFiles["xl/workbook.xml"].toString(), sheetIndex));
+        }
+        if (baseFiles["xl/_rels/workbook.xml.rels"]) {
+            baseFiles["xl/_rels/workbook.xml.rels"] = Buffer.from(Utils.removeSheetFromRels(baseFiles["xl/_rels/workbook.xml.rels"].toString(), sheetIndex));
+        }
+        if (baseFiles["[Content_Types].xml"]) {
+            baseFiles["[Content_Types].xml"] = Buffer.from(Utils.removeSheetFromContentTypes(baseFiles["[Content_Types].xml"].toString(), sheetIndex));
+        }
+    }
+    for (const sheetName of sheetNamesToRemove) {
+        Utils.removeSheetByName(baseFiles, sheetName);
+    }
+}