npm - stegdoc - Versions diffs - 5.3.0 → 5.5.0 - Mend

stegdoc 5.3.0 → 5.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (5) hide show

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "stegdoc",
-  "version": "5.3.0",
+  "version": "5.5.0",
   "description": "Hide files inside Office documents (XLSX/DOCX) with AES-256 encryption and steganography",
   "main": "src/index.js",
   "bin": {

package/src/commands/decode.js CHANGED Viewed

@@ -198,7 +198,8 @@ async function decodeV5(inputFile, format, firstReadResult, options, spinner, qu
     spinner.succeed && spinner.succeed(`Found all ${totalPartsFound} parts`);
     for (let i = 0; i < allParts.length; i++) {
-      const partSpinner = quiet ? spinner : ora(`Decoding part ${i + 1} of ${totalPartsFound}...`).start();
+      const pct = Math.round(((i + 1) / totalPartsFound) * 100);
+      const partSpinner = quiet ? spinner : ora(`Decoding part ${i + 1}/${totalPartsFound} (${pct}%)...`).start();
       const partResult = await readFile(allParts[i].path, format);
@@ -228,7 +229,7 @@ async function decodeV5(inputFile, format, firstReadResult, options, spinner, qu
         writeTarget.write(partPayload);
       }
-      partSpinner.succeed && partSpinner.succeed(`Part ${i + 1} decoded`);
+      partSpinner.succeed && partSpinner.succeed(`Part ${i + 1}/${totalPartsFound} decoded`);
     }
   } else {
     // Single file

package/src/commands/encode.js CHANGED Viewed

@@ -30,12 +30,14 @@ function zipFolder(folderPath) {
  */
 async function detectFileType(filePath) {
   try {
-    const { fileTypeFromBuffer } = await import('file-type');
+    const fileType = await import('file-type');
+    const fromBuffer = fileType.fileTypeFromBuffer || fileType.default?.fromBuffer;
+    if (!fromBuffer) return null;
     const fd = await fs.promises.open(filePath, 'r');
     const buf = Buffer.alloc(4100);
     await fd.read(buf, 0, 4100, 0);
     await fd.close();
-    return await fileTypeFromBuffer(buf);
+    return await fromBuffer(buf);
   } catch {
     return null;
   }

package/src/index.js CHANGED Viewed

@@ -11,7 +11,7 @@ const verifyCommand = require('./commands/verify');
 program
   .name('stegdoc')
   .description('CLI tool to encode files into Office documents with AES-256 encryption')
-  .version('5.3.0');
+  .version('5.5.0');
 // Encode command
 program

package/src/lib/xlsx-handler.js CHANGED Viewed

@@ -117,6 +117,7 @@ async function createXlsxPartV5(options) {
 /**
  * Read a v5 log-embed XLSX file and extract payload.
+ * Uses fast regex-based XML scanning instead of full DOM parsing for speed.
  * @param {string} xlsxPath - Path to XLSX file
  * @returns {object} { payloadBuffer, metadataJson, encryptionMeta, metadata }
  */
@@ -125,62 +126,67 @@ async function readXlsxV5(xlsxPath) {
     throw new Error(`XLSX file not found: ${xlsxPath}`);
   }
-  // Parse shared strings
-  let sharedStrings = [];
-  const ssParsed = parseXmlFromZip(xlsxPath, 'xl/sharedStrings.xml');
-  if (ssParsed && ssParsed.sst && ssParsed.sst.si) {
-    const siArray = ensureArray(ssParsed.sst.si);
-    sharedStrings = siArray.map((si) => extractTextContent(si.t));
+  // Read file once and reuse the zip instance
+  const fileBuffer = fs.readFileSync(xlsxPath);
+  const zip = new AdmZip(fileBuffer);
+  // Parse shared strings (only if present — v5 files created with useSharedStrings:false may not have them)
+  let sharedStrings = null;
+  const ssEntry = zip.getEntry('xl/sharedStrings.xml');
+  if (ssEntry) {
+    sharedStrings = [];
+    const ssXml = ssEntry.getData().toString('utf8');
+    // Fast extract: match each <si><t>...</t></si> or <si><t ...>...</t></si>
+    const siRegex = /<si><t[^>]*>([^<]*)<\/t><\/si>/g;
+    let match;
+    while ((match = siRegex.exec(ssXml)) !== null) {
+      sharedStrings.push(match[1]);
+    }
   }
-  // Parse sheet1 (the only sheet in v5)
-  const sheetParsed = parseXmlFromZip(xlsxPath, 'xl/worksheets/sheet1.xml');
-  if (!sheetParsed) {
+  // Extract sheet1.xml raw string
+  const sheetEntry = zip.getEntry('xl/worksheets/sheet1.xml');
+  if (!sheetEntry) {
     throw new Error('Sheet not found in XLSX file.');
   }
+  const sheetXml = sheetEntry.getData().toString('utf8');
-  // Extract all rows as arrays of cell values
+  // Fast row extraction using regex — much faster than full DOM parsing
   const allRows = [];
-  const sheetData = sheetParsed.worksheet?.sheetData;
-  if (sheetData && sheetData.row) {
-    const rows = ensureArray(sheetData.row);
-    for (const row of rows) {
-      if (!row.c) continue;
-      const cells = ensureArray(row.c);
-      // Build a sparse array for this row
-      const rowValues = [];
-      for (const cell of cells) {
-        const cellRef = cell['@_r'];
-        if (!cellRef) continue;
-        // Parse column index from cell reference (e.g., "A2" -> col 0, "J2" -> col 9)
-        const colMatch = cellRef.match(/^([A-Z]+)/);
-        if (!colMatch) continue;
-        const colIdx = colLetterToIndex(colMatch[1]);
-        const cellType = cell['@_t'];
-        const cellValue = cell.v;
-        let value;
-        if (cellType === 's' && cellValue !== undefined) {
-          const ssIndex = parseInt(cellValue, 10);
-          value = ssIndex < sharedStrings.length ? sharedStrings[ssIndex] : '';
-        } else if (cellType === 'inlineStr' && cell.is) {
-          value = extractTextContent(cell.is.t);
-        } else if (cellValue !== undefined) {
-          value = String(cellValue);
-        } else {
-          value = '';
-        }
-        rowValues[colIdx] = value;
+  const rowRegex = /<row [^>]*>(.*?)<\/row>/gs;
+  const cellRegex = /<c r="([A-Z]+)\d+"(?: t="([^"]*)")?[^>]*>(?:<v>([^<]*)<\/v>|<is><t[^>]*>([^<]*)<\/t><\/is>)?<\/c>/g;
+  let rowMatch;
+  while ((rowMatch = rowRegex.exec(sheetXml)) !== null) {
+    const rowXml = rowMatch[1];
+    const rowValues = [];
+    let cellMatch;
+    cellRegex.lastIndex = 0;
+    while ((cellMatch = cellRegex.exec(rowXml)) !== null) {
+      const colLetter = cellMatch[1];
+      const cellType = cellMatch[2] || '';
+      const vValue = cellMatch[3];
+      const inlineValue = cellMatch[4];
+      const colIdx = colLetterToIndex(colLetter);
+      let value;
+      if (cellType === 's' && vValue !== undefined && sharedStrings) {
+        const ssIndex = parseInt(vValue, 10);
+        value = ssIndex < sharedStrings.length ? sharedStrings[ssIndex] : '';
+      } else if (inlineValue !== undefined) {
+        value = decodeXmlEntities(inlineValue);
+      } else if (vValue !== undefined) {
+        value = decodeXmlEntities(vValue);
+      } else {
+        value = '';
       }
-      allRows.push(rowValues);
+      rowValues[colIdx] = value;
     }
+    allRows.push(rowValues);
   }
   // Skip the first row (column headers)
@@ -194,6 +200,19 @@ async function readXlsxV5(xlsxPath) {
   return decodeLogLines(dataRows);
 }
/**
 * Decode the five predefined XML entities (&amp; &lt; &gt; &apos; &quot;) in a string.
 *
 * All entities are decoded in a single left-to-right pass, so text produced by one
 * replacement is never scanned again. This matters for escaped ampersands:
 * "&amp;lt;" is the literal text "&lt;" and must not be decoded a second time to "<".
 *
 * @param {string} str - Raw text taken from XML content
 * @returns {string} The text with predefined entities replaced. Falsy input, or input
 *   that contains no '&', is returned unchanged.
 */
function decodeXmlEntities(str) {
  if (!str || !str.includes('&')) return str;
  const entities = { amp: '&', lt: '<', gt: '>', apos: "'", quot: '"' };
  // The alternation only matches names present in the table, so the lookup never misses;
  // unknown references such as "&foo;" are left untouched.
  return str.replace(/&(amp|lt|gt|apos|quot);/g, (_, name) => entities[name]);
}
 /**
  * Convert column letter to 0-based index (A=0, B=1, ..., Z=25, AA=26)
  */