npm - @monostate/node-scraper - Versions diffs - 2.2.0 → 2.2.1 - Mend

@monostate/node-scraper 2.2.0 → 2.2.1

This diff shows the changes between two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package versions exactly as they appear in their respective public registries.

Files changed (2) hide show

package/index.js +6 -2
package/package.json +1 -1

package/index.js CHANGED Viewed

@@ -4,7 +4,7 @@ import { existsSync, statSync } from 'fs';
 import path from 'path';
 import { fileURLToPath } from 'url';
 import { promises as fsPromises } from 'fs';
-import { PDFParse } from 'pdf-parse';
+let PDFParse = null;
 import browserPool from './browser-pool.js';
 let puppeteer = null;
@@ -860,7 +860,11 @@ ${parsedContent.headings?.length ? `\nHeadings:\n${parsedContent.headings.map(h
         };
       }
-      // Parse PDF with pdf-parse v2 API
+      // Lazy-load pdf-parse (pdfjs-dist requires DOMMatrix, only available in Node 22+)
+      if (!PDFParse) {
+        const mod = await import('pdf-parse');
+        PDFParse = mod.PDFParse;
+      }
       const parser = new PDFParse({ data: new Uint8Array(buffer) });
       await parser.load();
       const textResult = await parser.getText();

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@monostate/node-scraper",
-  "version": "2.2.0",
+  "version": "2.2.1",
   "description": "Intelligent web scraping with AI Q&A, PDF support and multi-level fallback system - 11x faster than traditional scrapers",
   "type": "module",
   "main": "index.js",