@llamaindex/liteparse 1.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +201 -0
- package/README.md +339 -0
- package/dist/cli/parse.d.ts +4 -0
- package/dist/cli/parse.d.ts.map +1 -0
- package/dist/cli/parse.js +401 -0
- package/dist/cli/parse.js.map +1 -0
- package/dist/src/conversion/convertToPdf.d.ts +47 -0
- package/dist/src/conversion/convertToPdf.d.ts.map +1 -0
- package/dist/src/conversion/convertToPdf.js +337 -0
- package/dist/src/conversion/convertToPdf.js.map +1 -0
- package/dist/src/conversion/convertToPdf.test.d.ts +2 -0
- package/dist/src/conversion/convertToPdf.test.d.ts.map +1 -0
- package/dist/src/conversion/convertToPdf.test.js +208 -0
- package/dist/src/conversion/convertToPdf.test.js.map +1 -0
- package/dist/src/core/config.d.ts +4 -0
- package/dist/src/core/config.d.ts.map +1 -0
- package/dist/src/core/config.js +25 -0
- package/dist/src/core/config.js.map +1 -0
- package/dist/src/core/config.test.d.ts +2 -0
- package/dist/src/core/config.test.d.ts.map +1 -0
- package/dist/src/core/config.test.js +21 -0
- package/dist/src/core/config.test.js.map +1 -0
- package/dist/src/core/parser.d.ts +83 -0
- package/dist/src/core/parser.d.ts.map +1 -0
- package/dist/src/core/parser.js +333 -0
- package/dist/src/core/parser.js.map +1 -0
- package/dist/src/core/parser.test.d.ts +2 -0
- package/dist/src/core/parser.test.d.ts.map +1 -0
- package/dist/src/core/parser.test.js +537 -0
- package/dist/src/core/parser.test.js.map +1 -0
- package/dist/src/core/types.d.ts +287 -0
- package/dist/src/core/types.d.ts.map +1 -0
- package/dist/src/core/types.js +2 -0
- package/dist/src/core/types.js.map +1 -0
- package/dist/src/engines/ocr/http-simple.d.ts +19 -0
- package/dist/src/engines/ocr/http-simple.d.ts.map +1 -0
- package/dist/src/engines/ocr/http-simple.js +63 -0
- package/dist/src/engines/ocr/http-simple.js.map +1 -0
- package/dist/src/engines/ocr/http-simple.test.d.ts +2 -0
- package/dist/src/engines/ocr/http-simple.test.d.ts.map +1 -0
- package/dist/src/engines/ocr/http-simple.test.js +108 -0
- package/dist/src/engines/ocr/http-simple.test.js.map +1 -0
- package/dist/src/engines/ocr/interface.d.ts +15 -0
- package/dist/src/engines/ocr/interface.d.ts.map +1 -0
- package/dist/src/engines/ocr/interface.js +2 -0
- package/dist/src/engines/ocr/interface.js.map +1 -0
- package/dist/src/engines/ocr/tesseract.d.ts +19 -0
- package/dist/src/engines/ocr/tesseract.d.ts.map +1 -0
- package/dist/src/engines/ocr/tesseract.js +112 -0
- package/dist/src/engines/ocr/tesseract.js.map +1 -0
- package/dist/src/engines/ocr/tesseract.test.d.ts +2 -0
- package/dist/src/engines/ocr/tesseract.test.d.ts.map +1 -0
- package/dist/src/engines/ocr/tesseract.test.js +84 -0
- package/dist/src/engines/ocr/tesseract.test.js.map +1 -0
- package/dist/src/engines/pdf/interface.d.ts +79 -0
- package/dist/src/engines/pdf/interface.d.ts.map +1 -0
- package/dist/src/engines/pdf/interface.js +2 -0
- package/dist/src/engines/pdf/interface.js.map +1 -0
- package/dist/src/engines/pdf/pdfium-renderer.d.ts +11 -0
- package/dist/src/engines/pdf/pdfium-renderer.d.ts.map +1 -0
- package/dist/src/engines/pdf/pdfium-renderer.js +64 -0
- package/dist/src/engines/pdf/pdfium-renderer.js.map +1 -0
- package/dist/src/engines/pdf/pdfium-renderer.test.d.ts +2 -0
- package/dist/src/engines/pdf/pdfium-renderer.test.d.ts.map +1 -0
- package/dist/src/engines/pdf/pdfium-renderer.test.js +76 -0
- package/dist/src/engines/pdf/pdfium-renderer.test.js.map +1 -0
- package/dist/src/engines/pdf/pdfjs.d.ts +13 -0
- package/dist/src/engines/pdf/pdfjs.d.ts.map +1 -0
- package/dist/src/engines/pdf/pdfjs.js +538 -0
- package/dist/src/engines/pdf/pdfjs.js.map +1 -0
- package/dist/src/engines/pdf/pdfjs.test.d.ts +2 -0
- package/dist/src/engines/pdf/pdfjs.test.d.ts.map +1 -0
- package/dist/src/engines/pdf/pdfjs.test.js +220 -0
- package/dist/src/engines/pdf/pdfjs.test.js.map +1 -0
- package/dist/src/engines/pdf/pdfjsImporter.d.ts +5 -0
- package/dist/src/engines/pdf/pdfjsImporter.d.ts.map +1 -0
- package/dist/src/engines/pdf/pdfjsImporter.js +9 -0
- package/dist/src/engines/pdf/pdfjsImporter.js.map +1 -0
- package/dist/src/index.d.ts +3 -0
- package/dist/src/index.d.ts.map +1 -0
- package/dist/src/index.js +5 -0
- package/dist/src/index.js.map +1 -0
- package/dist/src/lib.d.ts +17 -0
- package/dist/src/lib.d.ts.map +1 -0
- package/dist/src/lib.js +16 -0
- package/dist/src/lib.js.map +1 -0
- package/dist/src/output/json.d.ts +10 -0
- package/dist/src/output/json.d.ts.map +1 -0
- package/dist/src/output/json.js +31 -0
- package/dist/src/output/json.js.map +1 -0
- package/dist/src/output/json.test.d.ts +2 -0
- package/dist/src/output/json.test.d.ts.map +1 -0
- package/dist/src/output/json.test.js +136 -0
- package/dist/src/output/json.test.js.map +1 -0
- package/dist/src/output/text.d.ts +10 -0
- package/dist/src/output/text.d.ts.map +1 -0
- package/dist/src/output/text.js +17 -0
- package/dist/src/output/text.js.map +1 -0
- package/dist/src/output/text.test.d.ts +2 -0
- package/dist/src/output/text.test.d.ts.map +1 -0
- package/dist/src/output/text.test.js +65 -0
- package/dist/src/output/text.test.js.map +1 -0
- package/dist/src/processing/bbox.d.ts +20 -0
- package/dist/src/processing/bbox.d.ts.map +1 -0
- package/dist/src/processing/bbox.js +258 -0
- package/dist/src/processing/bbox.js.map +1 -0
- package/dist/src/processing/bbox.test.d.ts +2 -0
- package/dist/src/processing/bbox.test.d.ts.map +1 -0
- package/dist/src/processing/bbox.test.js +334 -0
- package/dist/src/processing/bbox.test.js.map +1 -0
- package/dist/src/processing/cleanText.d.ts +6 -0
- package/dist/src/processing/cleanText.d.ts.map +1 -0
- package/dist/src/processing/cleanText.js +73 -0
- package/dist/src/processing/cleanText.js.map +1 -0
- package/dist/src/processing/cleanText.test.d.ts +2 -0
- package/dist/src/processing/cleanText.test.d.ts.map +1 -0
- package/dist/src/processing/cleanText.test.js +46 -0
- package/dist/src/processing/cleanText.test.js.map +1 -0
- package/dist/src/processing/grid.d.ts +7 -0
- package/dist/src/processing/grid.d.ts.map +1 -0
- package/dist/src/processing/grid.js +13 -0
- package/dist/src/processing/grid.js.map +1 -0
- package/dist/src/processing/gridProjection.d.ts +18 -0
- package/dist/src/processing/gridProjection.d.ts.map +1 -0
- package/dist/src/processing/gridProjection.js +1392 -0
- package/dist/src/processing/gridProjection.js.map +1 -0
- package/dist/src/processing/gridProjection.test.d.ts +2 -0
- package/dist/src/processing/gridProjection.test.d.ts.map +1 -0
- package/dist/src/processing/gridProjection.test.js +464 -0
- package/dist/src/processing/gridProjection.test.js.map +1 -0
- package/dist/src/processing/markupUtils.d.ts +7 -0
- package/dist/src/processing/markupUtils.d.ts.map +1 -0
- package/dist/src/processing/markupUtils.js +25 -0
- package/dist/src/processing/markupUtils.js.map +1 -0
- package/dist/src/processing/markupUtils.test.d.ts +2 -0
- package/dist/src/processing/markupUtils.test.d.ts.map +1 -0
- package/dist/src/processing/markupUtils.test.js +26 -0
- package/dist/src/processing/markupUtils.test.js.map +1 -0
- package/dist/src/processing/ocrUtils.d.ts +24 -0
- package/dist/src/processing/ocrUtils.d.ts.map +1 -0
- package/dist/src/processing/ocrUtils.js +79 -0
- package/dist/src/processing/ocrUtils.js.map +1 -0
- package/dist/src/processing/octUtils.test.d.ts +2 -0
- package/dist/src/processing/octUtils.test.d.ts.map +1 -0
- package/dist/src/processing/octUtils.test.js +72 -0
- package/dist/src/processing/octUtils.test.js.map +1 -0
- package/dist/src/processing/textUtils.d.ts +20 -0
- package/dist/src/processing/textUtils.d.ts.map +1 -0
- package/dist/src/processing/textUtils.js +142 -0
- package/dist/src/processing/textUtils.js.map +1 -0
- package/dist/src/processing/textUtils.test.d.ts +2 -0
- package/dist/src/processing/textUtils.test.d.ts.map +1 -0
- package/dist/src/processing/textUtils.test.js +45 -0
- package/dist/src/processing/textUtils.test.js.map +1 -0
- package/dist/src/vendor/pdfjs/LICENSE +177 -0
- package/dist/src/vendor/pdfjs/README.md +0 -0
- package/dist/src/vendor/pdfjs/cmaps/78-EUC-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/78-EUC-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/78-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/78-RKSJ-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/78-RKSJ-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/78-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/78ms-RKSJ-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/78ms-RKSJ-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/83pv-RKSJ-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/90ms-RKSJ-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/90ms-RKSJ-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/90msp-RKSJ-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/90msp-RKSJ-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/90pv-RKSJ-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/90pv-RKSJ-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Add-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Add-RKSJ-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Add-RKSJ-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Add-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-CNS1-0.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-CNS1-1.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-CNS1-2.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-CNS1-3.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-CNS1-4.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-CNS1-5.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-CNS1-6.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-CNS1-UCS2.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-GB1-0.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-GB1-1.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-GB1-2.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-GB1-3.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-GB1-4.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-GB1-5.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-GB1-UCS2.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-Japan1-0.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-Japan1-1.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-Japan1-2.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-Japan1-3.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-Japan1-4.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-Japan1-5.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-Japan1-6.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-Japan1-UCS2.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-Korea1-0.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-Korea1-1.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-Korea1-2.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Adobe-Korea1-UCS2.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/B5-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/B5-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/B5pc-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/B5pc-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/CNS-EUC-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/CNS-EUC-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/CNS1-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/CNS1-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/CNS2-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/CNS2-V.bcmap +3 -0
- package/dist/src/vendor/pdfjs/cmaps/ETHK-B5-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/ETHK-B5-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/ETen-B5-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/ETen-B5-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/ETenms-B5-H.bcmap +3 -0
- package/dist/src/vendor/pdfjs/cmaps/ETenms-B5-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/EUC-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/EUC-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Ext-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Ext-RKSJ-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Ext-RKSJ-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Ext-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/GB-EUC-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/GB-EUC-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/GB-H.bcmap +4 -0
- package/dist/src/vendor/pdfjs/cmaps/GB-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/GBK-EUC-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/GBK-EUC-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/GBK2K-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/GBK2K-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/GBKp-EUC-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/GBKp-EUC-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/GBT-EUC-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/GBT-EUC-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/GBT-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/GBT-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/GBTpc-EUC-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/GBTpc-EUC-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/GBpc-EUC-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/GBpc-EUC-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/HKdla-B5-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/HKdla-B5-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/HKdlb-B5-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/HKdlb-B5-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/HKgccs-B5-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/HKgccs-B5-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/HKm314-B5-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/HKm314-B5-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/HKm471-B5-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/HKm471-B5-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/HKscs-B5-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/HKscs-B5-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Hankaku.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Hiragana.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/KSC-EUC-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/KSC-EUC-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/KSC-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/KSC-Johab-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/KSC-Johab-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/KSC-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/KSCms-UHC-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/KSCms-UHC-HW-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/KSCms-UHC-HW-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/KSCms-UHC-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/KSCpc-EUC-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/KSCpc-EUC-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Katakana.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/LICENSE +36 -0
- package/dist/src/vendor/pdfjs/cmaps/NWP-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/NWP-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/RKSJ-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/RKSJ-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/Roman.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniCNS-UCS2-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniCNS-UCS2-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniCNS-UTF16-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniCNS-UTF16-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniCNS-UTF32-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniCNS-UTF32-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniCNS-UTF8-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniCNS-UTF8-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniGB-UCS2-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniGB-UCS2-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniGB-UTF16-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniGB-UTF16-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniGB-UTF32-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniGB-UTF32-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniGB-UTF8-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniGB-UTF8-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJIS-UCS2-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJIS-UCS2-HW-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJIS-UCS2-HW-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJIS-UCS2-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJIS-UTF16-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJIS-UTF16-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJIS-UTF32-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJIS-UTF32-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJIS-UTF8-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJIS-UTF8-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJIS2004-UTF16-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJIS2004-UTF16-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJIS2004-UTF32-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJIS2004-UTF32-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJIS2004-UTF8-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJIS2004-UTF8-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJISPro-UCS2-HW-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJISPro-UCS2-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJISPro-UTF8-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJISX0213-UTF32-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJISX0213-UTF32-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJISX02132004-UTF32-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniJISX02132004-UTF32-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniKS-UCS2-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniKS-UCS2-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniKS-UTF16-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniKS-UTF16-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniKS-UTF32-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniKS-UTF32-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniKS-UTF8-H.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/UniKS-UTF8-V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/V.bcmap +0 -0
- package/dist/src/vendor/pdfjs/cmaps/WP-Symbol.bcmap +0 -0
- package/dist/src/vendor/pdfjs/pdf.mjs +19481 -0
- package/dist/src/vendor/pdfjs/pdf.mjs.map +1 -0
- package/dist/src/vendor/pdfjs/pdf.sandbox.mjs +210 -0
- package/dist/src/vendor/pdfjs/pdf.sandbox.mjs.map +1 -0
- package/dist/src/vendor/pdfjs/pdf.worker.mjs +56001 -0
- package/dist/src/vendor/pdfjs/pdf.worker.mjs.map +1 -0
- package/dist/src/vendor/pdfjs/standard_fonts/FoxitDingbats.pfb +0 -0
- package/dist/src/vendor/pdfjs/standard_fonts/FoxitFixed.pfb +0 -0
- package/dist/src/vendor/pdfjs/standard_fonts/FoxitFixedBold.pfb +0 -0
- package/dist/src/vendor/pdfjs/standard_fonts/FoxitFixedBoldItalic.pfb +0 -0
- package/dist/src/vendor/pdfjs/standard_fonts/FoxitFixedItalic.pfb +0 -0
- package/dist/src/vendor/pdfjs/standard_fonts/FoxitSerif.pfb +0 -0
- package/dist/src/vendor/pdfjs/standard_fonts/FoxitSerifBold.pfb +0 -0
- package/dist/src/vendor/pdfjs/standard_fonts/FoxitSerifBoldItalic.pfb +0 -0
- package/dist/src/vendor/pdfjs/standard_fonts/FoxitSerifItalic.pfb +0 -0
- package/dist/src/vendor/pdfjs/standard_fonts/FoxitSymbol.pfb +0 -0
- package/dist/src/vendor/pdfjs/standard_fonts/LICENSE_FOXIT +27 -0
- package/dist/src/vendor/pdfjs/standard_fonts/LICENSE_LIBERATION +102 -0
- package/dist/src/vendor/pdfjs/standard_fonts/LiberationSans-Bold.ttf +0 -0
- package/dist/src/vendor/pdfjs/standard_fonts/LiberationSans-BoldItalic.ttf +0 -0
- package/dist/src/vendor/pdfjs/standard_fonts/LiberationSans-Italic.ttf +0 -0
- package/dist/src/vendor/pdfjs/standard_fonts/LiberationSans-Regular.ttf +0 -0
- package/package.json +89 -0
- package/src/vendor/pdfjs/LICENSE +177 -0
- package/src/vendor/pdfjs/README.md +0 -0
- package/src/vendor/pdfjs/cmaps/78-EUC-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/78-EUC-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/78-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/78-RKSJ-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/78-RKSJ-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/78-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/78ms-RKSJ-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/78ms-RKSJ-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/83pv-RKSJ-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/90ms-RKSJ-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/90ms-RKSJ-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/90msp-RKSJ-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/90msp-RKSJ-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/90pv-RKSJ-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/90pv-RKSJ-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Add-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Add-RKSJ-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Add-RKSJ-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Add-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-CNS1-0.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-CNS1-1.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-CNS1-2.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-CNS1-3.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-CNS1-4.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-CNS1-5.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-CNS1-6.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-CNS1-UCS2.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-GB1-0.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-GB1-1.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-GB1-2.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-GB1-3.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-GB1-4.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-GB1-5.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-GB1-UCS2.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-Japan1-0.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-Japan1-1.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-Japan1-2.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-Japan1-3.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-Japan1-4.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-Japan1-5.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-Japan1-6.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-Japan1-UCS2.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-Korea1-0.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-Korea1-1.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-Korea1-2.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Adobe-Korea1-UCS2.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/B5-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/B5-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/B5pc-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/B5pc-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/CNS-EUC-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/CNS-EUC-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/CNS1-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/CNS1-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/CNS2-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/CNS2-V.bcmap +3 -0
- package/src/vendor/pdfjs/cmaps/ETHK-B5-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/ETHK-B5-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/ETen-B5-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/ETen-B5-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/ETenms-B5-H.bcmap +3 -0
- package/src/vendor/pdfjs/cmaps/ETenms-B5-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/EUC-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/EUC-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Ext-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Ext-RKSJ-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Ext-RKSJ-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Ext-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/GB-EUC-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/GB-EUC-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/GB-H.bcmap +4 -0
- package/src/vendor/pdfjs/cmaps/GB-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/GBK-EUC-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/GBK-EUC-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/GBK2K-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/GBK2K-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/GBKp-EUC-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/GBKp-EUC-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/GBT-EUC-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/GBT-EUC-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/GBT-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/GBT-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/GBTpc-EUC-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/GBTpc-EUC-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/GBpc-EUC-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/GBpc-EUC-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/HKdla-B5-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/HKdla-B5-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/HKdlb-B5-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/HKdlb-B5-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/HKgccs-B5-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/HKgccs-B5-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/HKm314-B5-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/HKm314-B5-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/HKm471-B5-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/HKm471-B5-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/HKscs-B5-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/HKscs-B5-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Hankaku.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Hiragana.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/KSC-EUC-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/KSC-EUC-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/KSC-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/KSC-Johab-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/KSC-Johab-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/KSC-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/KSCms-UHC-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/KSCms-UHC-HW-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/KSCms-UHC-HW-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/KSCms-UHC-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/KSCpc-EUC-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/KSCpc-EUC-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Katakana.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/LICENSE +36 -0
- package/src/vendor/pdfjs/cmaps/NWP-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/NWP-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/RKSJ-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/RKSJ-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/Roman.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniCNS-UCS2-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniCNS-UCS2-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniCNS-UTF16-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniCNS-UTF16-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniCNS-UTF32-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniCNS-UTF32-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniCNS-UTF8-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniCNS-UTF8-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniGB-UCS2-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniGB-UCS2-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniGB-UTF16-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniGB-UTF16-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniGB-UTF32-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniGB-UTF32-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniGB-UTF8-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniGB-UTF8-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJIS-UCS2-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJIS-UCS2-HW-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJIS-UCS2-HW-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJIS-UCS2-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJIS-UTF16-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJIS-UTF16-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJIS-UTF32-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJIS-UTF32-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJIS-UTF8-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJIS-UTF8-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJIS2004-UTF16-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJIS2004-UTF16-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJIS2004-UTF32-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJIS2004-UTF32-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJIS2004-UTF8-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJIS2004-UTF8-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJISPro-UCS2-HW-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJISPro-UCS2-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJISPro-UTF8-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJISX0213-UTF32-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJISX0213-UTF32-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJISX02132004-UTF32-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniJISX02132004-UTF32-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniKS-UCS2-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniKS-UCS2-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniKS-UTF16-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniKS-UTF16-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniKS-UTF32-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniKS-UTF32-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniKS-UTF8-H.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/UniKS-UTF8-V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/V.bcmap +0 -0
- package/src/vendor/pdfjs/cmaps/WP-Symbol.bcmap +0 -0
- package/src/vendor/pdfjs/pdf.mjs +19481 -0
- package/src/vendor/pdfjs/pdf.mjs.map +1 -0
- package/src/vendor/pdfjs/pdf.sandbox.mjs +210 -0
- package/src/vendor/pdfjs/pdf.sandbox.mjs.map +1 -0
- package/src/vendor/pdfjs/pdf.worker.mjs +56001 -0
- package/src/vendor/pdfjs/pdf.worker.mjs.map +1 -0
- package/src/vendor/pdfjs/standard_fonts/FoxitDingbats.pfb +0 -0
- package/src/vendor/pdfjs/standard_fonts/FoxitFixed.pfb +0 -0
- package/src/vendor/pdfjs/standard_fonts/FoxitFixedBold.pfb +0 -0
- package/src/vendor/pdfjs/standard_fonts/FoxitFixedBoldItalic.pfb +0 -0
- package/src/vendor/pdfjs/standard_fonts/FoxitFixedItalic.pfb +0 -0
- package/src/vendor/pdfjs/standard_fonts/FoxitSerif.pfb +0 -0
- package/src/vendor/pdfjs/standard_fonts/FoxitSerifBold.pfb +0 -0
- package/src/vendor/pdfjs/standard_fonts/FoxitSerifBoldItalic.pfb +0 -0
- package/src/vendor/pdfjs/standard_fonts/FoxitSerifItalic.pfb +0 -0
- package/src/vendor/pdfjs/standard_fonts/FoxitSymbol.pfb +0 -0
- package/src/vendor/pdfjs/standard_fonts/LICENSE_FOXIT +27 -0
- package/src/vendor/pdfjs/standard_fonts/LICENSE_LIBERATION +102 -0
- package/src/vendor/pdfjs/standard_fonts/LiberationSans-Bold.ttf +0 -0
- package/src/vendor/pdfjs/standard_fonts/LiberationSans-BoldItalic.ttf +0 -0
- package/src/vendor/pdfjs/standard_fonts/LiberationSans-Italic.ttf +0 -0
- package/src/vendor/pdfjs/standard_fonts/LiberationSans-Regular.ttf +0 -0
|
@@ -0,0 +1,83 @@
|
|
|
1
|
+
import { LiteParseConfig, ParseResult, ScreenshotResult } from "./types.js";
|
|
2
|
+
/**
|
|
3
|
+
* Main document parser class. Handles PDF parsing, OCR, format conversion,
|
|
4
|
+
* and screenshot generation.
|
|
5
|
+
*
|
|
6
|
+
* @example Basic text extraction
|
|
7
|
+
* ```typescript
|
|
8
|
+
* import { LiteParse } from "@llamaindex/liteparse";
|
|
9
|
+
*
|
|
10
|
+
* const parser = new LiteParse();
|
|
11
|
+
* const result = await parser.parse("document.pdf");
|
|
12
|
+
* console.log(result.text);
|
|
13
|
+
* ```
|
|
14
|
+
*
|
|
15
|
+
* @example JSON output with bounding boxes
|
|
16
|
+
* ```typescript
|
|
17
|
+
* const parser = new LiteParse({ outputFormat: "json", dpi: 300 });
|
|
18
|
+
* const result = await parser.parse("document.pdf");
|
|
19
|
+
* for (const page of result.json.pages) {
|
|
20
|
+
* console.log(`Page ${page.page}: ${page.boundingBoxes.length} bounding boxes`);
|
|
21
|
+
* }
|
|
22
|
+
* ```
|
|
23
|
+
*
|
|
24
|
+
* @example Using an HTTP OCR server
|
|
25
|
+
* ```typescript
|
|
26
|
+
* const parser = new LiteParse({
|
|
27
|
+
* ocrServerUrl: "http://localhost:8828/ocr",
|
|
28
|
+
* ocrLanguage: "en",
|
|
29
|
+
* });
|
|
30
|
+
* const result = await parser.parse("scanned-document.pdf");
|
|
31
|
+
* ```
|
|
32
|
+
*/
|
|
33
|
+
export declare class LiteParse {
    /** Active configuration held by the instance. */
    private config;
    /** Engine used for loading PDF documents and extracting their pages. */
    private pdfEngine;
    /** Optional OCR engine; may be absent. */
    private ocrEngine?;
    /**
     * Build a parser.
     *
     * @param userConfig - Optional subset of {@link LiteParseConfig}; anything omitted keeps its default.
     */
    constructor(userConfig?: Partial<LiteParseConfig>);
    /**
     * Extract text, per-page data and (optionally) structured JSON from a document.
     *
     * PDFs are handled natively. Other formats (DOCX, XLSX, images, etc.) are converted
     * to PDF first, provided the required system tools are installed.
     *
     * @param filePath - Location of the document on disk.
     * @param quiet - Pass `true` to silence the progress messages written to stderr.
     * @returns The parsed document: full text, page information and optional JSON.
     *
     * @throws Error when the file is missing or cannot be converted or parsed.
     */
    parse(filePath: string, quiet?: boolean): Promise<ParseResult>;
    /**
     * Render PDF pages to image buffers.
     *
     * Rendering is done with PDFium. Every rendered page yields one
     * {@link ScreenshotResult} carrying the raw image buffer and the page dimensions.
     *
     * @param filePath - Location of the PDF on disk.
     * @param pageNumbers - Pages to render, counted from 1. All pages are rendered when omitted.
     * @param quiet - Pass `true` to silence the progress messages written to stderr.
     * @returns One screenshot result per rendered page.
     */
    screenshot(filePath: string, pageNumbers?: Array<number>, quiet?: boolean): Promise<Array<ScreenshotResult>>;
    /**
     * Run OCR over the pages that need it, in parallel under a concurrency limit.
     */
    private runOCR;
    /**
     * Run OCR for one page.
     */
    private processPageOcr;
    /**
     * Return the configuration currently in effect (defaults merged with user overrides).
     *
     * @returns A shallow copy of the active {@link LiteParseConfig}.
     */
    getConfig(): LiteParseConfig;
}
|
|
83
|
+
//# sourceMappingURL=parser.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"parser.d.ts","sourceRoot":"","sources":["../../../src/core/parser.ts"],"names":[],"mappings":"AACA,OAAO,EAAE,eAAe,EAAE,WAAW,EAAE,gBAAgB,EAAY,MAAM,YAAY,CAAC;AActF;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA8BG;AACH,qBAAa,SAAS;IACpB,OAAO,CAAC,MAAM,CAAkB;IAChC,OAAO,CAAC,SAAS,CAAY;IAC7B,OAAO,CAAC,SAAS,CAAC,CAAY;IAE9B;;;;OAIG;gBACS,UAAU,GAAE,OAAO,CAAC,eAAe,CAAM;IAkBrD;;;;;;;;;;;OAWG;IACG,KAAK,CAAC,QAAQ,EAAE,MAAM,EAAE,KAAK,UAAQ,GAAG,OAAO,CAAC,WAAW,CAAC;IA0FlE;;;;;;;;;;OAUG;IACG,UAAU,CACd,QAAQ,EAAE,MAAM,EAChB,WAAW,CAAC,EAAE,MAAM,EAAE,EACtB,KAAK,UAAQ,GACZ,OAAO,CAAC,gBAAgB,EAAE,CAAC;IA+C9B;;OAEG;YACW,MAAM;IAcpB;;OAEG;YACW,cAAc;IAwI5B;;;;OAIG;IACH,SAAS,IAAI,eAAe;CAG7B"}
|
|
@@ -0,0 +1,333 @@
|
|
|
1
|
+
import pLimit from "p-limit";
|
|
2
|
+
import { mergeConfig } from "./config.js";
|
|
3
|
+
import { PdfJsEngine } from "../engines/pdf/pdfjs.js";
|
|
4
|
+
import { PdfiumRenderer } from "../engines/pdf/pdfium-renderer.js";
|
|
5
|
+
import { TesseractEngine } from "../engines/ocr/tesseract.js";
|
|
6
|
+
import { HttpOcrEngine } from "../engines/ocr/http-simple.js";
|
|
7
|
+
import { projectPagesToGrid } from "../processing/grid.js";
|
|
8
|
+
import { buildBoundingBoxes } from "../processing/bbox.js";
|
|
9
|
+
import { formatJSON } from "../output/json.js";
|
|
10
|
+
import { convertToPdf, cleanupConversionFiles } from "../conversion/convertToPdf.js";
|
|
11
|
+
import { cleanOcrTableArtifacts } from "../processing/textUtils.js";
|
|
12
|
+
/**
|
|
13
|
+
* Main document parser class. Handles PDF parsing, OCR, format conversion,
|
|
14
|
+
* and screenshot generation.
|
|
15
|
+
*
|
|
16
|
+
* @example Basic text extraction
|
|
17
|
+
* ```typescript
|
|
18
|
+
* import { LiteParse } from "@llamaindex/liteparse";
|
|
19
|
+
*
|
|
20
|
+
* const parser = new LiteParse();
|
|
21
|
+
* const result = await parser.parse("document.pdf");
|
|
22
|
+
* console.log(result.text);
|
|
23
|
+
* ```
|
|
24
|
+
*
|
|
25
|
+
* @example JSON output with bounding boxes
|
|
26
|
+
* ```typescript
|
|
27
|
+
* const parser = new LiteParse({ outputFormat: "json", dpi: 300 });
|
|
28
|
+
* const result = await parser.parse("document.pdf");
|
|
29
|
+
* for (const page of result.json.pages) {
|
|
30
|
+
* console.log(`Page ${page.page}: ${page.boundingBoxes.length} bounding boxes`);
|
|
31
|
+
* }
|
|
32
|
+
* ```
|
|
33
|
+
*
|
|
34
|
+
* @example Using an HTTP OCR server
|
|
35
|
+
* ```typescript
|
|
36
|
+
* const parser = new LiteParse({
|
|
37
|
+
* ocrServerUrl: "http://localhost:8828/ocr",
|
|
38
|
+
* ocrLanguage: "en",
|
|
39
|
+
* });
|
|
40
|
+
* const result = await parser.parse("scanned-document.pdf");
|
|
41
|
+
* ```
|
|
42
|
+
*/
|
|
43
|
+
export class LiteParse {
    /** Effective configuration: defaults merged with the caller's overrides. */
    config;
    /** Engine used to load PDFs, extract pages and render page images. */
    pdfEngine;
    /** OCR backend; stays undefined when `config.ocrEnabled` is falsy. */
    ocrEngine;
    /**
     * Create a new LiteParse instance.
     *
     * @param userConfig - Partial configuration to override defaults. See {@link LiteParseConfig} for all options.
     */
    constructor(userConfig = {}) {
        this.config = mergeConfig(userConfig);
        this.pdfEngine = new PdfJsEngine();
        // Auto-detect the OCR backend: an explicit server URL selects the HTTP engine,
        // otherwise Tesseract is used.
        if (this.config.ocrEnabled) {
            this.ocrEngine = this.config.ocrServerUrl
                ? new HttpOcrEngine(this.config.ocrServerUrl)
                : new TesseractEngine(this.config.numWorkers);
        }
    }
    /**
     * Parse a document and return the extracted text, page data, and optionally structured JSON.
     *
     * Supports PDFs natively. Non-PDF formats (DOCX, XLSX, images, etc.) are automatically
     * converted to PDF before parsing if the required system tools are installed.
     *
     * The PDF document, a terminable OCR engine and any temporary converted PDF are
     * released even when loading, extraction, OCR or grid projection fails.
     *
     * @param filePath - Path to the document file.
     * @param quiet - If `true`, suppresses progress logging to stderr.
     * @returns Parsed document data including text, per-page info, and optional JSON.
     *
     * @throws Error if the file cannot be found, converted, or parsed.
     */
    async parse(filePath, quiet = false) {
        const log = (msg) => {
            if (!quiet) {
                console.error(msg); // Progress goes to stderr
            }
        };
        log(`Processing file: ${filePath}`);
        const conversionResult = await convertToPdf(filePath);
        if ("code" in conversionResult) {
            // Conversion error
            throw new Error(`Conversion failed: ${conversionResult.message}`);
        }
        // Text-based passthrough formats need no PDF processing at all.
        if ("content" in conversionResult) {
            log(`File is a text-based format. Returning content directly.`);
            return {
                pages: [],
                text: conversionResult.content,
            };
        }
        const pdfPath = conversionResult.pdfPath;
        // A different path means convertToPdf produced a temporary PDF we must delete.
        const needsCleanup = pdfPath !== filePath;
        if (needsCleanup) {
            log(`Converted ${conversionResult.originalExtension} to PDF`);
        }
        let doc;
        let processedPages;
        try {
            doc = await this.pdfEngine.loadDocument(pdfPath);
            log(`Loaded PDF with ${doc.numPages} pages`);
            const pages = await this.pdfEngine.extractAllPages(doc, this.config.maxPages, this.config.targetPages);
            // OCR must run BEFORE grid projection so OCR text items take part in the layout.
            if (this.ocrEngine) {
                await this.runOCR(doc, pages, log);
            }
            processedPages = projectPagesToGrid(pages, this.config);
            if (this.config.preciseBoundingBox) {
                for (const page of processedPages) {
                    page.boundingBoxes = buildBoundingBoxes(page.textItems);
                }
            }
        }
        finally {
            // Release resources on success AND failure. The nested finally blocks make
            // sure one failing cleanup step does not skip the remaining ones.
            try {
                if (doc) {
                    await this.pdfEngine.close(doc);
                }
            }
            finally {
                try {
                    // Only engines exposing terminate() (Tesseract) need to be shut down to free memory.
                    if (this.ocrEngine && "terminate" in this.ocrEngine) {
                        await this.ocrEngine.terminate();
                    }
                }
                finally {
                    if (needsCleanup) {
                        await cleanupConversionFiles(pdfPath);
                    }
                }
            }
        }
        const result = {
            pages: processedPages,
            text: processedPages.map((p) => p.text).join("\n\n"),
        };
        // "text" output needs nothing extra; "json" additionally attaches the structured form.
        if (this.config.outputFormat === "json") {
            result.json = JSON.parse(formatJSON(result));
        }
        return result;
    }
    /**
     * Generate screenshots of PDF pages as image buffers.
     *
     * Uses PDFium for high-quality rendering. Each page is returned as a
     * {@link ScreenshotResult} with the raw image buffer and dimensions.
     *
     * @param filePath - Path to the PDF file.
     * @param pageNumbers - 1-indexed page numbers to screenshot. If omitted, all pages are rendered.
     *   Numbers outside `1..numPages` are skipped with a message on stderr.
     * @param quiet - If `true`, suppresses progress logging to stderr.
     * @returns Array of screenshot results, one per rendered page.
     */
    async screenshot(filePath, pageNumbers, quiet = false) {
        const log = (msg) => {
            if (!quiet) {
                console.error(msg); // Progress goes to stderr
            }
        };
        log(`Generating screenshots for: ${filePath}`);
        // The PDF document supplies the page count and the page dimensions.
        const doc = await this.pdfEngine.loadDocument(filePath);
        const totalPages = doc.numPages;
        const results = [];
        const pages = pageNumbers || Array.from({ length: totalPages }, (_, i) => i + 1);
        let renderer;
        try {
            renderer = new PdfiumRenderer();
            for (const pageNum of pages) {
                if (pageNum < 1 || pageNum > totalPages) {
                    // Reported even in quiet mode: this is a warning, not progress output.
                    console.error(`Skipping invalid page number: ${pageNum}`);
                    continue;
                }
                log(`Rendering page ${pageNum}...`);
                const imageBuffer = await renderer.renderPageToBuffer(filePath, pageNum, this.config.dpi);
                const pageData = await this.pdfEngine.extractPage(doc, pageNum);
                results.push({
                    pageNum,
                    width: pageData.width,
                    height: pageData.height,
                    imageBuffer,
                });
            }
        }
        finally {
            // Close the document even if closing (or constructing) the renderer fails.
            try {
                if (renderer) {
                    await renderer.close();
                }
            }
            finally {
                await this.pdfEngine.close(doc);
            }
        }
        log(`Generated ${results.length} screenshots`);
        return results;
    }
    /**
     * Run OCR on pages that need it (in parallel with concurrency limit).
     *
     * @param doc - Loaded PDF document the pages belong to.
     * @param pages - Extracted pages; OCR text items are appended to them in place.
     * @param log - Progress logger.
     */
    async runOCR(doc, pages, log) {
        if (!this.ocrEngine) {
            return;
        }
        log(`Running OCR on pages (concurrency: ${this.config.numWorkers})...`);
        const limit = pLimit(this.config.numWorkers);
        await Promise.all(pages.map((page) => limit(() => this.processPageOcr(doc, page, log))));
    }
    /**
     * Process OCR for a single page.
     *
     * A page is OCR'd in full when it has fewer than 100 characters of extracted text
     * or contains images; a page that only has garbled text regions gets targeted OCR,
     * where only OCR results overlapping those regions are kept. Results overlapping
     * text the PDF already provided are always dropped to avoid duplicates.
     *
     * Failures are best-effort: they are reported through `log` and never thrown.
     *
     * @param doc - Loaded PDF document the page belongs to.
     * @param page - Page data; accepted OCR items are pushed onto `page.textItems`.
     * @param log - Progress logger.
     */
    async processPageOcr(doc, page, log) {
        if (!this.ocrEngine) {
            return;
        }
        // Very little extracted text indicates a scanned page that needs OCR.
        const textLength = page.textItems.reduce((sum, item) => sum + item.str.length, 0);
        const garbledRegions = page.garbledTextRegions || [];
        const hasGarbledRegions = garbledRegions.length > 0;
        const needsFullOcr = textLength < 100 || page.images.length > 0;
        if (!needsFullOcr && !hasGarbledRegions) {
            return;
        }
        const fs = await import("fs/promises");
        const path = await import("path");
        const os = await import("os");
        let tmpDir;
        try {
            const imageBuffer = await this.pdfEngine.renderPageImage(doc, page.pageNum, this.config.dpi);
            // Use a private, uniquely named directory: a fixed name in the shared temp
            // directory would let concurrent parses overwrite each other's page images.
            tmpDir = await fs.mkdtemp(path.join(os.tmpdir(), "liteparse-ocr-"));
            const tmpImagePath = path.join(tmpDir, `page_${page.pageNum}_ocr.png`);
            await fs.writeFile(tmpImagePath, imageBuffer);
            log(` OCR on page ${page.pageNum}...`);
            const ocrResults = await this.ocrEngine.recognize(tmpImagePath, {
                language: this.config.ocrLanguage,
                correctRotation: true,
            });
            if (ocrResults.length > 0) {
                // OCR operates at config.dpi, PDF uses 72 points per inch (PDF spec constant).
                const scaleFactor = 72 / this.config.dpi;
                // Convert an OCR pixel bbox [left, top, right, bottom] to a rectangle in PDF points.
                const toPdfRect = (bbox) => ({
                    x: bbox[0] * scaleFactor,
                    y: bbox[1] * scaleFactor,
                    width: (bbox[2] - bbox[0]) * scaleFactor,
                    height: (bbox[3] - bbox[1]) * scaleFactor,
                });
                // Axis-aligned overlap test with a tolerance (in PDF points) on every side.
                const overlaps = (rect, otherX, otherY, otherRight, otherBottom, tolerance) => rect.x < otherRight + tolerance &&
                    rect.x + rect.width > otherX - tolerance &&
                    rect.y < otherBottom + tolerance &&
                    rect.y + rect.height > otherY - tolerance;
                const overlapsGarbledRegion = (rect) => garbledRegions.some((region) => overlaps(rect, region.x, region.y, region.x + region.width, region.y + region.height, 5));
                // Tighter tolerance for text the PDF already extracted correctly.
                const overlapsExistingText = (rect) => page.textItems.some((item) => overlaps(rect, item.x, item.y, item.x + (item.width || item.w || 0), item.y + (item.height || item.h || 0), 2));
                // Targeted OCR: only garbled regions triggered OCR, so keep only results inside them.
                const targetedOnly = hasGarbledRegions && !needsFullOcr;
                const ocrTextItems = [];
                for (const r of ocrResults) {
                    if (!(r.confidence > 0.1)) {
                        continue; // Filter low confidence
                    }
                    const rect = toPdfRect(r.bbox);
                    if (targetedOnly && !overlapsGarbledRegion(rect)) {
                        continue;
                    }
                    if (overlapsExistingText(rect)) {
                        continue;
                    }
                    // Clean OCR artifacts from table border misreads
                    const cleanedText = cleanOcrTableArtifacts(r.text);
                    if (cleanedText.length === 0) {
                        continue; // Skip items that became empty after cleaning
                    }
                    ocrTextItems.push({
                        str: cleanedText,
                        x: rect.x,
                        y: rect.y,
                        width: rect.width,
                        height: rect.height,
                        w: rect.width,
                        h: rect.height,
                        fontName: "OCR",
                        fontSize: rect.height,
                    });
                }
                page.textItems.push(...ocrTextItems);
                log(` Found ${ocrTextItems.length} text items from OCR on page ${page.pageNum}`);
            }
        }
        catch (error) {
            log(` OCR failed for page ${page.pageNum}: ${error}`);
        }
        finally {
            // Best-effort removal of the temp image, also when OCR failed.
            if (tmpDir) {
                await fs.rm(tmpDir, { recursive: true, force: true }).catch(() => { });
            }
        }
    }
    /**
     * Get a copy of the current configuration, including defaults merged with user overrides.
     *
     * @returns A shallow copy of the active {@link LiteParseConfig}.
     */
    getConfig() {
        return { ...this.config };
    }
}
|
|
333
|
+
//# sourceMappingURL=parser.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"parser.js","sourceRoot":"","sources":["../../../src/core/parser.ts"],"names":[],"mappings":"AAAA,OAAO,MAAM,MAAM,SAAS,CAAC;AAE7B,OAAO,EAAE,WAAW,EAAE,MAAM,aAAa,CAAC;AAE1C,OAAO,EAAE,WAAW,EAAE,MAAM,yBAAyB,CAAC;AACtD,OAAO,EAAE,cAAc,EAAE,MAAM,mCAAmC,CAAC;AAEnE,OAAO,EAAE,eAAe,EAAE,MAAM,6BAA6B,CAAC;AAC9D,OAAO,EAAE,aAAa,EAAE,MAAM,+BAA+B,CAAC;AAC9D,OAAO,EAAE,kBAAkB,EAAE,MAAM,uBAAuB,CAAC;AAC3D,OAAO,EAAE,kBAAkB,EAAE,MAAM,uBAAuB,CAAC;AAC3D,OAAO,EAAE,UAAU,EAAE,MAAM,mBAAmB,CAAC;AAC/C,OAAO,EAAE,YAAY,EAAE,sBAAsB,EAAE,MAAM,+BAA+B,CAAC;AACrF,OAAO,EAAE,sBAAsB,EAAE,MAAM,4BAA4B,CAAC;AAEpE;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA8BG;AACH,MAAM,OAAO,SAAS;IACZ,MAAM,CAAkB;IACxB,SAAS,CAAY;IACrB,SAAS,CAAa;IAE9B;;;;OAIG;IACH,YAAY,aAAuC,EAAE;QACnD,kCAAkC;QAClC,IAAI,CAAC,MAAM,GAAG,WAAW,CAAC,UAAU,CAAC,CAAC;QAEtC,wBAAwB;QACxB,IAAI,CAAC,SAAS,GAAG,IAAI,WAAW,EAAE,CAAC;QAEnC,wBAAwB;QACxB,qEAAqE;QACrE,IAAI,IAAI,CAAC,MAAM,CAAC,UAAU,EAAE,CAAC;YAC3B,IAAI,IAAI,CAAC,MAAM,CAAC,YAAY,EAAE,CAAC;gBAC7B,IAAI,CAAC,SAAS,GAAG,IAAI,aAAa,CAAC,IAAI,CAAC,MAAM,CAAC,YAAY,CAAC,CAAC;YAC/D,CAAC;iBAAM,CAAC;gBACN,IAAI,CAAC,SAAS,GAAG,IAAI,eAAe,CAAC,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,CAAC;YAC/D,CAAC;QACH,CAAC;IACH,CAAC;IAED;;;;;;;;;;;OAWG;IACH,KAAK,CAAC,KAAK,CAAC,QAAgB,EAAE,KAAK,GAAG,KAAK;QACzC,MAAM,GAAG,GAAG,CAAC,GAAW,EAAE,EAAE;YAC1B,IAAI,CAAC,KAAK;gBAAE,OAAO,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,CAAC,0BAA0B;QAC5D,CAAC,CAAC;QAEF,GAAG,CAAC,oBAAoB,QAAQ,EAAE,CAAC,CAAC;QACpC,MAAM,gBAAgB,GAAG,MAAM,YAAY,CAAC,QAAQ,CAAC,CAAC;QAEtD,IAAI,MAAM,IAAI,gBAAgB,EAAE,CAAC;YAC/B,mBAAmB;YACnB,MAAM,IAAI,KAAK,CAAC,sBAAsB,gBAAgB,CAAC,OAAO,EAAE,CAAC,CAAC;QACpE,CAAC;QAED,kDAAkD;QAClD,IAAI,SAAS,IAAI,gBAAgB,EAAE,CAAC;YAClC,GAAG,CAAC,0DAA0D,CAAC,CAAC;YAChE,OAAO;gBACL,KAAK,EAAE,EAAE;gBACT,IAAI,EAAE,gBAAgB,CAAC,OAAO;aAC/B,CAAC;QACJ,CAAC;QAED,2BAA2B;QAC3B,MAAM,OAAO,GAAG,gBAAgB,CAAC,OAAO,CAAC;QACzC,MAAM,YAAY,GAAG,OAAO,KAAK,QAAQ,CAAC;QAE1C,IAAI,YAAY,EAAE,CAAC;YACjB,GAAG,CAAC,aAAa,gBAAgB,CAAC,iBAAiB,SAAS,CAAC,CAAC;QAChE,CAAC;QAED,oBAAoB;QACpB,MAAM,GAAG,GAAG,MAAM,I
AAI,CAAC,SAAS,CAAC,YAAY,CAAC,OAAO,CAAC,CAAC;QACvD,GAAG,CAAC,mBAAmB,GAAG,CAAC,QAAQ,QAAQ,CAAC,CAAC;QAE7C,gBAAgB;QAChB,MAAM,KAAK,GAAG,MAAM,IAAI,CAAC,SAAS,CAAC,eAAe,CAChD,GAAG,EACH,IAAI,CAAC,MAAM,CAAC,QAAQ,EACpB,IAAI,CAAC,MAAM,CAAC,WAAW,CACxB,CAAC;QAEF,6BAA6B;QAC7B,IAAI,IAAI,CAAC,SAAS,EAAE,CAAC;YACnB,MAAM,IAAI,CAAC,MAAM,CAAC,GAAG,EAAE,KAAK,EAAE,GAAG,CAAC,CAAC;QACrC,CAAC;QAED,0DAA0D;QAC1D,MAAM,cAAc,GAAG,kBAAkB,CAAC,KAAK,EAAE,IAAI,CAAC,MAAM,CAAC,CAAC;QAE9D,kCAAkC;QAClC,IAAI,IAAI,CAAC,MAAM,CAAC,kBAAkB,EAAE,CAAC;YACnC,KAAK,MAAM,IAAI,IAAI,cAAc,EAAE,CAAC;gBAClC,IAAI,CAAC,aAAa,GAAG,kBAAkB,CAAC,IAAI,CAAC,SAAS,CAAC,CAAC;YAC1D,CAAC;QACH,CAAC;QAED,mBAAmB;QACnB,MAAM,QAAQ,GAAG,cAAc,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;QAEhE,qBAAqB;QACrB,MAAM,IAAI,CAAC,SAAS,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC;QAEhC,wDAAwD;QACxD,IAAI,IAAI,CAAC,SAAS,IAAI,WAAW,IAAI,IAAI,CAAC,SAAS,EAAE,CAAC;YACpD,MAAO,IAAI,CAAC,SAA6B,CAAC,SAAS,EAAE,CAAC;QACxD,CAAC;QAED,qCAAqC;QACrC,IAAI,YAAY,EAAE,CAAC;YACjB,MAAM,sBAAsB,CAAC,OAAO,CAAC,CAAC;QACxC,CAAC;QAED,MAAM,MAAM,GAAgB;YAC1B,KAAK,EAAE,cAAc;YACrB,IAAI,EAAE,QAAQ;SACf,CAAC;QAEF,gCAAgC;QAChC,QAAQ,IAAI,CAAC,MAAM,CAAC,YAAY,EAAE,CAAC;YACjC,KAAK,MAAM;gBACT,MAAM,CAAC,IAAI,GAAG,IAAI,CAAC,KAAK,CAAC,UAAU,CAAC,MAAM,CAAC,CAAC,CAAC;gBAC7C,MAAM;YACR,KAAK,MAAM;gBACT,yBAAyB;gBACzB,MAAM;QACV,CAAC;QAED,OAAO,MAAM,CAAC;IAChB,CAAC;IAED;;;;;;;;;;OAUG;IACH,KAAK,CAAC,UAAU,CACd,QAAgB,EAChB,WAAsB,EACtB,KAAK,GAAG,KAAK;QAEb,MAAM,GAAG,GAAG,CAAC,GAAW,EAAE,EAAE;YAC1B,IAAI,CAAC,KAAK;gBAAE,OAAO,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,CAAC,0BAA0B;QAC5D,CAAC,CAAC;QAEF,GAAG,CAAC,+BAA+B,QAAQ,EAAE,CAAC,CAAC;QAE/C,qDAAqD;QACrD,MAAM,GAAG,GAAG,MAAM,IAAI,CAAC,SAAS,CAAC,YAAY,CAAC,QAAQ,CAAC,CAAC;QACxD,MAAM,UAAU,GAAG,GAAG,CAAC,QAAQ,CAAC;QAEhC,MAAM,OAAO,GAAuB,EAAE,CAAC;QACvC,MAAM,KAAK,GAAG,WAAW,IAAI,KAAK,CAAC,IAAI,CAAC,EAAE,MAAM,EAAE,UAAU,EAAE,EAAE,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC;QAEjF,6BAA6B;QAC7B,MAAM,QAAQ,GAAG,IAAI,cAAc,EAAE,CAAC;QAEtC,IAAI,CAAC;YACH
,KAAK,MAAM,OAAO,IAAI,KAAK,EAAE,CAAC;gBAC5B,IAAI,OAAO,GAAG,CAAC,IAAI,OAAO,GAAG,UAAU,EAAE,CAAC;oBACxC,OAAO,CAAC,KAAK,CAAC,iCAAiC,OAAO,EAAE,CAAC,CAAC;oBAC1D,SAAS;gBACX,CAAC;gBAED,GAAG,CAAC,kBAAkB,OAAO,KAAK,CAAC,CAAC;gBACpC,MAAM,WAAW,GAAG,MAAM,QAAQ,CAAC,kBAAkB,CAAC,QAAQ,EAAE,OAAO,EAAE,IAAI,CAAC,MAAM,CAAC,GAAG,CAAC,CAAC;gBAE1F,sBAAsB;gBACtB,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,SAAS,CAAC,WAAW,CAAC,GAAG,EAAE,OAAO,CAAC,CAAC;gBAEhE,OAAO,CAAC,IAAI,CAAC;oBACX,OAAO;oBACP,KAAK,EAAE,QAAQ,CAAC,KAAK;oBACrB,MAAM,EAAE,QAAQ,CAAC,MAAM;oBACvB,WAAW;iBACZ,CAAC,CAAC;YACL,CAAC;QACH,CAAC;gBAAS,CAAC;YACT,qBAAqB;YACrB,MAAM,QAAQ,CAAC,KAAK,EAAE,CAAC;YACvB,MAAM,IAAI,CAAC,SAAS,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC;QAClC,CAAC;QAED,GAAG,CAAC,aAAa,OAAO,CAAC,MAAM,cAAc,CAAC,CAAC;QAC/C,OAAO,OAAO,CAAC;IACjB,CAAC;IAED;;OAEG;IACK,KAAK,CAAC,MAAM,CAClB,GAAgB,EAChB,KAAiB,EACjB,GAA0B;QAE1B,IAAI,CAAC,IAAI,CAAC,SAAS;YAAE,OAAO;QAE5B,GAAG,CAAC,sCAAsC,IAAI,CAAC,MAAM,CAAC,UAAU,MAAM,CAAC,CAAC;QAExE,MAAM,KAAK,GAAG,MAAM,CAAC,IAAI,CAAC,MAAM,CAAC,UAAU,CAAC,CAAC;QAE7C,MAAM,OAAO,CAAC,GAAG,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,KAAK,CAAC,GAAG,EAAE,CAAC,IAAI,CAAC,cAAc,CAAC,GAAG,EAAE,IAAI,EAAE,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC;IAC3F,CAAC;IAED;;OAEG;IACK,KAAK,CAAC,cAAc,CAC1B,GAAgB,EAChB,IAAc,EACd,GAA0B;QAE1B,IAAI,CAAC,IAAI,CAAC,SAAS;YAAE,OAAO;QAE5B,+DAA+D;QAC/D,MAAM,UAAU,GAAG,IAAI,CAAC,SAAS,CAAC,MAAM,CACtC,CAAC,GAAW,EAAE,IAAc,EAAE,EAAE,CAAC,GAAG,GAAG,IAAI,CAAC,GAAG,CAAC,MAAM,EACtD,CAAC,CACF,CAAC;QAEF,2CAA2C;QAC3C,MAAM,iBAAiB,GAAG,IAAI,CAAC,kBAAkB,IAAI,IAAI,CAAC,kBAAkB,CAAC,MAAM,GAAG,CAAC,CAAC;QACxF,MAAM,YAAY,GAAG,UAAU,GAAG,GAAG,IAAI,IAAI,CAAC,MAAM,CAAC,MAAM,GAAG,CAAC,CAAC;QAEhE,IAAI,CAAC,YAAY,IAAI,CAAC,iBAAiB,EAAE,CAAC;YACxC,OAAO;QACT,CAAC;QAED,IAAI,CAAC;YACH,uBAAuB;YACvB,MAAM,WAAW,GAAG,MAAM,IAAI,CAAC,SAAS,CAAC,eAAe,CAAC,GAAG,EAAE,IAAI,CAAC,OAAO,EAAE,IAAI,CAAC,MAAM,CAAC,GAAG,CAAC,CAAC;YAE7F,4BAA4B;YAC5B,MAAM,EAAE,GAAG,MAAM,MAAM,CAAC,aAAa,CAAC,CAAC;YACvC,MAAM,IAAI,GAAG,MAAM,MAAM,CAAC,MAAM,CAAC,CAAC;YAClC,MAAM,EAAE,GAAG,MAAM,MAAM,CAAC,I
AAI,CAAC,CAAC;YAC9B,MAAM,MAAM,GAAG,EAAE,CAAC,MAAM,EAAE,CAAC;YAC3B,MAAM,YAAY,GAAG,IAAI,CAAC,IAAI,CAAC,MAAM,EAAE,QAAQ,IAAI,CAAC,OAAO,UAAU,CAAC,CAAC;YACvE,MAAM,EAAE,CAAC,SAAS,CAAC,YAAY,EAAE,WAAW,CAAC,CAAC;YAE9C,UAAU;YACV,GAAG,CAAC,iBAAiB,IAAI,CAAC,OAAO,KAAK,CAAC,CAAC;YACxC,MAAM,UAAU,GAAG,MAAM,IAAI,CAAC,SAAS,CAAC,SAAS,CAAC,YAAY,EAAE;gBAC9D,QAAQ,EAAE,IAAI,CAAC,MAAM,CAAC,WAAW;gBACjC,eAAe,EAAE,IAAI;aACtB,CAAC,CAAC;YAEH,oDAAoD;YACpD,IAAI,UAAU,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;gBAC1B,wDAAwD;gBACxD,8EAA8E;gBAC9E,MAAM,WAAW,GAAG,EAAE,GAAG,IAAI,CAAC,MAAM,CAAC,GAAG,CAAC;gBAEzC,iEAAiE;gBACjE,MAAM,qBAAqB,GAAG,CAAC,OAAiB,EAAW,EAAE;oBAC3D,IAAI,CAAC,IAAI,CAAC,kBAAkB;wBAAE,OAAO,KAAK,CAAC;oBAE3C,MAAM,IAAI,GAAG,OAAO,CAAC,CAAC,CAAC,GAAG,WAAW,CAAC;oBACtC,MAAM,IAAI,GAAG,OAAO,CAAC,CAAC,CAAC,GAAG,WAAW,CAAC;oBACtC,MAAM,IAAI,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,GAAG,OAAO,CAAC,CAAC,CAAC,CAAC,GAAG,WAAW,CAAC;oBACrD,MAAM,IAAI,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,GAAG,OAAO,CAAC,CAAC,CAAC,CAAC,GAAG,WAAW,CAAC;oBAErD,8DAA8D;oBAC9D,MAAM,SAAS,GAAG,CAAC,CAAC,CAAC,aAAa;oBAClC,KAAK,MAAM,MAAM,IAAI,IAAI,CAAC,kBAAkB,EAAE,CAAC;wBAC7C,MAAM,QAAQ,GACZ,IAAI,GAAG,MAAM,CAAC,CAAC,GAAG,MAAM,CAAC,KAAK,GAAG,SAAS,IAAI,IAAI,GAAG,IAAI,GAAG,MAAM,CAAC,CAAC,GAAG,SAAS,CAAC;wBACnF,MAAM,QAAQ,GACZ,IAAI,GAAG,MAAM,CAAC,CAAC,GAAG,MAAM,CAAC,MAAM,GAAG,SAAS,IAAI,IAAI,GAAG,IAAI,GAAG,MAAM,CAAC,CAAC,GAAG,SAAS,CAAC;wBACpF,IAAI,QAAQ,IAAI,QAAQ,EAAE,CAAC;4BACzB,OAAO,IAAI,CAAC;wBACd,CAAC;oBACH,CAAC;oBACD,OAAO,KAAK,CAAC;gBACf,CAAC,CAAC;gBAEF,6EAA6E;gBAC7E,sEAAsE;gBACtE,MAAM,oBAAoB,GAAG,CAAC,OAAiB,EAAW,EAAE;oBAC1D,MAAM,IAAI,GAAG,OAAO,CAAC,CAAC,CAAC,GAAG,WAAW,CAAC;oBACtC,MAAM,IAAI,GAAG,OAAO,CAAC,CAAC,CAAC,GAAG,WAAW,CAAC;oBACtC,MAAM,IAAI,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,GAAG,OAAO,CAAC,CAAC,CAAC,CAAC,GAAG,WAAW,CAAC;oBACrD,MAAM,IAAI,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,GAAG,OAAO,CAAC,CAAC,CAAC,CAAC,GAAG,WAAW,CAAC;oBAErD,MAAM,SAAS,GAAG,CAAC,CAAC,CAAC,mDAAmD;oBACxE,KAAK,MAAM,IAAI,IAAI,IAAI,CAAC,SAAS,EAAE,CAAC;wBAClC,MAAM,SAAS,GAAG,IAAI,CAAC,CAAC,GAAG,CAAC,IAAI,CAAC,KAAK,IAAI,IAAI
,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC;wBACvD,MAAM,UAAU,GAAG,IAAI,CAAC,CAAC,GAAG,CAAC,IAAI,CAAC,MAAM,IAAI,IAAI,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC;wBAEzD,MAAM,QAAQ,GAAG,IAAI,GAAG,SAAS,GAAG,SAAS,IAAI,IAAI,GAAG,IAAI,GAAG,IAAI,CAAC,CAAC,GAAG,SAAS,CAAC;wBAClF,MAAM,QAAQ,GAAG,IAAI,GAAG,UAAU,GAAG,SAAS,IAAI,IAAI,GAAG,IAAI,GAAG,IAAI,CAAC,CAAC,GAAG,SAAS,CAAC;wBAEnF,IAAI,QAAQ,IAAI,QAAQ,EAAE,CAAC;4BACzB,OAAO,IAAI,CAAC;wBACd,CAAC;oBACH,CAAC;oBACD,OAAO,KAAK,CAAC;gBACf,CAAC,CAAC;gBAEF,MAAM,YAAY,GAAe,UAAU;qBACxC,MAAM,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,UAAU,GAAG,GAAG,CAAC,CAAC,wBAAwB;qBAC1D,MAAM,CAAC,CAAC,CAAC,EAAE,EAAE;oBACZ,6EAA6E;oBAC7E,IAAI,iBAAiB,IAAI,CAAC,YAAY,EAAE,CAAC;wBACvC,OAAO,qBAAqB,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC;oBACvC,CAAC;oBACD,oCAAoC;oBACpC,OAAO,IAAI,CAAC;gBACd,CAAC,CAAC;qBACD,MAAM,CAAC,CAAC,CAAC,EAAE,EAAE;oBACZ,iEAAiE;oBACjE,sEAAsE;oBACtE,OAAO,CAAC,oBAAoB,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC;gBACvC,CAAC,CAAC;qBACD,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE;oBACT,iDAAiD;oBACjD,MAAM,WAAW,GAAG,sBAAsB,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC;oBACnD,OAAO;wBACL,GAAG,EAAE,WAAW;wBAChB,CAAC,EAAE,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,GAAG,WAAW;wBAC1B,CAAC,EAAE,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,GAAG,WAAW;wBAC1B,KAAK,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC,GAAG,WAAW;wBAC5C,MAAM,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC,GAAG,WAAW;wBAC7C,CAAC,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC,GAAG,WAAW;wBACxC,CAAC,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC,GAAG,WAAW;wBACxC,QAAQ,EAAE,KAAK;wBACf,QAAQ,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC,GAAG,WAAW;qBAChD,CAAC;gBACJ,CAAC,CAAC;qBACD,MAAM,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC,IAAI,CAAC,GAAG,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC,CAAC,8CAA8C;gBAExF,gDAAgD;gBAChD,IAAI,CAAC,SAAS,CAAC,IAAI,CAAC,GAAG,YAAY,CAAC,CAAC;gBACrC,GAAG,CAAC,WAAW,YAAY,CAAC,MAAM,gCAAgC,IAAI,CAAC,OAAO,EAAE,CAAC,CAAC;YACpF,CAAC;YAED,qBAAqB;YACrB,MAAM,EAAE
,CAAC,MAAM,CAAC,YAAY,CAAC,CAAC,KAAK,CAAC,GAAG,EAAE,GAAE,CAAC,CAAC,CAAC;QAChD,CAAC;QAAC,OAAO,KAAK,EAAE,CAAC;YACf,GAAG,CAAC,yBAAyB,IAAI,CAAC,OAAO,KAAK,KAAK,EAAE,CAAC,CAAC;QACzD,CAAC;IACH,CAAC;IAED;;;;OAIG;IACH,SAAS;QACP,OAAO,EAAE,GAAG,IAAI,CAAC,MAAM,EAAE,CAAC;IAC5B,CAAC;CACF"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"parser.test.d.ts","sourceRoot":"","sources":["../../../src/core/parser.test.ts"],"names":[],"mappings":""}
|