@minded-ai/mindedjs 3.0.8-beta.12 → 3.1.9-beta.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/cli/index.js +2 -9
- package/dist/cli/index.js.map +1 -1
- package/dist/cli/runCommand.d.ts +1 -1
- package/dist/cli/runCommand.d.ts.map +1 -1
- package/dist/cli/runCommand.js +31 -23
- package/dist/cli/runCommand.js.map +1 -1
- package/dist/index.d.ts +2 -1
- package/dist/index.d.ts.map +1 -1
- package/dist/index.js +6 -3
- package/dist/index.js.map +1 -1
- package/dist/internalTools/documentExtraction/documentExtraction.d.ts +112 -102
- package/dist/internalTools/documentExtraction/documentExtraction.d.ts.map +1 -1
- package/dist/internalTools/documentExtraction/documentExtraction.js +146 -705
- package/dist/internalTools/documentExtraction/documentExtraction.js.map +1 -1
- package/dist/internalTools/documentExtraction/extractStructuredData.d.ts +57 -0
- package/dist/internalTools/documentExtraction/extractStructuredData.d.ts.map +1 -0
- package/dist/internalTools/documentExtraction/extractStructuredData.js +121 -0
- package/dist/internalTools/documentExtraction/extractStructuredData.js.map +1 -0
- package/dist/internalTools/documentExtraction/parseDocumentLocal.d.ts +16 -0
- package/dist/internalTools/documentExtraction/parseDocumentLocal.d.ts.map +1 -0
- package/dist/internalTools/documentExtraction/parseDocumentLocal.js +547 -0
- package/dist/internalTools/documentExtraction/parseDocumentLocal.js.map +1 -0
- package/dist/internalTools/documentExtraction/parseDocumentManaged.d.ts +13 -0
- package/dist/internalTools/documentExtraction/parseDocumentManaged.d.ts.map +1 -0
- package/dist/internalTools/documentExtraction/parseDocumentManaged.js +150 -0
- package/dist/internalTools/documentExtraction/parseDocumentManaged.js.map +1 -0
- package/dist/nodes/addAppToolNode.d.ts.map +1 -1
- package/dist/nodes/addAppToolNode.js +20 -1
- package/dist/nodes/addAppToolNode.js.map +1 -1
- package/dist/toolsLibrary/classifier.d.ts +2 -2
- package/dist/toolsLibrary/parseDocument.d.ts +11 -10
- package/dist/toolsLibrary/parseDocument.d.ts.map +1 -1
- package/dist/toolsLibrary/parseDocument.js +33 -189
- package/dist/toolsLibrary/parseDocument.js.map +1 -1
- package/dist/toolsLibrary/withBrowserSession.d.ts.map +1 -1
- package/dist/toolsLibrary/withBrowserSession.js +70 -2
- package/dist/toolsLibrary/withBrowserSession.js.map +1 -1
- package/dist/types/Flows.types.d.ts +1 -0
- package/dist/types/Flows.types.d.ts.map +1 -1
- package/dist/types/Flows.types.js.map +1 -1
- package/dist/utils/schemaUtils.js +1 -1
- package/dist/utils/schemaUtils.js.map +1 -1
- package/docs/tooling/document-processing.md +235 -174
- package/package.json +2 -1
- package/src/cli/index.ts +2 -10
- package/src/cli/runCommand.ts +31 -25
- package/src/index.ts +2 -1
- package/src/internalTools/documentExtraction/documentExtraction.ts +184 -767
- package/src/internalTools/documentExtraction/extractStructuredData.ts +140 -0
- package/src/internalTools/documentExtraction/parseDocumentLocal.ts +660 -0
- package/src/internalTools/documentExtraction/parseDocumentManaged.ts +152 -0
- package/src/nodes/addAppToolNode.ts +30 -7
- package/src/toolsLibrary/parseDocument.ts +38 -206
- package/src/toolsLibrary/withBrowserSession.ts +89 -4
- package/src/types/Flows.types.ts +1 -0
- package/src/utils/schemaUtils.ts +1 -1
|
@@ -1 +1 @@
|
|
|
1
|
-
{"version":3,"file":"documentExtraction.js","sourceRoot":"","sources":["../../../src/internalTools/documentExtraction/documentExtraction.ts"],"names":[],"mappings":";;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;AAwDA,kDA4BC;AAlFD,uCAAyB;AACzB,2CAA6B;AAC7B,+CAA4C;AAC5C,uCAAyB;AACzB,mCAAiI;AAEjI;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA+CG;AACI,KAAK,UAAU,mBAAmB,CAAa,OAQrD;IASC,8BAA8B;IAC9B,MAAM,SAAS,GAAG,IAAI,iBAAiB,CAAC,OAAO,CAAC,MAAM,EAAE,OAAO,CAAC,GAAG,CAAC,CAAC;IAErE,4CAA4C;IAC5C,OAAO,SAAS,CAAC,mBAAmB,CAAC;QACnC,YAAY,EAAE,OAAO,CAAC,YAAY;QAClC,eAAe,EAAE,OAAO,CAAC,eAAe;QACxC,WAAW,EAAE,OAAO,CAAC,WAAW;QAChC,MAAM,EAAE,OAAO,CAAC,MAAM;QACtB,YAAY,EAAE,OAAO,CAAC,YAAY;KACnC,CAAC,CAAC;AACL,CAAC;AAED;;;GAGG;AACH,MAAa,iBAAiB;IAO5B,YAAY,SAAkC,EAAE,EAAE,GAAuB;QALjE,QAAG,GAA6B,IAAI,CAAC;QACrC,qBAAgB,GAAkB,IAAI,CAAC;QACvC,gBAAW,GAAQ,IAAI,CAAC;QACxB,uBAAkB,GAAG,KAAK,CAAC;QAGjC,IAAI,CAAC,MAAM,GAAG;YACZ,aAAa,EAAE,IAAI;YACnB,YAAY,EAAE,EAAE;YAChB,SAAS,EAAE,KAAK;YAChB,GAAG,MAAM;SACV,CAAC;QAEF,IAAI,CAAC,GAAG,GAAG,GAAG,IAAI,IAAI,CAAC;QACvB,IAAI,CAAC,gBAAgB,GAAG,IAAI,CAAC,MAAM,CAAC,gBAAgB,IAAI,OAAO,CAAC,GAAG,CAAC,mBAAmB,IAAI,IAAI,CAAC;IAClG,CAAC;IAED;;OAEG;IACK,KAAK,CAAC,mBAAmB,CAAC,QAAgB;QAChD,IAAI,CAAC,IAAI,CAAC,gBAAgB,EAAE,CAAC;YAC3B,OAAO,IAAI,CAAC;QACd,CAAC;QAED,IAAI,CAAC;YACH,wCAAwC;YACxC,MAAM,WAAW,GAAG,EAAE,CAAC,YAAY,CAAC,QAAQ,CAAC,CAAC;YAC9C,MAAM,QAAQ,GAAG,IAAI,CAAC,QAAQ,CAAC,QAAQ,CAAC,CAAC;YACzC,MAAM,QAAQ,GAAG,IAAI,CAAC,WAAW,CAAC,IAAI,CAAC,OAAO,CAAC,QAAQ,CAAC,CAAC,CAAC;YAE1D,MAAM,QAAQ,GAAG,IAAI,QAAQ,EAAE,CAAC;YAChC,MAAM,IAAI,GAAG,IAAI,IAAI,CAAC,CAAC,WAAW,CAAC,EAAE,EAAE,IAAI,EAAE,QAAQ,EAAE,CAAC,CAAC;YACzD,QAAQ,CAAC,MAAM,CAAC,MAAM,EAAE,IAAI,EAAE,QAAQ,CAAC,CAAC;YACxC,QAAQ,CAAC,MAAM,CAAC,cAAc,EAAE,MAAM,CAAC,CAAC;YAExC,MAAM,cAAc,GAAG,MAAM,KAAK,CAAC,uDAAuD,EAAE;gBAC1F,MAAM,EAAE,MAAM;gBACd,OAAO,EAAE;oBACP,MAAM,EAAE,kBAAkB;oBAC1B,aAAa,EAAE,UAAU,IAAI,CAAC,gBAAgB,EAAE;iBACjD;gBACD,IAAI,EAAE,QAAQ;aACf,CAAC,CAAC;YAEH,IAAI,CAAC,cAAc,CAAC,EAAE,EAAE,CAAC;gBACvB,MAAM,SAAS,GAAG,MAAM,cAAc,CAAC,IAAI,EAA
E,CAAC;gBAC9C,MAAM,IAAI,KAAK,CAAC,0BAA0B,cAAc,CAAC,MAAM,MAAM,SAAS,EAAE,CAAC,CAAC;YACpF,CAAC;YAED,MAAM,YAAY,GAAG,MAAM,cAAc,CAAC,IAAI,EAAE,CAAC;YACjD,MAAM,KAAK,GAAG,YAAY,CAAC,EAAE,IAAI,YAAY,CAAC,MAAM,CAAC;YAErD,IAAI,CAAC,KAAK,EAAE,CAAC;gBACX,MAAM,IAAI,KAAK,CAAC,gCAAgC,CAAC,CAAC;YACpD,CAAC;YAED,eAAM,CAAC,IAAI,CAAC;gBACV,GAAG,EAAE,iDAAiD;gBACtD,KAAK;gBACL,QAAQ;aACT,CAAC,CAAC;YAEH,kCAAkC;YAClC,IAAI,QAAQ,GAAG,CAAC,CAAC;YACjB,MAAM,WAAW,GAAG,EAAE,CAAC,CAAC,kDAAkD;YAC1E,MAAM,SAAS,GAAG,IAAI,CAAC,CAAC,YAAY;YAEpC,OAAO,QAAQ,GAAG,WAAW,EAAE,CAAC;gBAC9B,MAAM,cAAc,GAAG,MAAM,KAAK,CAAC,sDAAsD,KAAK,EAAE,EAAE;oBAChG,MAAM,EAAE,KAAK;oBACb,OAAO,EAAE;wBACP,MAAM,EAAE,kBAAkB;wBAC1B,aAAa,EAAE,UAAU,IAAI,CAAC,gBAAgB,EAAE;qBACjD;iBACF,CAAC,CAAC;gBAEH,IAAI,CAAC,cAAc,CAAC,EAAE,EAAE,CAAC;oBACvB,MAAM,IAAI,KAAK,CAAC,+BAA+B,cAAc,CAAC,MAAM,EAAE,CAAC,CAAC;gBAC1E,CAAC;gBAED,MAAM,YAAY,GAAG,MAAM,cAAc,CAAC,IAAI,EAAE,CAAC;gBACjD,MAAM,MAAM,GAAG,YAAY,CAAC,MAAM,IAAI,YAAY,CAAC,UAAU,CAAC;gBAE9D,IAAI,MAAM,KAAK,SAAS,IAAI,MAAM,KAAK,WAAW,IAAI,MAAM,KAAK,WAAW,EAAE,CAAC;oBAC7E,uCAAuC;oBAEvC,wCAAwC;oBACxC,MAAM,UAAU,GAAG,IAAI,eAAe,EAAE,CAAC;oBACzC,MAAM,OAAO,GAAG,UAAU,CAAC,GAAG,EAAE,CAAC,UAAU,CAAC,KAAK,EAAE,EAAE,KAAK,CAAC,CAAC,CAAC,oBAAoB;oBAEjF,IAAI,cAAc,CAAC;oBACnB,IAAI,CAAC;wBACH,cAAc,GAAG,MAAM,KAAK,CAAC,sDAAsD,KAAK,kBAAkB,EAAE;4BAC1G,MAAM,EAAE,KAAK;4BACb,OAAO,EAAE;gCACP,MAAM,EAAE,kBAAkB;gCAC1B,aAAa,EAAE,UAAU,IAAI,CAAC,gBAAgB,EAAE;6BACjD;4BACD,MAAM,EAAE,UAAU,CAAC,MAAM;yBAC1B,CAAC,CAAC;oBACL,CAAC;oBAAC,OAAO,UAAU,EAAE,CAAC;wBACpB,YAAY,CAAC,OAAO,CAAC,CAAC;wBACtB,IAAI,UAAU,YAAY,KAAK,IAAI,UAAU,CAAC,IAAI,KAAK,YAAY,EAAE,CAAC;4BACpE,MAAM,IAAI,KAAK,CAAC,2DAA2D,CAAC,CAAC;wBAC/E,CAAC;wBACD,MAAM,UAAU,CAAC;oBACnB,CAAC;oBAED,YAAY,CAAC,OAAO,CAAC,CAAC;oBAEtB,IAAI,CAAC,cAAc,CAAC,EAAE,EAAE,CAAC;wBACvB,MAAM,SAAS,GAAG,MAAM,cAAc,CAAC,IAAI,EAAE,CAAC;wBAC9C,MAAM,IAAI,KAAK,CAAC,+BAA+B,cAAc,CAAC,MAAM,MAAM,SAAS,EAAE,CAAC,CAAC;oBACzF,CAAC;oBAED,IAAI,UAAe,CAAC;oBACpB,IAAI,CAAC;wBACH,wEAAwE;wBACxE,IAAI,YAAY,CAAC;wBACjB,IAAI,cAAc,CAAC,IAAI,EAAE,CAAC;
4BACxB,MAAM,MAAM,GAAG,cAAc,CAAC,IAAI,CAAC,SAAS,EAAE,CAAC;4BAC/C,MAAM,MAAM,GAAiB,EAAE,CAAC;4BAChC,IAAI,WAAW,GAAG,CAAC,CAAC;4BAEpB,IAAI,CAAC;gCACH,OAAO,IAAI,EAAE,CAAC;oCACZ,MAAM,EAAE,IAAI,EAAE,KAAK,EAAE,GAAG,MAAM,MAAM,CAAC,IAAI,EAAE,CAAC;oCAC5C,IAAI,IAAI;wCAAE,MAAM;oCAChB,IAAI,KAAK,EAAE,CAAC;wCACV,MAAM,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;wCACnB,WAAW,IAAI,KAAK,CAAC,MAAM,CAAC;oCAC9B,CAAC;gCACH,CAAC;gCAED,iBAAiB;gCACjB,MAAM,QAAQ,GAAG,IAAI,UAAU,CAAC,WAAW,CAAC,CAAC;gCAC7C,IAAI,MAAM,GAAG,CAAC,CAAC;gCACf,KAAK,MAAM,KAAK,IAAI,MAAM,EAAE,CAAC;oCAC3B,QAAQ,CAAC,GAAG,CAAC,KAAK,EAAE,MAAM,CAAC,CAAC;oCAC5B,MAAM,IAAI,KAAK,CAAC,MAAM,CAAC;gCACzB,CAAC;gCAED,YAAY,GAAG,IAAI,WAAW,EAAE,CAAC,MAAM,CAAC,QAAQ,CAAC,CAAC;4BACpD,CAAC;oCAAS,CAAC;gCACT,MAAM,CAAC,WAAW,EAAE,CAAC;4BACvB,CAAC;wBACH,CAAC;6BAAM,CAAC;4BACN,YAAY,GAAG,MAAM,cAAc,CAAC,IAAI,EAAE,CAAC;wBAC7C,CAAC;wBAED,+DAA+D;wBAC/D,IAAI,CAAC;4BACH,UAAU,GAAG,IAAI,CAAC,KAAK,CAAC,YAAY,CAAC,CAAC;wBACxC,CAAC;wBAAC,WAAM,CAAC;4BACP,8DAA8D;4BAC9D,UAAU,GAAG,YAAY,CAAC;wBAC5B,CAAC;oBACH,CAAC;oBAAC,OAAO,SAAS,EAAE,CAAC;wBACnB,eAAM,CAAC,KAAK,CAAC;4BACX,GAAG,EAAE,kDAAkD;4BACvD,KAAK;4BACL,KAAK,EAAE,SAAS,YAAY,KAAK,CAAC,CAAC,CAAC,SAAS,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,SAAS,CAAC;4BACzE,KAAK,EAAE,SAAS,YAAY,KAAK,CAAC,CAAC,CAAC,SAAS,CAAC,KAAK,CAAC,CAAC,CAAC,SAAS;yBAChE,CAAC,CAAC;wBACH,MAAM,IAAI,KAAK,CAAC,yCAAyC,CAAC,CAAC;oBAC7D,CAAC;oBAED,eAAM,CAAC,KAAK,CAAC;wBACX,GAAG,EAAE,2CAA2C;wBAChD,KAAK;wBACL,QAAQ,EAAE,OAAO,UAAU;wBAC3B,IAAI,EAAE,OAAO,UAAU,KAAK,QAAQ,IAAI,UAAU,KAAK,IAAI,CAAC,CAAC,CAAC,MAAM,CAAC,IAAI,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC,EAAE;wBAC1F,WAAW,EAAE,OAAO,UAAU,KAAK,QAAQ,IAAI,UAAU,IAAI,UAAU;wBACvE,UAAU,EAAE,OAAO,UAAU,KAAK,QAAQ,IAAI,SAAS,IAAI,UAAU;wBACrE,OAAO,EAAE,OAAO,UAAU,KAAK,QAAQ,IAAI,MAAM,IAAI,UAAU;qBAChE,CAAC,CAAC;oBAEH,gFAAgF;oBAChF,IAAI,eAAuB,CAAC;oBAC5B,IAAI,OAAO,UAAU,KAAK,QAAQ,EAAE,CAAC;wBACnC,eAAe,GAAG,UAAU,CAAC;oBAC/B,CAAC;yBAAM,CAAC;wBACN,eAAe,GAAG,UAAU,CAAC,QAAQ,IAAI,UAAU,CAAC,OAAO,IAAI,UAAU,CAAC,IAAI,IAAI,EAAE,CAAC;oBACvF,CAAC;oBAED,IAAI,CAAC,eAAe,EAAE,CAA
C;wBACrB,eAAM,CAAC,KAAK,CAAC;4BACX,GAAG,EAAE,0CAA0C;4BAC/C,KAAK;4BACL,UAAU,EAAE,IAAI,CAAC,SAAS,CAAC,UAAU,CAAC,CAAC,SAAS,CAAC,CAAC,EAAE,GAAG,CAAC;yBACzD,CAAC,CAAC;wBACH,MAAM,IAAI,KAAK,CAAC,kCAAkC,CAAC,CAAC;oBACtD,CAAC;oBAED,eAAM,CAAC,IAAI,CAAC;wBACV,GAAG,EAAE,kEAAkE;wBACvE,KAAK;wBACL,aAAa,EAAE,eAAe,CAAC,MAAM;wBACrC,OAAO,EAAE,eAAe,CAAC,SAAS,CAAC,CAAC,EAAE,GAAG,CAAC;qBAC3C,CAAC,CAAC;oBAEH,eAAM,CAAC,KAAK,CAAC;wBACX,GAAG,EAAE,sDAAsD;wBAC3D,KAAK;qBACN,CAAC,CAAC;oBAEH,OAAO,eAAe,CAAC;gBACzB,CAAC;qBAAM,IAAI,MAAM,KAAK,QAAQ,IAAI,MAAM,KAAK,OAAO,IAAI,MAAM,KAAK,QAAQ,EAAE,CAAC;oBAC5E,MAAM,IAAI,KAAK,CAAC,uBAAuB,YAAY,CAAC,KAAK,IAAI,eAAe,EAAE,CAAC,CAAC;gBAClF,CAAC;gBAED,2BAA2B;gBAC3B,MAAM,IAAI,OAAO,CAAC,CAAC,OAAO,EAAE,EAAE,CAAC,UAAU,CAAC,OAAO,EAAE,SAAS,CAAC,CAAC,CAAC;gBAC/D,QAAQ,EAAE,CAAC;YACb,CAAC;YAED,MAAM,IAAI,KAAK,CAAC,uCAAuC,CAAC,CAAC;QAC3D,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACb,eAAM,CAAC,IAAI,CAAC;gBACV,OAAO,EAAE,+CAA+C;gBACxD,GAAG;aACJ,CAAC,CAAC;YACH,OAAO,IAAI,CAAC;QACd,CAAC;gBAAS,CAAC;YACT,eAAM,CAAC,KAAK,CAAC;gBACX,GAAG,EAAE,kDAAkD;gBACvD,QAAQ;aACT,CAAC,CAAC;QACL,CAAC;IACH,CAAC;IAED;;OAEG;IACK,WAAW,CAAC,aAAqB;QACvC,MAAM,SAAS,GAA8B;YAC3C,MAAM,EAAE,iBAAiB;YACzB,MAAM,EAAE,oBAAoB;YAC5B,OAAO,EAAE,yEAAyE;YAClF,MAAM,EAAE,YAAY;YACpB,MAAM,EAAE,iBAAiB;YACzB,MAAM,EAAE,YAAY;YACpB,OAAO,EAAE,YAAY;YACrB,MAAM,EAAE,WAAW;YACnB,MAAM,EAAE,WAAW;YACnB,MAAM,EAAE,WAAW;YACnB,OAAO,EAAE,YAAY;YACrB,OAAO,EAAE,YAAY;YACrB,MAAM,EAAE,0BAA0B;YAClC,OAAO,EAAE,mEAAmE;YAC5E,MAAM,EAAE,UAAU;YAClB,OAAO,EAAE,WAAW;YACpB,MAAM,EAAE,WAAW;YACnB,MAAM,EAAE,iBAAiB;YACzB,KAAK,EAAE,eAAe;SACvB,CAAC;QAEF,OAAO,SAAS,CAAC,aAAa,CAAC,WAAW,EAAE,CAAC,IAAI,0BAA0B,CAAC;IAC9E,CAAC;IAED;;OAEG;IACH,KAAK,CAAC,mBAAmB,CAAa,OAAkC;QACtE,eAAM,CAAC,KAAK,CAAC;YACX,GAAG,EAAE,gDAAgD;YACrD,eAAe,EAAE,CAAC,CAAC,OAAO,CAAC,YAAY;YACvC,cAAc,EAAE,CAAC,CAAC,OAAO,CAAC,WAAW;YACrC,kBAAkB,EAAE,CAAC,CAAC,OAAO,CAAC,eAAe;YAC7C,MAAM,EAAE,CAAC,CAAC,IAAI,CAAC,GAAG;YAClB,SAAS,EAAE,CAAC,CAAC,OAAO,CAAC,MAAM;SAC5B,CAAC,CAAC;QAEH,MAAM,SAAS,GAAG,IAAI,CAAC,GAAG,EAAE,CAAC;QAE7B,IA
AI,CAAC;YACH,eAAM,CAAC,KAAK,CAAC;gBACX,GAAG,EAAE,8CAA8C;aACpD,CAAC,CAAC;YAEH,wCAAwC;YACxC,MAAM,EAAE,OAAO,EAAE,QAAQ,EAAE,QAAQ,EAAE,GAAG,MAAM,IAAI,CAAC,kBAAkB,CAAC,OAAO,CAAC,CAAC;YAE/E,yCAAyC;YACzC,IAAI,gBAAwB,CAAC;YAE7B,IAAI,IAAI,CAAC,WAAW,CAAC,QAAQ,CAAC,EAAE,CAAC;gBAC/B,gBAAgB,GAAG,MAAM,IAAI,CAAC,oBAAoB,CAAC,OAAiB,EAAE,QAAQ,EAAE,OAAO,CAAC,YAAY,CAAC,CAAC;YACxG,CAAC;iBAAM,CAAC;gBACN,gBAAgB,GAAG,MAAM,IAAI,CAAC,mBAAmB,CAAC,OAAO,EAAE,OAAO,CAAC,YAAY,EAAE,QAAQ,CAAC,CAAC;YAC7F,CAAC;YAED,eAAM,CAAC,IAAI,CAAC;gBACV,GAAG,EAAE,gDAAgD;gBACrD,QAAQ;gBACR,aAAa,EAAE,gBAAgB,CAAC,MAAM;aACvC,CAAC,CAAC;YAEH,MAAM,cAAc,GAAG,IAAI,CAAC,GAAG,EAAE,GAAG,SAAS,CAAC;YAE9C,qDAAqD;YACrD,IAAI,CAAC,IAAI,CAAC,GAAG,EAAE,CAAC;gBACd,OAAO;oBACL,IAAI,EAAE,gBAAqB;oBAC3B,QAAQ,EAAE;wBACR,QAAQ;wBACR,QAAQ;wBACR,cAAc;wBACd,aAAa,EAAE,gBAAgB,CAAC,MAAM;qBACvC;iBACF,CAAC;YACJ,CAAC;YAED,gEAAgE;YAChE,MAAM,aAAa,GAAG,MAAM,IAAI,CAAC,qBAAqB,CAAI,gBAAgB,EAAE,OAAO,CAAC,MAAM,EAAE,OAAO,CAAC,SAAS,EAAE,OAAO,CAAC,YAAY,CAAC,CAAC;YAErI,OAAO;gBACL,IAAI,EAAE,aAAa;gBACnB,QAAQ,EAAE;oBACR,QAAQ;oBACR,QAAQ;oBACR,cAAc;oBACd,aAAa,EAAE,gBAAgB,CAAC,MAAM;iBACvC;aACF,CAAC;QACJ,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACb,eAAM,CAAC,KAAK,CAAC;gBACX,OAAO,EAAE,gDAAgD;gBACzD,GAAG;aACJ,CAAC,CAAC;YACH,MAAM,IAAI,KAAK,CAAC,+BAA+B,GAAG,YAAY,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;QACrG,CAAC;IACH,CAAC;IAED;;OAEG;IACK,KAAK,CAAC,kBAAkB,CAAC,OAAkC;QAKjE,eAAM,CAAC,KAAK,CAAC;YACX,GAAG,EAAE,+CAA+C;YACpD,OAAO,EAAE,CAAC,CAAC,OAAO,CAAC,YAAY;YAC/B,UAAU,EAAE,CAAC,CAAC,OAAO,CAAC,eAAe;YACrC,MAAM,EAAE,CAAC,CAAC,OAAO,CAAC,WAAW;SAC9B,CAAC,CAAC;QAEH,iBAAiB;QACjB,IAAI,OAAO,CAAC,YAAY,EAAE,CAAC;YACzB,IAAI,CAAC,EAAE,CAAC,UAAU,CAAC,OAAO,CAAC,YAAY,CAAC,EAAE,CAAC;gBACzC,MAAM,IAAI,KAAK,CAAC,uBAAuB,OAAO,CAAC,YAAY,EAAE,CAAC,CAAC;YACjE,CAAC;YAED,MAAM,OAAO,GAAG,EAAE,CAAC,YAAY,CAAC,OAAO,CAAC,YAAY,CAAC,CAAC;YACtD,MAAM,QAAQ,GAAG,IAAI,CAAC,OAAO,CAAC,OAAO,CAAC,YAAY,CAAC,CAAC,WAAW,EAAE,CAAC;YAElE,OAAO;gBACL,OAAO;gBACP,QAAQ;gBACR,QAAQ,EAAE,OAAO,CAAC,MAAM;a
ACzB,CAAC;QACJ,CAAC;QAED,wBAAwB;QACxB,IAAI,OAAO,CAAC,eAAe,EAAE,CAAC;YAC5B,uDAAuD;YACvD,IAAI,QAAQ,GAAG,UAAU,CAAC;YAC1B,IAAI,MAAM,CAAC,QAAQ,CAAC,OAAO,CAAC,eAAe,CAAC,EAAE,CAAC;gBAC7C,QAAQ,GAAG,IAAI,CAAC,uBAAuB,CAAC,OAAO,CAAC,eAAe,CAAC,CAAC;YACnE,CAAC;iBAAM,IAAI,OAAO,OAAO,CAAC,eAAe,KAAK,QAAQ,EAAE,CAAC;gBACvD,QAAQ,GAAG,MAAM,CAAC,CAAC,sBAAsB;YAC3C,CAAC;YAED,OAAO;gBACL,OAAO,EAAE,OAAO,CAAC,eAAe;gBAChC,QAAQ;gBACR,QAAQ,EAAE,MAAM,CAAC,QAAQ,CAAC,OAAO,CAAC,eAAe,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,eAAe,CAAC,MAAM,CAAC,CAAC,CAAC,MAAM,CAAC,UAAU,CAAC,OAAO,CAAC,eAAe,CAAC;aACjI,CAAC;QACJ,CAAC;QAED,WAAW;QACX,IAAI,OAAO,CAAC,WAAW,EAAE,CAAC;YACxB,eAAM,CAAC,KAAK,CAAC;gBACX,GAAG,EAAE,gDAAgD;gBACrD,GAAG,EAAE,OAAO,CAAC,WAAW;aACzB,CAAC,CAAC;YAEH,MAAM,QAAQ,GAAG,MAAM,KAAK,CAAC,OAAO,CAAC,WAAW,CAAC,CAAC;YAElD,eAAM,CAAC,KAAK,CAAC;gBACX,GAAG,EAAE,wCAAwC;gBAC7C,MAAM,EAAE,QAAQ,CAAC,MAAM;gBACvB,EAAE,EAAE,QAAQ,CAAC,EAAE;aAChB,CAAC,CAAC;YAEH,IAAI,CAAC,QAAQ,CAAC,EAAE,EAAE,CAAC;gBACjB,MAAM,IAAI,KAAK,CAAC,sCAAsC,QAAQ,CAAC,UAAU,EAAE,CAAC,CAAC;YAC/E,CAAC;YAED,MAAM,WAAW,GAAG,MAAM,QAAQ,CAAC,WAAW,EAAE,CAAC;YACjD,MAAM,OAAO,GAAG,MAAM,CAAC,IAAI,CAAC,WAAW,CAAC,CAAC;YACzC,MAAM,QAAQ,GAAG,IAAI,CAAC,oBAAoB,CAAC,OAAO,CAAC,WAAW,CAAC,IAAI,IAAI,CAAC,uBAAuB,CAAC,OAAO,CAAC,CAAC;YAEzG,eAAM,CAAC,KAAK,CAAC;gBACX,GAAG,EAAE,+CAA+C;gBACpD,WAAW,EAAE,OAAO,CAAC,MAAM;gBAC3B,QAAQ;aACT,CAAC,CAAC;YAEH,OAAO;gBACL,OAAO;gBACP,QAAQ;gBACR,QAAQ,EAAE,OAAO,CAAC,MAAM;aACzB,CAAC;QACJ,CAAC;QAED,MAAM,IAAI,KAAK,CAAC,qFAAqF,CAAC,CAAC;IACzG,CAAC;IAED;;OAEG;IACK,KAAK,CAAC,oBAAoB,CAAC,OAAe,EAAE,QAAgB,EAAE,QAAiB;QACrF,IAAI,CAAC;YACH,iEAAiE;YACjE,IAAI,QAAQ,IAAI,IAAI,CAAC,gBAAgB,EAAE,CAAC;gBACtC,eAAM,CAAC,KAAK,CAAC;oBACX,GAAG,EAAE,2DAA2D;oBAChE,QAAQ;iBACT,CAAC,CAAC;gBACH,MAAM,aAAa,GAAG,MAAM,IAAI,CAAC,mBAAmB,CAAC,QAAQ,CAAC,CAAC;gBAC/D,eAAM,CAAC,KAAK,CAAC;oBACX,GAAG,EAAE,4DAA4D;oBACjE,UAAU,EAAE,CAAC,CAAC,aAAa;oBAC3B,aAAa,EAAE,aAAa,aAAb,aAAa,uBAAb,aAAa,CAAE,MAAM;iBACrC,CAAC,CAAC;gBACH,IAAI,aAAa,EAAE,CAAC;oBAClB,OAAO,aAAa,CAAC;gBACvB,CAAC;YACH,CAAC;YAED,kEAAkE;YAClE,IA
AI,CAAC,QAAQ,IAAI,IAAI,CAAC,gBAAgB,EAAE,CAAC;gBACvC,MAAM,OAAO,GAAG,EAAE,CAAC,MAAM,EAAE,CAAC;gBAC5B,MAAM,YAAY,GAAG,QAAQ,IAAI,CAAC,GAAG,EAAE,GAAG,QAAQ,EAAE,CAAC;gBACrD,MAAM,YAAY,GAAG,IAAI,CAAC,IAAI,CAAC,OAAO,EAAE,YAAY,CAAC,CAAC;gBAEtD,eAAM,CAAC,KAAK,CAAC;oBACX,GAAG,EAAE,kDAAkD;oBACvD,YAAY;oBACZ,WAAW,EAAE,OAAO,CAAC,MAAM;iBAC5B,CAAC,CAAC;gBAEH,IAAI,CAAC;oBACH,EAAE,CAAC,aAAa,CAAC,YAAY,EAAE,OAAO,CAAC,CAAC;oBACxC,eAAM,CAAC,KAAK,CAAC;wBACX,GAAG,EAAE,gEAAgE;wBACrE,YAAY;qBACb,CAAC,CAAC;oBACH,MAAM,aAAa,GAAG,MAAM,IAAI,CAAC,mBAAmB,CAAC,YAAY,CAAC,CAAC;oBACnE,eAAM,CAAC,KAAK,CAAC;wBACX,GAAG,EAAE,iEAAiE;wBACtE,UAAU,EAAE,CAAC,CAAC,aAAa;wBAC3B,aAAa,EAAE,aAAa,aAAb,aAAa,uBAAb,aAAa,CAAE,MAAM;qBACrC,CAAC,CAAC;oBACH,EAAE,CAAC,UAAU,CAAC,YAAY,CAAC,CAAC;oBAE5B,IAAI,aAAa,EAAE,CAAC;wBAClB,OAAO,aAAa,CAAC;oBACvB,CAAC;gBACH,CAAC;gBAAC,OAAO,GAAG,EAAE,CAAC;oBACb,8BAA8B;oBAC9B,IAAI,EAAE,CAAC,UAAU,CAAC,YAAY,CAAC,EAAE,CAAC;wBAChC,EAAE,CAAC,UAAU,CAAC,YAAY,CAAC,CAAC;oBAC9B,CAAC;oBACD,eAAM,CAAC,IAAI,CAAC,EAAE,GAAG,EAAE,2DAA2D,EAAE,GAAG,EAAE,CAAC,CAAC;gBACzF,CAAC;YACH,CAAC;YAED,uDAAuD;YACvD,wCAAwC;YACxC,IAAI,QAAQ,KAAK,MAAM,EAAE,CAAC;gBACxB,MAAM,IAAI,KAAK,CAAC,gCAAgC,CAAC,CAAC;YACpD,CAAC;YAED,eAAM,CAAC,IAAI,CAAC;gBACV,GAAG,EAAE,4FAA4F;gBACjG,QAAQ;gBACR,WAAW,EAAE,OAAO,CAAC,MAAM;aAC5B,CAAC,CAAC;YAEH,oDAAoD;YACpD,IAAI,IAAI,CAAC,MAAM,CAAC,SAAS,EAAE,CAAC;gBAC1B,kCAAkC;gBAClC,MAAM,WAAW,GAAG,OAAO,CAAC,QAAQ,CAAC,QAAQ,CAAC,CAAC;gBAC/C,MAAM,QAAQ,GAAG,IAAI,CAAC,WAAW,CAAC,QAAQ,CAAC,CAAC;gBAC5C,OAAO,QAAQ,QAAQ,WAAW,WAAW,EAAE,CAAC;YAClD,CAAC;iBAAM,CAAC;gBACN,gEAAgE;gBAChE,OAAO,oBAAoB,QAAQ,CAAC,WAAW,EAAE,gBAC/C,OAAO,CAAC,MACV,wFAAwF,CAAC;YAC3F,CAAC;QACH,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACb,MAAM,IAAI,KAAK,CAAC,qCAAqC,GAAG,YAAY,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;QAC3G,CAAC;IACH,CAAC;IAED;;OAEG;IACK,KAAK,CAAC,mBAAmB,CAAC,OAAwB,EAAE,QAAiB,EAAE,QAAiB;QAC9F,gDAAgD;QAChD,IAAI,QAAQ,IAAI,IAAI,CAAC,gBAAgB,EAAE,CAAC;YACtC,MAAM,aAAa,GAAG,MAAM,IAAI,CAAC,mBAAmB,CAAC,QAAQ,CAAC,CAAC;YAC/D,IA
AI,aAAa,EAAE,CAAC;gBAClB,OAAO,aAAa,CAAC;YACvB,CAAC;QACH,CAAC;QAED,iFAAiF;QACjF,IAAI,CAAC,QAAQ,IAAI,IAAI,CAAC,gBAAgB,IAAI,MAAM,CAAC,QAAQ,CAAC,OAAO,CAAC,EAAE,CAAC;YACnE,MAAM,OAAO,GAAG,EAAE,CAAC,MAAM,EAAE,CAAC;YAC5B,MAAM,YAAY,GAAG,QAAQ,IAAI,CAAC,GAAG,EAAE,GAAG,QAAQ,IAAI,MAAM,EAAE,CAAC;YAC/D,MAAM,YAAY,GAAG,IAAI,CAAC,IAAI,CAAC,OAAO,EAAE,YAAY,CAAC,CAAC;YAEtD,IAAI,CAAC;gBACH,EAAE,CAAC,aAAa,CAAC,YAAY,EAAE,OAAO,CAAC,CAAC;gBACxC,MAAM,aAAa,GAAG,MAAM,IAAI,CAAC,mBAAmB,CAAC,YAAY,CAAC,CAAC;gBACnE,EAAE,CAAC,UAAU,CAAC,YAAY,CAAC,CAAC;gBAE5B,IAAI,aAAa,EAAE,CAAC;oBAClB,OAAO,aAAa,CAAC;gBACvB,CAAC;YACH,CAAC;YAAC,OAAO,GAAG,EAAE,CAAC;gBACb,8BAA8B;gBAC9B,IAAI,EAAE,CAAC,UAAU,CAAC,YAAY,CAAC,EAAE,CAAC;oBAChC,EAAE,CAAC,UAAU,CAAC,YAAY,CAAC,CAAC;gBAC9B,CAAC;gBACD,eAAM,CAAC,IAAI,CAAC,EAAE,GAAG,EAAE,mEAAmE,EAAE,GAAG,EAAE,CAAC,CAAC;YACjG,CAAC;QACH,CAAC;QAED,sCAAsC;QACtC,IAAI,OAAO,OAAO,KAAK,QAAQ,EAAE,CAAC;YAChC,OAAO,OAAO,CAAC;QACjB,CAAC;QAED,sCAAsC;QACtC,IAAI,QAAQ,KAAK,MAAM,IAAI,CAAC,IAAI,CAAC,gBAAgB,EAAE,CAAC;YAClD,MAAM,IAAI,KAAK,CAAC,kFAAkF,CAAC,CAAC;QACtG,CAAC;QAED,2CAA2C;QAC3C,IAAI,CAAC,MAAM,EAAE,KAAK,EAAE,OAAO,EAAE,MAAM,EAAE,MAAM,EAAE,MAAM,CAAC,CAAC,QAAQ,CAAC,QAAQ,IAAI,EAAE,CAAC,EAAE,CAAC;YAC9E,OAAO,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC;QACnC,CAAC;QAED,qDAAqD;QACrD,MAAM,IAAI,KAAK,CAAC,6BAA6B,QAAQ,wEAAwE,CAAC,CAAC;IACjI,CAAC;IAED;;OAEG;IACK,KAAK,CAAC,qBAAqB,CACjC,OAAe,EACf,MAAkC,EAClC,SAAoD,EACpD,YAAqB;QAErB,IAAI,CAAC,IAAI,CAAC,GAAG,EAAE,CAAC;YACd,MAAM,IAAI,KAAK,CAAC,0GAA0G,CAAC,CAAC;QAC9H,CAAC;QAED,kEAAkE;QAClE,8EAA8E;QAE9E,MAAM,mBAAmB,GACvB,+CAA+C;YAC/C,wEAAwE;YACxE,2FAA2F;YAC3F,8CAA8C,CAAC;QAEjD,MAAM,iBAAiB,GAAG,YAAY,IAAI,mBAAmB,CAAC;QAE9D,IAAI,CAAC;YACH,+CAA+C;YAC/C,IAAI,MAAM,EAAE,CAAC;gBACX,iDAAiD;gBACjD,IAAI,CAAC,CAAC,sBAAsB,IAAI,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC;oBAC1C,MAAM,IAAI,KAAK,CAAC,4FAA4F,CAAC,CAAC;gBAChH,CAAC;gBAED,MAAM,aAAa,GAAI,IAAI,CAAC,GAAW,CAAC,oBAAoB,CAAC,MAAa,CAAC,CAAC;gBAE5E,MAAM,MAAM,GAAG,MAAM,aAAa,CAAC,MAAM,CAAC;oBACxC;wBACE,IAAI,EAAE,QAAQ;wBACd,OAAO,EAAE,iBAAiB;qBAC3B;oBACD;wBA
CE,IAAI,EAAE,MAAM;wBACZ,OAAO,EAAE,mEAAmE,OAAO,EAAE;qBACtF;iBACF,CAAC,CAAC;gBAEH,eAAM,CAAC,KAAK,CAAC;oBACX,GAAG,EAAE,0DAA0D;oBAC/D,aAAa,EAAE,IAAI,CAAC,SAAS,CAAC,MAAM,EAAE,IAAI,EAAE,CAAC,CAAC;iBAC/C,CAAC,CAAC;gBAEH,OAAO,MAAW,CAAC;YACrB,CAAC;iBAAM,CAAC;gBACN,iDAAiD;gBACjD,MAAM,QAAQ,GAAG,MAAM,IAAI,CAAC,GAAG,CAAC,MAAM,CAAC;oBACrC;wBACE,IAAI,EAAE,QAAQ;wBACd,OAAO,EAAE,iBAAiB;qBAC3B;oBACD;wBACE,IAAI,EAAE,MAAM;wBACZ,OAAO,EAAE,iEAAiE,OAAO,EAAE;qBACpF;iBACF,CAAC,CAAC;gBAEH,6CAA6C;gBAC7C,IAAI,WAAmB,CAAC;gBACxB,IAAI,OAAO,QAAQ,CAAC,OAAO,KAAK,QAAQ,EAAE,CAAC;oBACzC,WAAW,GAAG,QAAQ,CAAC,OAAO,CAAC;gBACjC,CAAC;qBAAM,IAAI,KAAK,CAAC,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAC,IAAI,QAAQ,CAAC,OAAO,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;oBAC1E,iCAAiC;oBACjC,WAAW,GAAG,QAAQ,CAAC,OAAO,CAAC,GAAG,CAAC,CAAC,KAAU,EAAE,EAAE,CAAC,CAAC,OAAO,KAAK,KAAK,QAAQ,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,KAAK,CAAC,IAAI,IAAI,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;gBACxH,CAAC;qBAAM,CAAC;oBACN,WAAW,GAAG,MAAM,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC;gBACzC,CAAC;gBAED,eAAM,CAAC,KAAK,CAAC;oBACX,GAAG,EAAE,4DAA4D;oBACjE,aAAa,EAAE,WAAW,CAAC,MAAM;iBAClC,CAAC,CAAC;gBAEH,OAAO,WAAgB,CAAC;YAC1B,CAAC;QACH,CAAC;QAAC,OAAO,GAAG,EAAE,CAAC;YACb,MAAM,IAAI,KAAK,CAAC,0BAA0B,GAAG,YAAY,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;QAChG,CAAC;IACH,CAAC;IAED;;OAEG;IACK,WAAW,CAAC,QAAgB;QAClC,MAAM,UAAU,GAAG,CAAC,MAAM,EAAE,OAAO,EAAE,MAAM,EAAE,MAAM,EAAE,MAAM,EAAE,OAAO,EAAE,OAAO,CAAC,CAAC;QAC/E,OAAO,UAAU,CAAC,QAAQ,CAAC,QAAQ,CAAC,WAAW,EAAE,CAAC,CAAC;IACrD,CAAC;IAED;;OAEG;IACK,uBAAuB,CAAC,MAAc;QAC5C,+BAA+B;QAC/B,MAAM,UAAU,GAA8B;YAC5C,UAAU,EAAE,MAAM;YAClB,MAAM,EAAE,MAAM;YACd,UAAU,EAAE,MAAM;YAClB,UAAU,EAAE,MAAM;YAClB,UAAU,EAAE,MAAM,EAAE,gCAAgC;YACpD,QAAQ,EAAE,MAAM,EAAE,gBAAgB;SACnC,CAAC;QAEF,MAAM,GAAG,GAAG,MAAM,CAAC,QAAQ,CAAC,KAAK,EAAE,CAAC,EAAE,CAAC,CAAC,CAAC,WAAW,EAAE,CAAC;QAEvD,KAAK,MAAM,CAAC,SAAS,EAAE,IAAI,CAAC,IAAI,MAAM,CAAC,OAAO,CAAC,UAAU,CAAC,EAAE,CAAC;YAC3D,IAAI,GAAG,CAAC,UAAU,CAAC,SAAS,CAAC,EAAE,CAAC;gBAC9B,OAAO,IAAI,CAAC;YACd,CAA
C;QACH,CAAC;QAED,OAAO,UAAU,CAAC;IACpB,CAAC;IAED;;OAEG;IACK,oBAAoB,CAAC,GAAW;QACtC,IAAI,CAAC;YACH,MAAM,QAAQ,GAAG,IAAI,GAAG,CAAC,GAAG,CAAC,CAAC,QAAQ,CAAC;YACvC,MAAM,SAAS,GAAG,IAAI,CAAC,OAAO,CAAC,QAAQ,CAAC,CAAC,WAAW,EAAE,CAAC;YACvD,OAAO,SAAS,IAAI,IAAI,CAAC;QAC3B,CAAC;QAAC,WAAM,CAAC;YACP,OAAO,IAAI,CAAC;QACd,CAAC;IACH,CAAC;IAED;;OAEG;IACH,MAAM,CAAC,yBAAyB;QAC9B,OAAO,CAAC,GAAG,gCAAwB,CAAC,CAAC;IACvC,CAAC;IAED;;OAEG;IACH,MAAM,CAAC,uBAAuB,CAAC,QAAgB;QAC7C,OAAO,gCAAwB,CAAC,QAAQ,CAAC,QAAQ,CAAC,WAAW,EAAE,CAAC,CAAC;IACnE,CAAC;CACF;AAzsBD,8CAysBC"}
|
|
1
|
+
{"version":3,"file":"documentExtraction.js","sourceRoot":"","sources":["../../../src/internalTools/documentExtraction/documentExtraction.ts"],"names":[],"mappings":";;;AAyEA,sFAoDC;AA4CD,sCAuCC;AA9MD,mEAA0E;AAE1E,iEAAyE;AACzE,6DAAqE;AAErE;;GAEG;AACH,IAAY,sBAKX;AALD,WAAY,sBAAsB;IAChC,6DAA6D;IAC7D,6CAAmB,CAAA;IACnB,iDAAiD;IACjD,yCAAe,CAAA;AACjB,CAAC,EALW,sBAAsB,sCAAtB,sBAAsB,QAKjC;AAED;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GAuDG;AACI,KAAK,UAAU,qCAAqC,CAAgC,EACzF,cAAc,EACd,cAAc,EACd,SAAS,EACT,gBAAgB,EAChB,sBAAsB,GAAG,KAAK,EAC9B,GAAG,EACH,YAAY,EACZ,kBAAkB,GAUnB;IAKC,iBAAiB;IACjB,MAAM,MAAM,GAAG,MAAM,aAAa,CAAC;QACjC,cAAc;QACd,cAAc;QACd,SAAS;QACT,gBAAgB;KACjB,CAAC,CAAC;IAEH,IAAI,CAAC,sBAAsB,IAAI,CAAC,MAAM,CAAC,UAAU,EAAE,CAAC;QAClD,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,IAAI,CAAC,GAAG,EAAE,CAAC;QACT,MAAM,IAAI,KAAK,CAAC,+FAA+F,CAAC,CAAC;IACnH,CAAC;IAED,mDAAmD;IACnD,MAAM,iBAAiB,GAAG,MAAM,IAAA,uDAA+B,EAAI;QACjE,OAAO,EAAE,MAAM,CAAC,UAAU;QAC1B,GAAG;QACH,MAAM,EAAE,YAAY;QACpB,MAAM,EAAE,kBAAkB;QAC1B,SAAS;KACV,CAAC,CAAC;IAEH,OAAO;QACL,GAAG,MAAM;QACT,iBAAiB;KAClB,CAAC;AACJ,CAAC;AAED;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GAyCG;AACI,KAAK,UAAU,aAAa,CAAC,EAClC,cAAc,EACd,cAAc,GAAG,sBAAsB,CAAC,OAAO,EAC/C,SAAS,EACT,gBAAgB,GAMjB;IASC,IAAI,CAAC,cAAc,EAAE,CAAC;QACpB,MAAM,IAAI,KAAK,CAAC,yDAAyD,CAAC,CAAC;IAC7E,CAAC;IAED,MAAM,aAAa,GAAG,KAAK,CAAC,cAAc,CAAC,CAAC;IAE5C,IAAI,cAAc,KAAK,sBAAsB,CAAC,OAAO,EAAE,CAAC;QACtD,OAAO,IAAA,sDAA+B,EAAC;YACrC,cAAc;YACd,aAAa;YACb,SAAS;SACV,CAAC,CAAC;IACL,CAAC;SAAM,CAAC;QACN,OAAO,IAAA,kDAA6B,EAAC;YACnC,cAAc;YACd,aAAa;YACb,SAAS;YACT,gBAAgB,EAAE,gBAAgB,aAAhB,gBAAgB,cAAhB,gBAAgB,GAAI,OAAO,CAAC,GAAG,CAAC,mBAAmB;SACtE,CAAC,CAAC;IACL,CAAC;AACH,CAAC;AAED;;GAEG;AACH,SAAS,KAAK,CAAC,MAAc;IAC3B,IAAI,CAAC;QACH,MAAM,GAAG,GAAG,IAAI,GAAG,CAAC,MAAM,CAAC,CAAC;QAC5B,OAAO,GAAG,CAAC,QAAQ,KAAK,OAAO,IAAI,GAAG,CAAC,QAAQ,KAAK,QAAQ,CAAC;IAC/D,CAAC;IAAC,WAAM,CAAC;QACP,OAAO,KAAK,CAAC;IACf,CAAC;AACH,CAAC"}
|
|
@@ -0,0 +1,57 @@
|
|
|
1
|
+
import { ZodType } from 'zod';
|
|
2
|
+
import { BaseLanguageModel } from '@langchain/core/language_models/base';
|
|
3
|
+
/**
 * Run an LLM over a piece of text and return what it extracted.
 *
 * The mode is selected by `schema`:
 * - `schema` given: the model is asked for structured output via
 *   `withStructuredOutput(schema)` and that result is returned.
 * - `schema` omitted: the model's reply is flattened to text; a reply that is
 *   valid JSON may come back already parsed instead of as raw text.
 *
 * @param options - Extraction options.
 * @param options.content - Text to extract information from.
 * @param options.llm - Language model instance that performs the extraction.
 * @param options.schema - Optional Zod schema describing the data to extract.
 * @param options.prompt - Optional instructions placed in front of the built-in user message.
 * @param options.sessionId - Session identifier attached to the debug log entries.
 *
 * @returns Promise resolving to the structured data (`T`) when a schema is
 *   given, otherwise to the model's reply (text, or the value parsed from it).
 *
 * @throws {Error} If `llm` is missing.
 * @throws {Error} If the extraction fails, including the case where a schema
 *   is given but the LLM has no `withStructuredOutput`.
 *
 * @example
 * ```typescript
 * import { extractStructuredDataFromString } from '@minded-ai/mindedjs';
 * import { z } from 'zod';
 *
 * // With a schema: structured result
 * const invoice = await extractStructuredDataFromString({
 *   content: 'Invoice #12345\nTotal: $500.00\nDate: 2024-01-15',
 *   llm: agent.llm,
 *   sessionId: 'session-1',
 *   schema: z.object({
 *     invoiceNumber: z.string(),
 *     totalAmount: z.number(),
 *     date: z.string(),
 *   }),
 * });
 * // invoice: { invoiceNumber: '12345', totalAmount: 500, date: '2024-01-15' }
 *
 * // Without a schema: the model's reply, guided by a custom prompt
 * const reply = await extractStructuredDataFromString({
 *   content: 'Invoice #12345\nTotal: $500.00\nDate: 2024-01-15',
 *   llm: agent.llm,
 *   sessionId: 'session-1',
 *   prompt: 'Extract the invoice number, total amount, and date. Return as an object with keys: invoiceNumber, totalAmount, date',
 * });
 * ```
 */
export declare function extractStructuredDataFromString<T extends Record<string, any>>(options: {
    content: string;
    llm: BaseLanguageModel;
    schema?: ZodType<T>;
    prompt?: string;
    sessionId: string;
}): Promise<T | string>;
|
|
57
|
+
//# sourceMappingURL=extractStructuredData.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"extractStructuredData.d.ts","sourceRoot":"","sources":["../../../src/internalTools/documentExtraction/extractStructuredData.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,OAAO,EAAE,MAAM,KAAK,CAAC;AAE9B,OAAO,EAAE,iBAAiB,EAAE,MAAM,sCAAsC,CAAC;AAEzE;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA8CG;AACH,wBAAsB,+BAA+B,CAAC,CAAC,SAAS,MAAM,CAAC,MAAM,EAAE,GAAG,CAAC,EAAE,EACnF,OAAO,EACP,GAAG,EACH,MAAM,EACN,MAAM,EACN,SAAS,GACV,EAAE;IACD,OAAO,EAAE,MAAM,CAAC;IAChB,GAAG,EAAE,iBAAiB,CAAC;IACvB,MAAM,CAAC,EAAE,OAAO,CAAC,CAAC,CAAC,CAAC;IACpB,MAAM,CAAC,EAAE,MAAM,CAAC;IAChB,SAAS,EAAE,MAAM,CAAC;CACnB,GAAG,OAAO,CAAC,CAAC,GAAG,MAAM,CAAC,CAoEtB"}
|
|
@@ -0,0 +1,121 @@
|
|
|
1
|
+
"use strict";
|
|
2
|
+
Object.defineProperty(exports, "__esModule", { value: true });
|
|
3
|
+
exports.extractStructuredDataFromString = extractStructuredDataFromString;
|
|
4
|
+
const logger_1 = require("../../utils/logger");
|
|
5
|
+
/**
|
|
6
|
+
* Extract structured or unstructured data from content using AI.
|
|
7
|
+
*
|
|
8
|
+
* This function processes string content with an LLM to extract information:
|
|
9
|
+
* - With schema: Returns structured data matching the Zod schema
|
|
10
|
+
* - Without schema: Returns LLM's text analysis of the content based on the provided prompt
|
|
11
|
+
*
|
|
12
|
+
* @param options - Extraction options
|
|
13
|
+
* @param options.content - The content to extract information from
|
|
14
|
+
* @param options.llm - Language model instance for AI-powered extraction
|
|
15
|
+
* @param options.schema - Optional Zod schema defining the structure of data to extract
|
|
16
|
+
* @param options.prompt - Optional prompt to guide the extraction (defaults to expert data-extraction assistant)
|
|
17
|
+
* @param options.sessionId - Unique session identifier for logging and tracking
|
|
18
|
+
*
|
|
19
|
+
* @returns Promise resolving to:
|
|
20
|
+
* - Structured data of type T if schema is provided
|
|
21
|
+
* - String or object containing LLM analysis if no schema provided
|
|
22
|
+
*
|
|
23
|
+
* @throws {Error} If LLM is not provided or doesn't support structured output
|
|
24
|
+
* @throws {Error} If LLM extraction fails
|
|
25
|
+
*
|
|
26
|
+
* @example
|
|
27
|
+
* ```typescript
|
|
28
|
+
* import { extractStructuredDataFromString } from '@minded-ai/mindedjs';
|
|
29
|
+
* import { z } from 'zod';
|
|
30
|
+
*
|
|
31
|
+
* // Extract structured data with schema
|
|
32
|
+
* const result1 = await extractStructuredDataFromString({
|
|
33
|
+
* content: 'Invoice #12345\nTotal: $500.00\nDate: 2024-01-15',
|
|
34
|
+
* llm: agent.llm,
|
|
35
|
+
* schema: z.object({
|
|
36
|
+
* invoiceNumber: z.string(),
|
|
37
|
+
* totalAmount: z.number(),
|
|
38
|
+
* date: z.string(),
|
|
39
|
+
* }),
|
|
40
|
+
* });
|
|
41
|
+
* // result1: {"invoiceNumber": "12345", "totalAmount": 500, "date": "2024-01-15"}
|
|
42
|
+
*
|
|
43
|
+
* // Extract unstructured data with custom prompt (returns object format as string)
|
|
44
|
+
* const result2 = await extractStructuredDataFromString({
|
|
45
|
+
* content: 'Invoice #12345\nTotal: $500.00\nDate: 2024-01-15',
|
|
46
|
+
* llm: agent.llm,
|
|
47
|
+
* prompt: 'Extract the invoice number, total amount, and date. Return as an object with keys: invoiceNumber, totalAmount, date',
|
|
48
|
+
* });
|
|
49
|
+
* // result2: {"invoiceNumber": "12345", "totalAmount": 500, "date": "2024-01-15"}
|
|
50
|
+
* ```
|
|
51
|
+
*/
|
|
52
|
+
async function extractStructuredDataFromString({ content, llm, schema, prompt, sessionId, }) {
|
|
53
|
+
if (!llm) {
|
|
54
|
+
throw new Error('LLM instance is required for structured data extraction. Please provide an LLM when calling extractStructuredDataFromString.');
|
|
55
|
+
}
|
|
56
|
+
const messages = [
|
|
57
|
+
{
|
|
58
|
+
role: 'system',
|
|
59
|
+
content: 'You are an expert data-extraction assistant. ' +
|
|
60
|
+
'Extract the requested information from the provided document content. ' +
|
|
61
|
+
'If you cannot find a value for a required field, use "N/A" or a descriptive placeholder. ' +
|
|
62
|
+
'Be accurate and thorough in your extraction. ' +
|
|
63
|
+
'The user prompt may include information needed to extract structured data from the document.',
|
|
64
|
+
},
|
|
65
|
+
{
|
|
66
|
+
role: 'user',
|
|
67
|
+
content: (prompt ? prompt + ' ' : '') + `Please analyze and extract information from this document:\n\n${content}`,
|
|
68
|
+
},
|
|
69
|
+
];
|
|
70
|
+
try {
|
|
71
|
+
if (schema) {
|
|
72
|
+
if (!llm.withStructuredOutput) {
|
|
73
|
+
throw new Error('The provided LLM does not support structured output. Please use a compatible LLM instance.');
|
|
74
|
+
}
|
|
75
|
+
const structuredLlm = llm.withStructuredOutput(schema);
|
|
76
|
+
const result = await structuredLlm.invoke(messages);
|
|
77
|
+
logger_1.logger.debug({
|
|
78
|
+
msg: '[DocumentProcessor] Structured data extraction completed',
|
|
79
|
+
sessionId,
|
|
80
|
+
extractedData: JSON.stringify(result),
|
|
81
|
+
});
|
|
82
|
+
return result;
|
|
83
|
+
}
|
|
84
|
+
else {
|
|
85
|
+
// Without schema, return the LLM's text response
|
|
86
|
+
const response = await llm.invoke(messages);
|
|
87
|
+
// Extract the text content from the response
|
|
88
|
+
let textContent;
|
|
89
|
+
if (typeof response.content === 'string') {
|
|
90
|
+
textContent = response.content;
|
|
91
|
+
}
|
|
92
|
+
else if (Array.isArray(response.content) && response.content.length > 0) {
|
|
93
|
+
// Handle array of content blocks
|
|
94
|
+
textContent = response.content.map((block) => (typeof block === 'string' ? block : block.text || '')).join('\n');
|
|
95
|
+
}
|
|
96
|
+
else {
|
|
97
|
+
textContent = String(response.content);
|
|
98
|
+
}
|
|
99
|
+
// Try to parse the response in case it is a valid JSON object.
|
|
100
|
+
const result = parseJSONSafe(textContent);
|
|
101
|
+
logger_1.logger.debug({
|
|
102
|
+
msg: '[DocumentProcessor] Unstructured data extraction completed',
|
|
103
|
+
sessionId,
|
|
104
|
+
extractedData: textContent,
|
|
105
|
+
});
|
|
106
|
+
return result;
|
|
107
|
+
}
|
|
108
|
+
}
|
|
109
|
+
catch (err) {
|
|
110
|
+
throw new Error(`LLM extraction failed: ${err instanceof Error ? err.message : String(err)}`);
|
|
111
|
+
}
|
|
112
|
+
}
|
|
113
|
+
function parseJSONSafe(str) {
|
|
114
|
+
try {
|
|
115
|
+
return JSON.parse(str);
|
|
116
|
+
}
|
|
117
|
+
catch (_a) {
|
|
118
|
+
return str;
|
|
119
|
+
}
|
|
120
|
+
}
|
|
121
|
+
//# sourceMappingURL=extractStructuredData.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"extractStructuredData.js","sourceRoot":"","sources":["../../../src/internalTools/documentExtraction/extractStructuredData.ts"],"names":[],"mappings":";;AAmDA,0EAgFC;AAlID,+CAA4C;AAG5C;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;;GA8CG;AACI,KAAK,UAAU,+BAA+B,CAAgC,EACnF,OAAO,EACP,GAAG,EACH,MAAM,EACN,MAAM,EACN,SAAS,GAOV;IACC,IAAI,CAAC,GAAG,EAAE,CAAC;QACT,MAAM,IAAI,KAAK,CACb,8HAA8H,CAC/H,CAAC;IACJ,CAAC;IAED,MAAM,QAAQ,GAAG;QACf;YACE,IAAI,EAAE,QAAQ;YACd,OAAO,EACL,+CAA+C;gBAC/C,wEAAwE;gBACxE,2FAA2F;gBAC3F,+CAA+C;gBAC/C,8FAA8F;SACjG;QACD;YACE,IAAI,EAAE,MAAM;YACZ,OAAO,EAAE,CAAC,MAAM,CAAC,CAAC,CAAC,MAAM,GAAG,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,GAAG,iEAAiE,OAAO,EAAE;SACnH;KACF,CAAC;IAEF,IAAI,CAAC;QACH,IAAI,MAAM,EAAE,CAAC;YACX,IAAI,CAAC,GAAG,CAAC,oBAAoB,EAAE,CAAC;gBAC9B,MAAM,IAAI,KAAK,CAAC,4FAA4F,CAAC,CAAC;YAChH,CAAC;YACD,MAAM,aAAa,GAAG,GAAG,CAAC,oBAAoB,CAAI,MAAM,CAAC,CAAC;YAE1D,MAAM,MAAM,GAAG,MAAM,aAAa,CAAC,MAAM,CAAC,QAAQ,CAAC,CAAC;YAEpD,eAAM,CAAC,KAAK,CAAC;gBACX,GAAG,EAAE,0DAA0D;gBAC/D,SAAS;gBACT,aAAa,EAAE,IAAI,CAAC,SAAS,CAAC,MAAM,CAAC;aACtC,CAAC,CAAC;YAEH,OAAO,MAAM,CAAC;QAChB,CAAC;aAAM,CAAC;YACN,iDAAiD;YACjD,MAAM,QAAQ,GAAG,MAAM,GAAG,CAAC,MAAM,CAAC,QAAQ,CAAC,CAAC;YAE5C,6CAA6C;YAC7C,IAAI,WAAmB,CAAC;YACxB,IAAI,OAAO,QAAQ,CAAC,OAAO,KAAK,QAAQ,EAAE,CAAC;gBACzC,WAAW,GAAG,QAAQ,CAAC,OAAO,CAAC;YACjC,CAAC;iBAAM,IAAI,KAAK,CAAC,OAAO,CAAC,QAAQ,CAAC,OAAO,CAAC,IAAI,QAAQ,CAAC,OAAO,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;gBAC1E,iCAAiC;gBACjC,WAAW,GAAG,QAAQ,CAAC,OAAO,CAAC,GAAG,CAAC,CAAC,KAAU,EAAE,EAAE,CAAC,CAAC,OAAO,KAAK,KAAK,QAAQ,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,KAAK,CAAC,IAAI,IAAI,EAAE,CAAC,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;YACxH,CAAC;iBAAM,CAAC;gBACN,WAAW,GAAG,MAAM,CAAC,QAAQ,CAAC,OAAO,CAAC,CAAC;YACzC,CAAC;YAED,+DAA+D;YAC/D,MAAM,MAAM,GAAG,aAAa,CAAC,WAAW,CAAC,CAAC;YAE1C,eAAM,CAAC,KAAK,CAAC;gBACX,GAAG,EAAE,4DAA4D;gBACjE,SAAS;gBACT,aAAa,EAAE,WAAW;aAC3B,CAAC,CAAC;YAEH,OAAO,MAAM,CAAC;QAChB,CAAC;IACH,CAAC;IAAC,OAAO,GAAG,EAAE,CAAC;QACb,MAAM,IAAI,KAAK,CAAC,0BAA0B,GAAG,YAAY,KAAK,CAAC,CAAC,CAAC
,GAAG,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC;IAChG,CAAC;AACH,CAAC;AAED,SAAS,aAAa,CAAC,GAAW;IAChC,IAAI,CAAC;QACH,OAAO,IAAI,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC;IACzB,CAAC;IAAC,WAAM,CAAC;QACP,OAAO,GAAG,CAAC;IACb,CAAC;AACH,CAAC"}
|
|
@@ -0,0 +1,16 @@
|
|
|
1
|
+
/**
 * Type declaration for `parseDocumentWithLocalService`.
 *
 * Accepts a single options object: `isDocumentUrl`, `documentSource` and `sessionId` are required;
 * `llamaCloudApiKey` and `useBase64` are optional.
 * Resolves to the document's `rawContent` string plus a `metadata` record containing `fileSize`
 * (may be `undefined`), `fileType`, `processingTime` and `contentLength`.
 *
 * NOTE(review): the implementation is not visible from this declaration. Presumably `documentSource`
 * holds a URL when `isDocumentUrl` is true; confirm this, and the units of `processingTime` and
 * `fileSize`, against parseDocumentLocal.ts.
 */
export declare function parseDocumentWithLocalService({ documentSource, isDocumentUrl, sessionId, llamaCloudApiKey, useBase64, }: {
|
|
2
|
+
isDocumentUrl: boolean;
|
|
3
|
+
documentSource: string;
|
|
4
|
+
sessionId: string;
|
|
5
|
+
llamaCloudApiKey?: string;
|
|
6
|
+
useBase64?: boolean;
|
|
7
|
+
}): Promise<{
|
|
8
|
+
rawContent: string;
|
|
9
|
+
metadata: {
|
|
10
|
+
fileSize: number | undefined;
|
|
11
|
+
fileType: string;
|
|
12
|
+
processingTime: number;
|
|
13
|
+
contentLength: number;
|
|
14
|
+
};
|
|
15
|
+
}>;
|
|
16
|
+
//# sourceMappingURL=parseDocumentLocal.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"parseDocumentLocal.d.ts","sourceRoot":"","sources":["../../../src/internalTools/documentExtraction/parseDocumentLocal.ts"],"names":[],"mappings":"AAKA,wBAAsB,6BAA6B,CAAC,EAClD,cAAc,EACd,aAAa,EACb,SAAS,EACT,gBAAgB,EAChB,SAAS,GACV,EAAE;IACD,aAAa,EAAE,OAAO,CAAC;IACvB,cAAc,EAAE,MAAM,CAAC;IACvB,SAAS,EAAE,MAAM,CAAC;IAClB,gBAAgB,CAAC,EAAE,MAAM,CAAC;IAC1B,SAAS,CAAC,EAAE,OAAO,CAAC;CACrB;;;;;;;;GA8DA"}
|