@vertesia/workflow 0.42.2
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/LICENSE +13 -0
- package/README.md +24 -0
- package/bin/bundle-workflows.mjs +26 -0
- package/lib/cjs/activities/advanced/createDocumentTypeFromInteractionRun.js +32 -0
- package/lib/cjs/activities/advanced/createDocumentTypeFromInteractionRun.js.map +1 -0
- package/lib/cjs/activities/advanced/createOrUpdateDocumentFromInteractionRun.js +66 -0
- package/lib/cjs/activities/advanced/createOrUpdateDocumentFromInteractionRun.js.map +1 -0
- package/lib/cjs/activities/advanced/updateDocumentFromInteractionRun.js +18 -0
- package/lib/cjs/activities/advanced/updateDocumentFromInteractionRun.js.map +1 -0
- package/lib/cjs/activities/chunkDocument.js +79 -0
- package/lib/cjs/activities/chunkDocument.js.map +1 -0
- package/lib/cjs/activities/createDocumentFromOther.js +64 -0
- package/lib/cjs/activities/createDocumentFromOther.js.map +1 -0
- package/lib/cjs/activities/executeInteraction.js +135 -0
- package/lib/cjs/activities/executeInteraction.js.map +1 -0
- package/lib/cjs/activities/extractDocumentText.js +140 -0
- package/lib/cjs/activities/extractDocumentText.js.map +1 -0
- package/lib/cjs/activities/generateDocumentProperties.js +59 -0
- package/lib/cjs/activities/generateDocumentProperties.js.map +1 -0
- package/lib/cjs/activities/generateEmbeddings.js +292 -0
- package/lib/cjs/activities/generateEmbeddings.js.map +1 -0
- package/lib/cjs/activities/generateImageRendition.js +104 -0
- package/lib/cjs/activities/generateImageRendition.js.map +1 -0
- package/lib/cjs/activities/generateOrAssignContentType.js +103 -0
- package/lib/cjs/activities/generateOrAssignContentType.js.map +1 -0
- package/lib/cjs/activities/getObjectFromStore.js +20 -0
- package/lib/cjs/activities/getObjectFromStore.js.map +1 -0
- package/lib/cjs/activities/index.js +54 -0
- package/lib/cjs/activities/index.js.map +1 -0
- package/lib/cjs/activities/media/processPdfWithTextract.js +102 -0
- package/lib/cjs/activities/media/processPdfWithTextract.js.map +1 -0
- package/lib/cjs/activities/media/transcribeMediaWithGladia.js +51 -0
- package/lib/cjs/activities/media/transcribeMediaWithGladia.js.map +1 -0
- package/lib/cjs/activities/notifyWebhook.js +34 -0
- package/lib/cjs/activities/notifyWebhook.js.map +1 -0
- package/lib/cjs/activities/setDocumentStatus.js +15 -0
- package/lib/cjs/activities/setDocumentStatus.js.map +1 -0
- package/lib/cjs/conversion/TextractProcessor.js +416 -0
- package/lib/cjs/conversion/TextractProcessor.js.map +1 -0
- package/lib/cjs/conversion/image.js +22 -0
- package/lib/cjs/conversion/image.js.map +1 -0
- package/lib/cjs/conversion/mutool.js +147 -0
- package/lib/cjs/conversion/mutool.js.map +1 -0
- package/lib/cjs/conversion/pandoc.js +39 -0
- package/lib/cjs/conversion/pandoc.js.map +1 -0
- package/lib/cjs/conversion/pdf.js +13 -0
- package/lib/cjs/conversion/pdf.js.map +1 -0
- package/lib/cjs/dsl/conditions.js +81 -0
- package/lib/cjs/dsl/conditions.js.map +1 -0
- package/lib/cjs/dsl/dsl-workflow.js +223 -0
- package/lib/cjs/dsl/dsl-workflow.js.map +1 -0
- package/lib/cjs/dsl/projections.js +59 -0
- package/lib/cjs/dsl/projections.js.map +1 -0
- package/lib/cjs/dsl/setup/ActivityContext.js +96 -0
- package/lib/cjs/dsl/setup/ActivityContext.js.map +1 -0
- package/lib/cjs/dsl/setup/fetch/DataProvider.js +51 -0
- package/lib/cjs/dsl/setup/fetch/DataProvider.js.map +1 -0
- package/lib/cjs/dsl/setup/fetch/index.js +16 -0
- package/lib/cjs/dsl/setup/fetch/index.js.map +1 -0
- package/lib/cjs/dsl/setup/fetch/providers.js +67 -0
- package/lib/cjs/dsl/setup/fetch/providers.js.map +1 -0
- package/lib/cjs/dsl/test/test-child-workflow.js +10 -0
- package/lib/cjs/dsl/test/test-child-workflow.js.map +1 -0
- package/lib/cjs/dsl/validation.js +122 -0
- package/lib/cjs/dsl/validation.js.map +1 -0
- package/lib/cjs/dsl/vars.js +341 -0
- package/lib/cjs/dsl/vars.js.map +1 -0
- package/lib/cjs/dsl/walk.js +100 -0
- package/lib/cjs/dsl/walk.js.map +1 -0
- package/lib/cjs/errors.js +36 -0
- package/lib/cjs/errors.js.map +1 -0
- package/lib/cjs/index.js +43 -0
- package/lib/cjs/index.js.map +1 -0
- package/lib/cjs/iterative-generation/activities/extractToc.js +47 -0
- package/lib/cjs/iterative-generation/activities/extractToc.js.map +1 -0
- package/lib/cjs/iterative-generation/activities/finalizeOutput.js +69 -0
- package/lib/cjs/iterative-generation/activities/finalizeOutput.js.map +1 -0
- package/lib/cjs/iterative-generation/activities/generatePart.js +73 -0
- package/lib/cjs/iterative-generation/activities/generatePart.js.map +1 -0
- package/lib/cjs/iterative-generation/activities/generateToc.js +91 -0
- package/lib/cjs/iterative-generation/activities/generateToc.js.map +1 -0
- package/lib/cjs/iterative-generation/activities/index.js +12 -0
- package/lib/cjs/iterative-generation/activities/index.js.map +1 -0
- package/lib/cjs/iterative-generation/iterativeGenerationWorkflow.js +55 -0
- package/lib/cjs/iterative-generation/iterativeGenerationWorkflow.js.map +1 -0
- package/lib/cjs/iterative-generation/types.js +5 -0
- package/lib/cjs/iterative-generation/types.js.map +1 -0
- package/lib/cjs/iterative-generation/utils.js +118 -0
- package/lib/cjs/iterative-generation/utils.js.map +1 -0
- package/lib/cjs/package.json +3 -0
- package/lib/cjs/result-types.js +10 -0
- package/lib/cjs/result-types.js.map +1 -0
- package/lib/cjs/system/generateObjectText.js +89 -0
- package/lib/cjs/system/generateObjectText.js.map +1 -0
- package/lib/cjs/system/notifyWebhookWorkflow.js +52 -0
- package/lib/cjs/system/notifyWebhookWorkflow.js.map +1 -0
- package/lib/cjs/system/recalculateEmbeddingsWorkflow.js +37 -0
- package/lib/cjs/system/recalculateEmbeddingsWorkflow.js.map +1 -0
- package/lib/cjs/utils/auth.js +15 -0
- package/lib/cjs/utils/auth.js.map +1 -0
- package/lib/cjs/utils/blobs.js +63 -0
- package/lib/cjs/utils/blobs.js.map +1 -0
- package/lib/cjs/utils/client.js +25 -0
- package/lib/cjs/utils/client.js.map +1 -0
- package/lib/cjs/utils/expand-vars.js +33 -0
- package/lib/cjs/utils/expand-vars.js.map +1 -0
- package/lib/cjs/utils/memory.js +72 -0
- package/lib/cjs/utils/memory.js.map +1 -0
- package/lib/cjs/utils/tokens.js +38 -0
- package/lib/cjs/utils/tokens.js.map +1 -0
- package/lib/cjs/vars.js +20 -0
- package/lib/cjs/vars.js.map +1 -0
- package/lib/cjs/workflows.js +17 -0
- package/lib/cjs/workflows.js.map +1 -0
- package/lib/esm/activities/advanced/createDocumentTypeFromInteractionRun.js +29 -0
- package/lib/esm/activities/advanced/createDocumentTypeFromInteractionRun.js.map +1 -0
- package/lib/esm/activities/advanced/createOrUpdateDocumentFromInteractionRun.js +63 -0
- package/lib/esm/activities/advanced/createOrUpdateDocumentFromInteractionRun.js.map +1 -0
- package/lib/esm/activities/advanced/updateDocumentFromInteractionRun.js +15 -0
- package/lib/esm/activities/advanced/updateDocumentFromInteractionRun.js.map +1 -0
- package/lib/esm/activities/chunkDocument.js +76 -0
- package/lib/esm/activities/chunkDocument.js.map +1 -0
- package/lib/esm/activities/createDocumentFromOther.js +58 -0
- package/lib/esm/activities/createDocumentFromOther.js.map +1 -0
- package/lib/esm/activities/executeInteraction.js +131 -0
- package/lib/esm/activities/executeInteraction.js.map +1 -0
- package/lib/esm/activities/extractDocumentText.js +137 -0
- package/lib/esm/activities/extractDocumentText.js.map +1 -0
- package/lib/esm/activities/generateDocumentProperties.js +56 -0
- package/lib/esm/activities/generateDocumentProperties.js.map +1 -0
- package/lib/esm/activities/generateEmbeddings.js +256 -0
- package/lib/esm/activities/generateEmbeddings.js.map +1 -0
- package/lib/esm/activities/generateImageRendition.js +98 -0
- package/lib/esm/activities/generateImageRendition.js.map +1 -0
- package/lib/esm/activities/generateOrAssignContentType.js +100 -0
- package/lib/esm/activities/generateOrAssignContentType.js.map +1 -0
- package/lib/esm/activities/getObjectFromStore.js +17 -0
- package/lib/esm/activities/getObjectFromStore.js.map +1 -0
- package/lib/esm/activities/index.js +21 -0
- package/lib/esm/activities/index.js.map +1 -0
- package/lib/esm/activities/media/processPdfWithTextract.js +98 -0
- package/lib/esm/activities/media/processPdfWithTextract.js.map +1 -0
- package/lib/esm/activities/media/transcribeMediaWithGladia.js +48 -0
- package/lib/esm/activities/media/transcribeMediaWithGladia.js.map +1 -0
- package/lib/esm/activities/notifyWebhook.js +31 -0
- package/lib/esm/activities/notifyWebhook.js.map +1 -0
- package/lib/esm/activities/setDocumentStatus.js +12 -0
- package/lib/esm/activities/setDocumentStatus.js.map +1 -0
- package/lib/esm/conversion/TextractProcessor.js +409 -0
- package/lib/esm/conversion/TextractProcessor.js.map +1 -0
- package/lib/esm/conversion/image.js +16 -0
- package/lib/esm/conversion/image.js.map +1 -0
- package/lib/esm/conversion/mutool.js +139 -0
- package/lib/esm/conversion/mutool.js.map +1 -0
- package/lib/esm/conversion/pandoc.js +36 -0
- package/lib/esm/conversion/pandoc.js.map +1 -0
- package/lib/esm/conversion/pdf.js +7 -0
- package/lib/esm/conversion/pdf.js.map +1 -0
- package/lib/esm/dsl/conditions.js +75 -0
- package/lib/esm/dsl/conditions.js.map +1 -0
- package/lib/esm/dsl/dsl-workflow.js +216 -0
- package/lib/esm/dsl/dsl-workflow.js.map +1 -0
- package/lib/esm/dsl/projections.js +55 -0
- package/lib/esm/dsl/projections.js.map +1 -0
- package/lib/esm/dsl/setup/ActivityContext.js +91 -0
- package/lib/esm/dsl/setup/ActivityContext.js.map +1 -0
- package/lib/esm/dsl/setup/fetch/DataProvider.js +47 -0
- package/lib/esm/dsl/setup/fetch/DataProvider.js.map +1 -0
- package/lib/esm/dsl/setup/fetch/index.js +12 -0
- package/lib/esm/dsl/setup/fetch/index.js.map +1 -0
- package/lib/esm/dsl/setup/fetch/providers.js +61 -0
- package/lib/esm/dsl/setup/fetch/providers.js.map +1 -0
- package/lib/esm/dsl/test/test-child-workflow.js +5 -0
- package/lib/esm/dsl/test/test-child-workflow.js.map +1 -0
- package/lib/esm/dsl/validation.js +118 -0
- package/lib/esm/dsl/validation.js.map +1 -0
- package/lib/esm/dsl/vars.js +335 -0
- package/lib/esm/dsl/vars.js.map +1 -0
- package/lib/esm/dsl/walk.js +96 -0
- package/lib/esm/dsl/walk.js.map +1 -0
- package/lib/esm/errors.js +30 -0
- package/lib/esm/errors.js.map +1 -0
- package/lib/esm/index.js +25 -0
- package/lib/esm/index.js.map +1 -0
- package/lib/esm/iterative-generation/activities/extractToc.js +44 -0
- package/lib/esm/iterative-generation/activities/extractToc.js.map +1 -0
- package/lib/esm/iterative-generation/activities/finalizeOutput.js +66 -0
- package/lib/esm/iterative-generation/activities/finalizeOutput.js.map +1 -0
- package/lib/esm/iterative-generation/activities/generatePart.js +70 -0
- package/lib/esm/iterative-generation/activities/generatePart.js.map +1 -0
- package/lib/esm/iterative-generation/activities/generateToc.js +88 -0
- package/lib/esm/iterative-generation/activities/generateToc.js.map +1 -0
- package/lib/esm/iterative-generation/activities/index.js +5 -0
- package/lib/esm/iterative-generation/activities/index.js.map +1 -0
- package/lib/esm/iterative-generation/iterativeGenerationWorkflow.js +52 -0
- package/lib/esm/iterative-generation/iterativeGenerationWorkflow.js.map +1 -0
- package/lib/esm/iterative-generation/types.js +2 -0
- package/lib/esm/iterative-generation/types.js.map +1 -0
- package/lib/esm/iterative-generation/utils.js +109 -0
- package/lib/esm/iterative-generation/utils.js.map +1 -0
- package/lib/esm/result-types.js +7 -0
- package/lib/esm/result-types.js.map +1 -0
- package/lib/esm/system/generateObjectText.js +86 -0
- package/lib/esm/system/generateObjectText.js.map +1 -0
- package/lib/esm/system/notifyWebhookWorkflow.js +49 -0
- package/lib/esm/system/notifyWebhookWorkflow.js.map +1 -0
- package/lib/esm/system/recalculateEmbeddingsWorkflow.js +34 -0
- package/lib/esm/system/recalculateEmbeddingsWorkflow.js.map +1 -0
- package/lib/esm/utils/auth.js +8 -0
- package/lib/esm/utils/auth.js.map +1 -0
- package/lib/esm/utils/blobs.js +52 -0
- package/lib/esm/utils/blobs.js.map +1 -0
- package/lib/esm/utils/client.js +22 -0
- package/lib/esm/utils/client.js.map +1 -0
- package/lib/esm/utils/expand-vars.js +30 -0
- package/lib/esm/utils/expand-vars.js.map +1 -0
- package/lib/esm/utils/memory.js +60 -0
- package/lib/esm/utils/memory.js.map +1 -0
- package/lib/esm/utils/tokens.js +34 -0
- package/lib/esm/utils/tokens.js.map +1 -0
- package/lib/esm/vars.js +4 -0
- package/lib/esm/vars.js.map +1 -0
- package/lib/esm/workflows.js +9 -0
- package/lib/esm/workflows.js.map +1 -0
- package/lib/types/activities/advanced/createDocumentTypeFromInteractionRun.d.ts +17 -0
- package/lib/types/activities/advanced/createDocumentTypeFromInteractionRun.d.ts.map +1 -0
- package/lib/types/activities/advanced/createOrUpdateDocumentFromInteractionRun.d.ts +29 -0
- package/lib/types/activities/advanced/createOrUpdateDocumentFromInteractionRun.d.ts.map +1 -0
- package/lib/types/activities/advanced/updateDocumentFromInteractionRun.d.ts +19 -0
- package/lib/types/activities/advanced/updateDocumentFromInteractionRun.d.ts.map +1 -0
- package/lib/types/activities/chunkDocument.d.ts +18 -0
- package/lib/types/activities/chunkDocument.d.ts.map +1 -0
- package/lib/types/activities/createDocumentFromOther.d.ts +21 -0
- package/lib/types/activities/createDocumentFromOther.d.ts.map +1 -0
- package/lib/types/activities/executeInteraction.d.ts +40 -0
- package/lib/types/activities/executeInteraction.d.ts.map +1 -0
- package/lib/types/activities/extractDocumentText.d.ts +9 -0
- package/lib/types/activities/extractDocumentText.d.ts.map +1 -0
- package/lib/types/activities/generateDocumentProperties.d.ts +32 -0
- package/lib/types/activities/generateDocumentProperties.d.ts.map +1 -0
- package/lib/types/activities/generateEmbeddings.d.ts +49 -0
- package/lib/types/activities/generateEmbeddings.d.ts.map +1 -0
- package/lib/types/activities/generateImageRendition.d.ts +17 -0
- package/lib/types/activities/generateImageRendition.d.ts.map +1 -0
- package/lib/types/activities/generateOrAssignContentType.d.ts +44 -0
- package/lib/types/activities/generateOrAssignContentType.d.ts.map +1 -0
- package/lib/types/activities/getObjectFromStore.d.ts +14 -0
- package/lib/types/activities/getObjectFromStore.d.ts.map +1 -0
- package/lib/types/activities/index.d.ts +21 -0
- package/lib/types/activities/index.d.ts.map +1 -0
- package/lib/types/activities/media/processPdfWithTextract.d.ts +26 -0
- package/lib/types/activities/media/processPdfWithTextract.d.ts.map +1 -0
- package/lib/types/activities/media/transcribeMediaWithGladia.d.ts +14 -0
- package/lib/types/activities/media/transcribeMediaWithGladia.d.ts.map +1 -0
- package/lib/types/activities/notifyWebhook.d.ts +17 -0
- package/lib/types/activities/notifyWebhook.d.ts.map +1 -0
- package/lib/types/activities/setDocumentStatus.d.ts +15 -0
- package/lib/types/activities/setDocumentStatus.d.ts.map +1 -0
- package/lib/types/conversion/TextractProcessor.d.ts +45 -0
- package/lib/types/conversion/TextractProcessor.d.ts.map +1 -0
- package/lib/types/conversion/image.d.ts +9 -0
- package/lib/types/conversion/image.d.ts.map +1 -0
- package/lib/types/conversion/mutool.d.ts +19 -0
- package/lib/types/conversion/mutool.d.ts.map +1 -0
- package/lib/types/conversion/pandoc.d.ts +2 -0
- package/lib/types/conversion/pandoc.d.ts.map +1 -0
- package/lib/types/conversion/pdf.d.ts +2 -0
- package/lib/types/conversion/pdf.d.ts.map +1 -0
- package/lib/types/dsl/conditions.d.ts +2 -0
- package/lib/types/dsl/conditions.d.ts.map +1 -0
- package/lib/types/dsl/dsl-workflow.d.ts +5 -0
- package/lib/types/dsl/dsl-workflow.d.ts.map +1 -0
- package/lib/types/dsl/projections.d.ts +4 -0
- package/lib/types/dsl/projections.d.ts.map +1 -0
- package/lib/types/dsl/setup/ActivityContext.d.ts +14 -0
- package/lib/types/dsl/setup/ActivityContext.d.ts.map +1 -0
- package/lib/types/dsl/setup/fetch/DataProvider.d.ts +9 -0
- package/lib/types/dsl/setup/fetch/DataProvider.d.ts.map +1 -0
- package/lib/types/dsl/setup/fetch/index.d.ts +6 -0
- package/lib/types/dsl/setup/fetch/index.d.ts.map +1 -0
- package/lib/types/dsl/setup/fetch/providers.d.ts +25 -0
- package/lib/types/dsl/setup/fetch/providers.d.ts.map +1 -0
- package/lib/types/dsl/test/test-child-workflow.d.ts +4 -0
- package/lib/types/dsl/test/test-child-workflow.d.ts.map +1 -0
- package/lib/types/dsl/validation.d.ts +4 -0
- package/lib/types/dsl/validation.d.ts.map +1 -0
- package/lib/types/dsl/vars.d.ts +48 -0
- package/lib/types/dsl/vars.d.ts.map +1 -0
- package/lib/types/dsl/walk.d.ts +18 -0
- package/lib/types/dsl/walk.d.ts.map +1 -0
- package/lib/types/errors.d.ts +16 -0
- package/lib/types/errors.d.ts.map +1 -0
- package/lib/types/index.d.ts +24 -0
- package/lib/types/index.d.ts.map +1 -0
- package/lib/types/iterative-generation/activities/extractToc.d.ts +10 -0
- package/lib/types/iterative-generation/activities/extractToc.d.ts.map +1 -0
- package/lib/types/iterative-generation/activities/finalizeOutput.d.ts +3 -0
- package/lib/types/iterative-generation/activities/finalizeOutput.d.ts.map +1 -0
- package/lib/types/iterative-generation/activities/generatePart.d.ts +3 -0
- package/lib/types/iterative-generation/activities/generatePart.d.ts.map +1 -0
- package/lib/types/iterative-generation/activities/generateToc.d.ts +4 -0
- package/lib/types/iterative-generation/activities/generateToc.d.ts.map +1 -0
- package/lib/types/iterative-generation/activities/index.d.ts +5 -0
- package/lib/types/iterative-generation/activities/index.d.ts.map +1 -0
- package/lib/types/iterative-generation/iterativeGenerationWorkflow.d.ts +3 -0
- package/lib/types/iterative-generation/iterativeGenerationWorkflow.d.ts.map +1 -0
- package/lib/types/iterative-generation/types.d.ts +79 -0
- package/lib/types/iterative-generation/types.d.ts.map +1 -0
- package/lib/types/iterative-generation/utils.d.ts +27 -0
- package/lib/types/iterative-generation/utils.d.ts.map +1 -0
- package/lib/types/result-types.d.ts +22 -0
- package/lib/types/result-types.d.ts.map +1 -0
- package/lib/types/system/generateObjectText.d.ts +4 -0
- package/lib/types/system/generateObjectText.d.ts.map +1 -0
- package/lib/types/system/notifyWebhookWorkflow.d.ts +6 -0
- package/lib/types/system/notifyWebhookWorkflow.d.ts.map +1 -0
- package/lib/types/system/recalculateEmbeddingsWorkflow.d.ts +40 -0
- package/lib/types/system/recalculateEmbeddingsWorkflow.d.ts.map +1 -0
- package/lib/types/utils/auth.d.ts +4 -0
- package/lib/types/utils/auth.d.ts.map +1 -0
- package/lib/types/utils/blobs.d.ts +8 -0
- package/lib/types/utils/blobs.d.ts.map +1 -0
- package/lib/types/utils/client.d.ts +7 -0
- package/lib/types/utils/client.d.ts.map +1 -0
- package/lib/types/utils/expand-vars.d.ts +8 -0
- package/lib/types/utils/expand-vars.d.ts.map +1 -0
- package/lib/types/utils/memory.d.ts +12 -0
- package/lib/types/utils/memory.d.ts.map +1 -0
- package/lib/types/utils/tokens.d.ts +11 -0
- package/lib/types/utils/tokens.d.ts.map +1 -0
- package/lib/types/vars.d.ts +3 -0
- package/lib/types/vars.d.ts.map +1 -0
- package/lib/types/workflows.d.ts +9 -0
- package/lib/types/workflows.d.ts.map +1 -0
- package/lib/workflows-bundle.js +18394 -0
- package/package.json +109 -0
- package/src/activities/advanced/createDocumentTypeFromInteractionRun.ts +54 -0
- package/src/activities/advanced/createOrUpdateDocumentFromInteractionRun.ts +97 -0
- package/src/activities/advanced/updateDocumentFromInteractionRun.ts +34 -0
- package/src/activities/chunkDocument.ts +124 -0
- package/src/activities/createDocumentFromOther.ts +92 -0
- package/src/activities/executeInteraction.ts +191 -0
- package/src/activities/extractDocumentText.ts +174 -0
- package/src/activities/generateDocumentProperties.ts +93 -0
- package/src/activities/generateEmbeddings.ts +345 -0
- package/src/activities/generateImageRendition.ts +134 -0
- package/src/activities/generateOrAssignContentType.ts +152 -0
- package/src/activities/getObjectFromStore.ts +31 -0
- package/src/activities/index.ts +21 -0
- package/src/activities/media/processPdfWithTextract.ts +141 -0
- package/src/activities/media/transcribeMediaWithGladia.ts +83 -0
- package/src/activities/notifyWebhook.test.ts +32 -0
- package/src/activities/notifyWebhook.ts +51 -0
- package/src/activities/setDocumentStatus.ts +25 -0
- package/src/conversion/TextractProcessor.ts +505 -0
- package/src/conversion/image.test.ts +26 -0
- package/src/conversion/image.ts +22 -0
- package/src/conversion/mutool.test.ts +74 -0
- package/src/conversion/mutool.ts +180 -0
- package/src/conversion/pandoc.test.ts +22 -0
- package/src/conversion/pandoc.ts +44 -0
- package/src/conversion/pdf.test.ts +35 -0
- package/src/conversion/pdf.ts +8 -0
- package/src/dsl/conditions.ts +76 -0
- package/src/dsl/dsl-workflow.test.ts +58 -0
- package/src/dsl/dsl-workflow.ts +235 -0
- package/src/dsl/ms.d.ts +11 -0
- package/src/dsl/projections.test.ts +159 -0
- package/src/dsl/projections.ts +72 -0
- package/src/dsl/setup/ActivityContext.ts +106 -0
- package/src/dsl/setup/fetch/DataProvider.ts +45 -0
- package/src/dsl/setup/fetch/index.ts +19 -0
- package/src/dsl/setup/fetch/providers.ts +67 -0
- package/src/dsl/test/test-child-workflow.ts +6 -0
- package/src/dsl/validation.test.ts +257 -0
- package/src/dsl/validation.ts +125 -0
- package/src/dsl/vars.test.ts +245 -0
- package/src/dsl/vars.ts +340 -0
- package/src/dsl/walk.test.ts +81 -0
- package/src/dsl/walk.ts +103 -0
- package/src/dsl/workflow-exec-child.test.ts +182 -0
- package/src/dsl/workflow-fetch.test.ts +135 -0
- package/src/dsl/workflow-import.test.ts +89 -0
- package/src/dsl/workflow.test.ts +110 -0
- package/src/errors.ts +24 -0
- package/src/index.ts +27 -0
- package/src/iterative-generation/activities/extractToc.ts +49 -0
- package/src/iterative-generation/activities/finalizeOutput.ts +77 -0
- package/src/iterative-generation/activities/generatePart.ts +82 -0
- package/src/iterative-generation/activities/generateToc.ts +98 -0
- package/src/iterative-generation/activities/index.ts +4 -0
- package/src/iterative-generation/iterativeGenerationWorkflow.ts +67 -0
- package/src/iterative-generation/types.ts +99 -0
- package/src/iterative-generation/utils.ts +123 -0
- package/src/result-types.ts +25 -0
- package/src/system/generateObjectText.ts +109 -0
- package/src/system/notifyWebhookWorkflow.ts +64 -0
- package/src/system/recalculateEmbeddingsWorkflow.ts +46 -0
- package/src/utils/auth.ts +10 -0
- package/src/utils/blobs.ts +58 -0
- package/src/utils/client.ts +31 -0
- package/src/utils/expand-vars.ts +31 -0
- package/src/utils/memory.ts +66 -0
- package/src/utils/tokens.ts +44 -0
- package/src/vars.ts +3 -0
- package/src/workflows.ts +9 -0
package/LICENSE
ADDED
@@ -0,0 +1,13 @@
|
|
1
|
+
Copyright 2024 Composable Prompts
|
2
|
+
|
3
|
+
Licensed under the Apache License, Version 2.0 (the "License");
|
4
|
+
you may not use this file except in compliance with the License.
|
5
|
+
You may obtain a copy of the License at
|
6
|
+
|
7
|
+
http://www.apache.org/licenses/LICENSE-2.0
|
8
|
+
|
9
|
+
Unless required by applicable law or agreed to in writing, software
|
10
|
+
distributed under the License is distributed on an "AS IS" BASIS,
|
11
|
+
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
12
|
+
See the License for the specific language governing permissions and
|
13
|
+
limitations under the License.
|
package/README.md
ADDED
@@ -0,0 +1,24 @@
|
|
1
|
+
# Zeno Workflows
|
2
|
+
|
3
|
+
This package implements the workflow tasks shared by all content object types.
|
4
|
+
|
5
|
+
There are 3 main sequential tasks:
|
6
|
+
|
7
|
+
1. Build Content
|
8
|
+
2. Build Properties
|
9
|
+
3. Build Tree
|
10
|
+
|
11
|
+
## Build Content
|
12
|
+
|
13
|
+
This task generates the text content from the object's content source, if any.
|
14
|
+
|
15
|
+
If no content source was provided, e.g. the object text field is already filled by the client or the object type doesn't support generating text content, this task will do nothing.
|
16
|
+
|
17
|
+
## Build Properties
|
18
|
+
This task generates metadata properties or the `object` field.
|
19
|
+
|
20
|
+
It will do nothing for object types that don't need to generate extra properties.
|
21
|
+
|
22
|
+
## Build Tree
|
23
|
+
This task generates the sub-objects, if any.
|
24
|
+
|
@@ -0,0 +1,26 @@
|
|
1
|
+
#!/usr/bin/env node
|
2
|
+
|
3
|
+
import { bundleWorkflowCode } from '@temporalio/worker';
|
4
|
+
import { writeFile } from 'fs/promises';
|
5
|
+
import path from 'path';
|
6
|
+
|
7
|
+
/**
 * Bundles the workflow code located at `wsPath` with Temporal's
 * `bundleWorkflowCode` and writes the generated code to `bundlePath`.
 *
 * Both paths go through `path.resolve` before use, and the resolved output
 * path is logged once the file has been written.
 *
 * @param {string} wsPath - Path to the workflows entry file.
 * @param {string} bundlePath - Path of the bundle file to write.
 * @returns {Promise<void>} Settles once the bundle has been written.
 */
async function bundle(wsPath, bundlePath) {
    const workflowsPath = path.resolve(wsPath);
    const bundled = await bundleWorkflowCode({ workflowsPath });
    // The output path is resolved only after bundling succeeded.
    const outputFile = path.resolve(bundlePath);
    await writeFile(outputFile, bundled.code);
    console.log(`Bundle written to ${outputFile}`);
}
|
15
|
+
|
16
|
+
// Command-line entry point. The first two positional arguments are the
// workflows path and the path of the bundle file to write.
const wsPath = process.argv[2];
const bundlePath = process.argv[3];
if (!wsPath || !bundlePath) {
    // The usage line names this script (bin/bundle-workflows.mjs); it used to
    // advertise a non-matching "build-workflows" command.
    console.error('Usage: bundle-workflows <workflows-path> <bundle-path>');
    process.exit(1);
}

// Any bundling or write failure is printed and reported as a non-zero exit
// code instead of being left as an unhandled rejection.
bundle(wsPath, bundlePath).catch((err) => {
    console.error(err);
    process.exit(1);
});
|
@@ -0,0 +1,32 @@
|
|
1
|
+
"use strict";
|
2
|
+
Object.defineProperty(exports, "__esModule", { value: true });
|
3
|
+
exports.createDocumentTypeFromInteractionRun = createDocumentTypeFromInteractionRun;
|
4
|
+
const activity_1 = require("@temporalio/activity");
|
5
|
+
const projections_js_1 = require("../../dsl/projections.js");
|
6
|
+
const ActivityContext_js_1 = require("../../dsl/setup/ActivityContext.js");
|
7
|
+
const errors_js_1 = require("../../errors.js");
|
8
|
+
/**
 * Creates a document type from the result of an interaction run and, when
 * `params.updateObjectId` is set, assigns the new type to that object.
 *
 * The run result supplies `document_type` (used as the type name),
 * `metadata_schema` (used as the object schema) and `is_chunkable`
 * (coerced to a boolean).
 *
 * @param payload - Activity payload handed to `setupActivity`.
 * @returns The value produced by `projectResult` for the created type, with
 *   `{ id, name }` of the type passed as its last argument.
 * @throws {ActivityParamNotFound} When `params.run` is missing.
 * @throws {Error} When the run has no result or the result has no
 *   `document_type`.
 */
async function createDocumentTypeFromInteractionRun(payload) {
    const { params, client } = await (0, ActivityContext_js_1.setupActivity)(payload);
    if (!params.run) {
        throw new errors_js_1.ActivityParamNotFound("run", payload.activity);
    }
    const genTypeRes = params.run.result;
    // Optional chaining sends a run without any result down the same explicit
    // error path instead of failing with a TypeError on the property access.
    if (!genTypeRes?.document_type) {
        activity_1.log.error("No name generated for type: " + JSON.stringify(genTypeRes), genTypeRes);
        throw new Error("No name generated for type");
    }
    activity_1.log.info("Generated schema for type", genTypeRes.metadata_schema);
    const typeData = {
        name: genTypeRes.document_type,
        object_schema: genTypeRes.metadata_schema,
        is_chunkable: !!genTypeRes.is_chunkable,
    };
    const type = await client.types.create(typeData);
    if (params.updateObjectId) {
        // Point the existing object at the freshly created type.
        await client.objects.update(params.updateObjectId, {
            type: type.id,
        });
    }
    return (0, projections_js_1.projectResult)(payload, params, type, { id: type.id, name: type.name });
}
|
32
|
+
//# sourceMappingURL=createDocumentTypeFromInteractionRun.js.map
|
@@ -0,0 +1 @@
|
|
1
|
+
{"version":3,"file":"createDocumentTypeFromInteractionRun.js","sourceRoot":"","sources":["../../../../src/activities/advanced/createDocumentTypeFromInteractionRun.ts"],"names":[],"mappings":";;AAuBA,oFA8BC;AApDD,mDAA2C;AAC3C,6DAAyD;AACzD,2EAAmE;AACnE,+CAAwD;AAmBjD,KAAK,UAAU,oCAAoC,CAAC,OAAoC;IAC3F,MAAM,EAAE,MAAM,EAAE,MAAM,EAAE,GAAG,MAAM,IAAA,kCAAa,EAA6C,OAAO,CAAC,CAAC;IAEpG,IAAI,CAAC,MAAM,CAAC,GAAG,EAAE,CAAC;QACd,MAAM,IAAI,iCAAqB,CAAC,KAAK,EAAE,OAAO,CAAC,QAAQ,CAAC,CAAC;IAC7D,CAAC;IAED,MAAM,UAAU,GAAG,MAAM,CAAC,GAAG,CAAC,MAAM,CAAC;IAErC,IAAI,CAAC,UAAU,CAAC,aAAa,EAAE,CAAC;QAC5B,cAAG,CAAC,KAAK,CAAC,8BAA8B,GAAG,IAAI,CAAC,SAAS,CAAC,UAAU,CAAC,EAAE,UAAU,CAAC,CAAC;QACnF,MAAM,IAAI,KAAK,CAAC,4BAA4B,CAAC,CAAC;IAClD,CAAC;IAED,cAAG,CAAC,IAAI,CAAC,2BAA2B,EAAE,UAAU,CAAC,eAAe,CAAC,CAAC;IAClE,MAAM,QAAQ,GAAmC;QAC7C,IAAI,EAAE,UAAU,CAAC,aAAa;QAC9B,aAAa,EAAE,UAAU,CAAC,eAAe;QACzC,YAAY,EAAE,CAAC,CAAC,UAAU,CAAC,YAAY;KAC1C,CAAA;IAED,MAAM,IAAI,GAAG,MAAM,MAAM,CAAC,KAAK,CAAC,MAAM,CAAC,QAAQ,CAAC,CAAC;IAEjD,IAAI,MAAM,CAAC,cAAc,EAAE,CAAC;QACxB,MAAM,MAAM,CAAC,OAAO,CAAC,MAAM,CAAC,MAAM,CAAC,cAAc,EAAE;YAC/C,IAAI,EAAE,IAAI,CAAC,EAAE;SAChB,CAAC,CAAC;IACP,CAAC;IAED,OAAO,IAAA,8BAAa,EAAC,OAAO,EAAE,MAAM,EAAE,IAAI,EAAE,EAAE,EAAE,EAAE,IAAI,CAAC,EAAE,EAAE,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,CAAC,CAAC;AAClF,CAAC"}
|
@@ -0,0 +1,66 @@
|
|
1
|
+
"use strict";
|
2
|
+
Object.defineProperty(exports, "__esModule", { value: true });
|
3
|
+
exports.createOrUpdateDocumentFromInteractionRun = createOrUpdateDocumentFromInteractionRun;
|
4
|
+
const common_1 = require("@vertesia/common");
|
5
|
+
const activity_1 = require("@temporalio/activity");
|
6
|
+
const ActivityContext_js_1 = require("../../dsl/setup/ActivityContext.js");
|
7
|
+
const errors_js_1 = require("../../errors.js");
|
8
|
+
/**
 * Creates a new document, or updates an existing one, from the result of an
 * interaction run.
 *
 * The run is fetched by `params.run_id`. An object result is stored as the
 * document properties; any other result is stored as the document text. The
 * document is updated when `params.update_existing_id` is set and created
 * otherwise.
 *
 * @param payload - Activity payload handed to `setupActivity`.
 * @returns `{ id, isNew, type }` where `id` is the document id and `isNew`
 *   tells whether the document was created.
 * @throws {ActivityParamNotFound} When `run_id` is missing, or when neither
 *   `object_type` nor `update_existing_id` is provided.
 * @throws {NoDocumentFound} When fetching the run or the type fails.
 */
async function createOrUpdateDocumentFromInteractionRun(payload) {
    const { params, client } = await (0, ActivityContext_js_1.setupActivity)(payload);
    const runId = params.run_id;
    const objectTypeName = params.object_type;
    if (!runId) {
        throw new errors_js_1.ActivityParamNotFound("run_id", payload.activity);
    }
    // A type name is only mandatory when a new document has to be created.
    if (!objectTypeName && !params.update_existing_id) {
        throw new errors_js_1.ActivityParamNotFound("object_type", payload.activity);
    }
    activity_1.log.info("Creating document from interaction result", { runId, objectTypeName });
    const run = await client.runs.retrieve(runId).catch((e) => {
        throw new errors_js_1.NoDocumentFound(`Error fetching run ${runId}: ${e.message}`);
    });
    const type = objectTypeName ?
        await client.types.getTypeByName(objectTypeName).catch((e) => {
            throw new errors_js_1.NoDocumentFound(`Error fetching type ${objectTypeName}: ${e.message}`);
        })
        : undefined;
    const result = run.result;
    // `typeof null` is 'object', so null must be excluded explicitly; otherwise
    // the property lookups below throw on a run with a null result.
    const resultIsObject = typeof result === 'object' && result !== null;
    const inputData = run.parameters;
    let name;
    if (resultIsObject) {
        name = result['name'] || result["title"] || inputData['name'] || params.fallback_name || 'Untitled';
    }
    else {
        name = inputData['name'] || params.fallback_name || 'Untitled';
    }
    const docPayload = {
        name,
        parent: params.parent ?? undefined,
        properties: resultIsObject ? result : {},
        // A null result is sent as "no text" rather than as an explicit null.
        text: resultIsObject ? undefined : (result ?? undefined),
        type: type?.id,
        status: common_1.ContentObjectStatus.completed,
        generation_run_info: {
            id: run.id,
            date: new Date().toISOString(),
            model: run.modelId,
            target: resultIsObject ? 'properties' : 'text'
        }
    };
    //create or update the document
    let newDoc = false;
    let doc = undefined;
    if (params.update_existing_id) {
        activity_1.log.info(`Updating existing document ${params.update_existing_id}`);
        doc = await client.objects.update(params.update_existing_id, docPayload);
    }
    else {
        activity_1.log.info(`Creating new document of type ${objectTypeName}`);
        doc = await client.objects.create(docPayload);
        newDoc = true;
    }
    // The type name is optional on updates; omit it instead of logging "undefined".
    const typeLabel = objectTypeName ? `${objectTypeName} ` : '';
    activity_1.log.info(`Document ${typeLabel}${doc.id}(${doc.name}) ${newDoc ? 'created' : 'updated'}`);
    // NOTE(review): `type` carries the document name, not the object type name.
    // Left unchanged because callers may rely on it; confirm the intent.
    return { id: doc.id, isNew: newDoc, type: name };
}
|
66
|
+
//# sourceMappingURL=createOrUpdateDocumentFromInteractionRun.js.map
|
@@ -0,0 +1 @@
|
|
1
|
+
{"version":3,"file":"createOrUpdateDocumentFromInteractionRun.js","sourceRoot":"","sources":["../../../../src/activities/advanced/createOrUpdateDocumentFromInteractionRun.ts"],"names":[],"mappings":";;AA8BA,4FAkEC;AAhGD,6CAAqG;AACrG,mDAA2C;AAC3C,2EAAmE;AACnE,+CAAyE;AA2BlE,KAAK,UAAU,wCAAwC,CAAC,OAAoC;IAC/F,MAAM,EAAE,MAAM,EAAE,MAAM,EAAE,GAAG,MAAM,IAAA,kCAAa,EAA+C,OAAO,CAAC,CAAC;IAEtG,MAAM,KAAK,GAAG,MAAM,CAAC,MAAM,CAAC;IAC5B,MAAM,cAAc,GAAG,MAAM,CAAC,WAAW,CAAC;IAE1C,IAAI,CAAC,KAAK,EAAE,CAAC;QACT,MAAM,IAAI,iCAAqB,CAAC,QAAQ,EAAE,OAAO,CAAC,QAAQ,CAAC,CAAC;IAChE,CAAC;IACD,IAAI,CAAC,cAAc,IAAI,CAAC,MAAM,CAAC,kBAAkB,EAAE,CAAC;QAChD,MAAM,IAAI,iCAAqB,CAAC,aAAa,EAAE,OAAO,CAAC,QAAQ,CAAC,CAAC;IACrE,CAAC;IAED,cAAG,CAAC,IAAI,CAAC,2CAA2C,EAAE,EAAE,KAAK,EAAE,cAAc,EAAE,CAAC,CAAC;IAEjF,MAAM,GAAG,GAAG,MAAM,MAAM,CAAC,IAAI,CAAC,QAAQ,CAAC,KAAK,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,EAAE,EAAE;QACtD,MAAM,IAAI,2BAAe,CAAC,sBAAsB,KAAK,KAAK,CAAC,CAAC,OAAO,EAAE,CAAC,CAAC;IAC3E,CAAC,CAAC,CAAC;IAEH,MAAM,IAAI,GAAG,cAAc,CAAC,CAAC;QACzB,MAAM,MAAM,CAAC,KAAK,CAAC,aAAa,CAAC,cAAc,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,EAAE,EAAE;YACzD,MAAM,IAAI,2BAAe,CAAC,uBAAuB,cAAc,KAAK,CAAC,CAAC,OAAO,EAAE,CAAC,CAAC;QACrF,CAAC,CAAC;QACF,CAAC,CAAC,SAAS,CAAC;IAGhB,MAAM,MAAM,GAAG,GAAG,CAAC,MAAM,CAAC;IAC1B,MAAM,cAAc,GAAG,OAAO,MAAM,KAAK,QAAQ,CAAC;IAClD,MAAM,SAAS,GAAG,GAAG,CAAC,UAAU,CAAC;IAEjC,IAAI,IAAY,CAAC;IACjB,IAAI,cAAc,EAAE,CAAC;QACjB,IAAI,GAAG,MAAM,CAAC,MAAM,CAAC,IAAI,MAAM,CAAC,OAAO,CAAC,IAAI,SAAS,CAAC,MAAM,CAAC,IAAI,MAAM,CAAC,aAAa,IAAI,UAAU,CAAC;IACxG,CAAC;SAAM,CAAC;QACJ,IAAI,GAAG,SAAS,CAAC,MAAM,CAAC,IAAI,MAAM,CAAC,aAAa,IAAI,UAAU,CAAC;IACnE,CAAC;IAED,MAAM,UAAU,GAAG;QACf,IAAI;QACJ,MAAM,EAAE,MAAM,CAAC,MAAM,IAAI,SAAS;QAClC,UAAU,EAAE,cAAc,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE;QACxC,IAAI,EAAE,CAAC,cAAc,CAAC,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,SAAS;QAC1C,IAAI,EAAE,IAAI,EAAE,EAAE;QACd,MAAM,EAAE,4BAAmB,CAAC,SAAS;QACrC,mBAAmB,EAAE;YACjB,EAAE,EAAE,GAAG,CAAC,EAAE;YACV,IAAI,EAAE,IAAI,IAAI,EAAE,CAAC,WAAW,EAAE;YAC9B,KAAK,EAAE,GAAG,CAAC,OAAO;YAClB,MAAM,EAAE,c
AAc,CAAC,CAAC,CAAC,YAAY,CAAC,CAAC,CAAC,MAAM;SACjD;KACJ,CAAC;IAEF,+BAA+B;IAC/B,IAAI,MAAM,GAAY,KAAK,CAAC;IAC5B,IAAI,GAAG,GAAG,SAAS,CAAC;IACpB,IAAI,MAAM,CAAC,kBAAkB,EAAE,CAAC;QAC5B,cAAG,CAAC,IAAI,CAAC,8BAA8B,MAAM,CAAC,kBAAkB,EAAE,CAAC,CAAC;QACpE,GAAG,GAAG,MAAM,MAAM,CAAC,OAAO,CAAC,MAAM,CAAC,MAAM,CAAC,kBAAkB,EAAE,UAAU,CAAC,CAAC;IAC7E,CAAC;SAAM,CAAC;QACJ,cAAG,CAAC,IAAI,CAAC,iCAAiC,cAAc,EAAE,CAAC,CAAC;QAC5D,GAAG,GAAG,MAAM,MAAM,CAAC,OAAO,CAAC,MAAM,CAAC,UAAU,CAAC,CAAC;QAC9C,MAAM,GAAG,IAAI,CAAC;IAClB,CAAC;IAED,cAAG,CAAC,IAAI,CAAC,YAAY,cAAc,GAAG,GAAG,GAAG,GAAG,CAAC,EAAE,IAAI,GAAG,CAAC,IAAI,KAAK,MAAM,CAAC,CAAC,CAAC,SAAS,CAAC,CAAC,CAAC,SAAS,EAAE,CAAC,CAAC;IACrG,OAAO,EAAE,EAAE,EAAE,GAAG,CAAC,EAAE,EAAE,KAAK,EAAE,MAAM,EAAE,IAAI,EAAE,IAAI,EAAE,CAAA;AACpD,CAAC"}
|
@@ -0,0 +1,18 @@
|
|
1
|
+
"use strict";
|
2
|
+
Object.defineProperty(exports, "__esModule", { value: true });
|
3
|
+
exports.updateDocumentFromInteractionRun = updateDocumentFromInteractionRun;
|
4
|
+
const ActivityContext_js_1 = require("../../dsl/setup/ActivityContext.js");
|
5
|
+
const errors_js_1 = require("../../errors.js");
|
6
|
+
/**
 * Applies the result of an interaction run to the target document.
 *
 * The payload is resolved through `setupActivity` into `params`, `client`
 * and `objectId`; `params.run.result` is then sent as-is to
 * `client.objects.update(objectId, ...)`.
 *
 * @param payload activity payload handed to `setupActivity`.
 * @returns `{ status: "success" }` after the update call resolves, or
 * `{ status: "failed", error: "no-props" }` when the run carries no result.
 * @throws ActivityParamNotFound when `params.run` is missing.
 */
async function updateDocumentFromInteractionRun(payload) {
    const context = await (0, ActivityContext_js_1.setupActivity)(payload);
    const run = context.params.run;
    if (!run) {
        throw new errors_js_1.ActivityParamNotFound("run", payload.activity);
    }
    const properties = run.result;
    if (properties) {
        await context.client.objects.update(context.objectId, properties);
        return { status: "success" };
    }
    // Nothing to write: the run produced no result.
    return { status: "failed", error: "no-props" };
}
|
18
|
+
//# sourceMappingURL=updateDocumentFromInteractionRun.js.map
|
@@ -0,0 +1 @@
|
|
1
|
+
{"version":3,"file":"updateDocumentFromInteractionRun.js","sourceRoot":"","sources":["../../../../src/activities/advanced/updateDocumentFromInteractionRun.ts"],"names":[],"mappings":";;AAiBA,4EAgBC;AAhCD,2EAAmE;AACnE,+CAAwD;AAejD,KAAK,UAAU,gCAAgC,CAAC,OAAoC;IACvF,MAAM,EAAE,MAAM,EAAE,MAAM,EAAE,QAAQ,EAAE,GAAG,MAAM,IAAA,kCAAa,EAAyC,OAAO,CAAC,CAAC;IAE1G,IAAI,CAAC,MAAM,CAAC,GAAG,EAAE,CAAC;QACd,MAAM,IAAI,iCAAqB,CAAC,KAAK,EAAE,OAAO,CAAC,QAAQ,CAAC,CAAC;IAC7D,CAAC;IAED,MAAM,QAAQ,GAAG,MAAM,CAAC,GAAG,CAAC,MAAM,CAAC;IAEnC,IAAI,CAAC,QAAQ,EAAE,CAAC;QACZ,OAAO,EAAE,MAAM,EAAE,QAAQ,EAAE,KAAK,EAAE,UAAU,EAAE,CAAC;IACnD,CAAC;IAED,MAAM,MAAM,CAAC,OAAO,CAAC,MAAM,CAAC,QAAQ,EAAE,QAAQ,CAAC,CAAC;IAEhD,OAAO,EAAE,MAAM,EAAE,SAAS,EAAE,CAAC;AACjC,CAAC"}
|
@@ -0,0 +1,79 @@
|
|
1
|
+
"use strict";
|
2
|
+
Object.defineProperty(exports, "__esModule", { value: true });
|
3
|
+
exports.chunkDocument = chunkDocument;
|
4
|
+
const activity_1 = require("@temporalio/activity");
|
5
|
+
const ActivityContext_js_1 = require("../dsl/setup/ActivityContext.js");
|
6
|
+
const executeInteraction_js_1 = require("./executeInteraction.js");
|
7
|
+
// Interaction used for chunking when `params.interactionName` is not provided.
const INT_CHUNK_DOCUMENT = "sys:ChunkDocument";
/**
 * Builds the location of a document part as `<base>/<documentName>/<partType>`.
 * A "/" is inserted after the base only when the base does not already end
 * with one, so the name/type suffix is appended exactly once.
 */
function buildPartLocation(baseLocation, documentName, partType) {
    const separator = baseLocation.endsWith('/') ? '' : '/';
    return baseLocation + separator + documentName + "/" + partType;
}
/**
 * Splits a document's text into parts by running a chunking interaction and
 * stores each part as a child object of the document.
 *
 * Steps performed:
 *  1. Retrieve the object (with its text) and its type; skip when the type is
 *     not flagged `is_chunkable`.
 *  2. Fail when the object has no text; skip when parts already exist for the
 *     current `text_etag` and `params.force` is not set.
 *  3. Prefix every line with a `{%<index>%}` marker and send the result as
 *     `content` to the interaction.
 *  4. Create one child object per returned part, delete the previously
 *     recorded parts, then record the new part ids and `parts_etag` on the
 *     document.
 *
 * @param payload activity payload handed to `setupActivity`.
 * @returns `{ id, status, message?, parts? }` where `status` is "skipped",
 * "failed" or "completed"; on completion `parts` holds the ids of the newly
 * created part objects.
 */
async function chunkDocument(payload) {
    const { params, client, objectId } = await (0, ActivityContext_js_1.setupActivity)(payload);
    const { force } = params;
    const interactionName = params.interactionName ?? INT_CHUNK_DOCUMENT;
    activity_1.log.info(`Object ${objectId} chunking started`);
    const document = await client.objects.retrieve(objectId, "+text");
    const type = document.type ? await client.types.retrieve(document.type.id) : undefined;
    if (!type?.is_chunkable) {
        activity_1.log.warn('Type is not chunkable for object ID: ' + objectId);
        return { id: objectId, status: "skipped", message: "type not chunkable" };
    }
    //check if text is present
    if (!document.text) {
        activity_1.log.warn('No text found for object ID: ' + objectId);
        return { id: objectId, status: "failed", message: "no text found" };
    }
    const previousParts = document.parts ?? [];
    if (!force && previousParts.length > 0 && document.parts_etag === document.text_etag) {
        activity_1.log.info('Document already chunked for object ID: ' + objectId);
        return { id: objectId, status: "skipped", message: "document already chunked with correct etag" };
    }
    //instrument the text with line numbers
    const lines = document.text.split('\n');
    const instrumented = lines.map((line, lineNumber) => `{%${lineNumber}%}${line}`).join('\n');
    const res = await (0, executeInteraction_js_1.executeInteractionFromActivity)(client, interactionName, params, {
        objectId: objectId,
        content: instrumented
    });
    // `result` may be absent on an unexpected response; treat that like "no parts".
    const parts = res.result?.parts;
    if (!parts || parts.length === 0) {
        activity_1.log.warn('No parts found for object ID: ' + objectId, res);
        return { id: objectId, status: "failed", parts: [], message: "no parts found" };
    }
    const partDocs = await Promise.all(parts.map(async (part, partIndex) => {
        // Line bounds reported by the interaction are inclusive on both ends.
        const text = lines
            .filter((_line, lineNumber) => lineNumber >= part.line_number_start && lineNumber <= part.line_number_end)
            .join('\n');
        return await client.objects.create({
            name: part.name,
            parent: objectId,
            text: text,
            location: buildPartLocation(document.location, document.name, part.type),
            properties: {
                part_number: partIndex + 1,
                etag: document.text_etag,
                source_line_start: part.line_number_start,
                source_line_end: part.line_number_end,
                title: part.name
            }
        });
    }));
    //delete previous parts
    if (previousParts.length > 0) {
        activity_1.log.info('Deleting previous parts for object ID: ' + objectId, { parts: previousParts });
        await Promise.all(previousParts.map((partId) => client.objects.delete(partId)));
    }
    const newPartIds = partDocs.map((partDoc) => partDoc.id);
    await client.objects.update(objectId, {
        parts: newPartIds,
        parts_etag: document.text_etag
    });
    // Report the ids that were just created, not the stale ones read before the update.
    activity_1.log.info(`Object ${objectId} chunking completed`, { parts: newPartIds });
    return { id: objectId, status: "completed", parts: newPartIds };
}
|
79
|
+
//# sourceMappingURL=chunkDocument.js.map
|
@@ -0,0 +1 @@
|
|
1
|
+
{"version":3,"file":"chunkDocument.js","sourceRoot":"","sources":["../../../src/activities/chunkDocument.ts"],"names":[],"mappings":";;AAkCA,sCAyFC;AA1HD,mDAA2C;AAC3C,wEAAgE;AAChE,mEAAqG;AAErG,MAAM,kBAAkB,GAAG,mBAAmB,CAAA;AA6BvC,KAAK,UAAU,aAAa,CAAC,OAAoC;IACpE,MAAM,EAAE,MAAM,EAAE,MAAM,EAAE,QAAQ,EAAE,GAAG,MAAM,IAAA,kCAAa,EAAsB,OAAO,CAAC,CAAC;IAEvF,MAAM,EAAE,KAAK,EAAE,GAAG,MAAM,CAAC;IACzB,MAAM,eAAe,GAAG,MAAM,CAAC,eAAe,IAAI,kBAAkB,CAAC;IAErE,cAAG,CAAC,IAAI,CAAC,UAAU,QAAQ,mBAAmB,CAAC,CAAC;IAEhD,MAAM,QAAQ,GAAG,MAAM,MAAM,CAAC,OAAO,CAAC,QAAQ,CAAC,QAAQ,EAAE,OAAO,CAAC,CAAC;IAElE,MAAM,IAAI,GAAG,QAAQ,CAAC,IAAI,CAAC,CAAC,CAAC,MAAM,MAAM,CAAC,KAAK,CAAC,QAAQ,CAAC,QAAQ,CAAC,IAAI,CAAC,EAAE,CAAC,CAAC,CAAC,CAAC,SAAS,CAAC;IAEvF,IAAI,CAAC,IAAI,EAAE,YAAY,EAAE,CAAC;QACtB,cAAG,CAAC,IAAI,CAAC,uCAAuC,GAAG,QAAQ,CAAC,CAAC;QAC7D,OAAO,EAAE,EAAE,EAAE,QAAQ,EAAE,MAAM,EAAE,SAAS,EAAE,OAAO,EAAE,oBAAoB,EAAE,CAAA;IAC7E,CAAC;IAED,0BAA0B;IAC1B,IAAI,CAAC,QAAQ,CAAC,IAAI,EAAE,CAAC;QACjB,cAAG,CAAC,IAAI,CAAC,+BAA+B,GAAG,QAAQ,CAAC,CAAC;QACrD,OAAO,EAAE,EAAE,EAAE,QAAQ,EAAE,MAAM,EAAE,QAAQ,EAAE,OAAO,EAAE,eAAe,EAAE,CAAA;IACvE,CAAC;IAED,IAAI,CAAC,KAAK,IAAI,QAAQ,CAAC,KAAK,IAAI,QAAQ,CAAC,KAAK,CAAC,MAAM,GAAG,CAAC,IAAI,QAAQ,CAAC,UAAU,KAAK,QAAQ,CAAC,SAAS,EAAE,CAAC;QACtG,cAAG,CAAC,IAAI,CAAC,0CAA0C,GAAG,QAAQ,CAAC,CAAC;QAChE,OAAO,EAAE,EAAE,EAAE,QAAQ,EAAE,MAAM,EAAE,SAAS,EAAE,OAAO,EAAE,4CAA4C,EAAE,CAAA;IACrG,CAAC;IAED,uCAAuC;IACvC,MAAM,KAAK,GAAG,QAAQ,CAAC,IAAI,CAAC,KAAK,CAAC,IAAI,CAAC,CAAA;IACvC,MAAM,YAAY,GAAG,KAAK,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,KAAK,CAAC,KAAK,CAAC,EAAE,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC,CAAA;IAEnE,MAAM,GAAG,GAAG,MAAM,IAAA,sDAA8B,EAAC,MAAM,EAAE,eAAe,EAAE,MAAM,EAAE;QAC9E,QAAQ,EAAE,QAAQ;QAClB,OAAO,EAAE,YAAY;KACxB,CAAC,CAAC;IAEH,MAAM,KAAK,GAAG,GAAG,CAAC,MAAM,CAAC,KAAkB,CAAC;IAC5C,IAAI,CAAC,KAAK,IAAI,KAAK,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;QAC/B,cAAG,CAAC,IAAI,CAAC,gCAAgC,GAAG,QAAQ,EAAE,GAAG,CAAC,CAAC;QAC3D,OAAO,EAAE,EAAE,EAAE,QAAQ,EAAE,MAAM,EAAE,QAAQ,EAAE,KAAK,EAAE,EAAE,EAAE,OAAO,EAAE,gBAAgB,EAAE,CAAA;IA
CnF,CAAC;IAED,MAAM,QAAQ,GAAG,MAAM,OAAO,CAAC,GAAG,CAAC,KAAK,CAAC,GAAG,CAAC,KAAK,EAAE,IAAI,EAAE,CAAC,EAAE,EAAE;QAE3D,MAAM,IAAI,GAAG,KAAK,CAAC,MAAM,CAAC,CAAC,EAAE,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,IAAI,IAAI,CAAC,iBAAiB,IAAI,CAAC,IAAI,IAAI,CAAC,eAAe,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QAE1G,MAAM,QAAQ,GAAG,GAAG,EAAE;YAClB,IAAI,QAAQ,GAAG,QAAQ,CAAC,QAAQ,CAAC;YACjC,IAAI,QAAQ,CAAC,QAAQ,CAAC,GAAG,CAAC,EAAE,CAAC;gBACzB,QAAQ,IAAI,QAAQ,CAAC,IAAI,GAAG,GAAG,GAAG,IAAI,CAAC,IAAI,CAAA;YAC/C,CAAC;YACD,QAAQ,IAAI,GAAG,GAAG,QAAQ,CAAC,IAAI,GAAG,GAAG,GAAG,IAAI,CAAC,IAAI,CAAC;YAClD,OAAO,QAAQ,CAAC;QACpB,CAAC,CAAA;QAED,MAAM,OAAO,GAAG,MAAM,MAAM,CAAC,OAAO,CAAC,MAAM,CAAC;YACxC,IAAI,EAAE,IAAI,CAAC,IAAI;YACf,MAAM,EAAE,QAAQ;YAChB,IAAI,EAAE,IAAI;YACV,QAAQ,EAAE,QAAQ,EAAE;YACpB,UAAU,EAAE;gBACR,WAAW,EAAE,CAAC,GAAG,CAAC;gBAClB,IAAI,EAAE,QAAQ,CAAC,SAAS;gBACxB,iBAAiB,EAAE,IAAI,CAAC,iBAAiB;gBACzC,eAAe,EAAE,IAAI,CAAC,eAAe;gBACrC,KAAK,EAAE,IAAI,CAAC,IAAI;aACnB;SACJ,CAAC,CAAC;QACH,OAAO,OAAO,CAAC;IACnB,CAAC,CAAC,CAAC,CAAC;IAEJ,uBAAuB;IACvB,IAAI,QAAQ,CAAC,KAAK,IAAI,QAAQ,CAAC,KAAK,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QAC9C,cAAG,CAAC,IAAI,CAAC,yCAAyC,GAAG,QAAQ,EAAE,EAAE,KAAK,EAAE,QAAQ,CAAC,KAAK,EAAE,CAAC,CAAC;QAC1F,MAAM,OAAO,CAAC,GAAG,CAAC,QAAQ,CAAC,KAAK,CAAC,GAAG,CAAC,KAAK,EAAE,MAAM,EAAE,EAAE;YAClD,MAAM,MAAM,CAAC,OAAO,CAAC,MAAM,CAAC,MAAM,CAAC,CAAC;QACxC,CAAC,CAAC,CAAC,CAAC;IACR,CAAC;IAED,MAAM,MAAM,CAAC,OAAO,CAAC,MAAM,CAAC,QAAQ,EAAE;QAClC,KAAK,EAAE,QAAQ,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,EAAE,CAAC;QAC9B,UAAU,EAAE,QAAQ,CAAC,SAAS;KACjC,CAAC,CAAC;IAEH,cAAG,CAAC,IAAI,CAAC,UAAU,QAAQ,qBAAqB,EAAE,EAAE,KAAK,EAAE,QAAQ,CAAC,KAAK,EAAE,CAAC,CAAC;IAE7E,OAAO,EAAE,EAAE,EAAE,QAAQ,EAAE,MAAM,EAAE,WAAW,EAAE,KAAK,EAAE,QAAQ,CAAC,KAAK,EAAE,CAAA;AAEvE,CAAC"}
|
@@ -0,0 +1,64 @@
|
|
1
|
+
"use strict";
|
2
|
+
// Module interop helper: reuses `this.__importDefault` when one is already
// present, otherwise defines a function that returns `mod` unchanged when it
// is flagged `__esModule` and wraps any other value as `{ default: mod }`.
var __importDefault = (this && this.__importDefault) || function (mod) {
    return (mod && mod.__esModule) ? mod : { "default": mod };
};
|
5
|
+
Object.defineProperty(exports, "__esModule", { value: true });
|
6
|
+
exports.createPdfDocumentFromSource = createPdfDocumentFromSource;
|
7
|
+
const activity_1 = require("@temporalio/activity");
|
8
|
+
const fs_1 = __importDefault(require("fs"));
|
9
|
+
const mutool_js_1 = require("../conversion/mutool.js");
|
10
|
+
const ActivityContext_js_1 = require("../dsl/setup/ActivityContext.js");
|
11
|
+
const errors_js_1 = require("../errors.js");
|
12
|
+
const blobs_js_1 = require("../utils/blobs.js");
|
13
|
+
const memory_js_1 = require("../utils/memory.js");
|
14
|
+
/**
 * Create a new PDF by extracting pages from a source PDF.
 *
 * The source object is retrieved, validated (it must have a content source
 * whose type starts with `application/pdf`), saved to a temporary file and
 * passed to `pdfExtractPages` together with `params.pages`. The extracted
 * file is uploaded and a new object of type `params.target_object_type` is
 * created as a child of the source object.
 *
 * @param payload activity payload handed to `setupActivity`; `params` is read
 * for `pages`, `filename`, `title` and `target_object_type`.
 * @returns `{ newObjectId, uploadedFile }`: the id of the created object and
 * the name of the uploaded file.
 * @throws Error when no pages are provided.
 * @throws NoDocumentFound when the source object is missing, has no source,
 * is not a PDF, or when the target type cannot be found.
 */
async function createPdfDocumentFromSource(payload) {
    const { client, objectId, params } = await (0, ActivityContext_js_1.setupActivity)(payload);
    const inputObject = await client.objects.retrieve(objectId);
    const { pages, filename, title } = params;
    activity_1.log.info(`Creating PDF from source`, { objectId, pages, filename, title });
    if (!pages || pages.length === 0) {
        activity_1.log.error(`No pages provided`);
        throw new Error(`No pages provided`);
    }
    if (!inputObject) {
        activity_1.log.error(`Document ${objectId} not found`);
        throw new errors_js_1.NoDocumentFound(`Document ${objectId} not found`, [objectId]);
    }
    if (!inputObject.content?.source) {
        activity_1.log.error(`Document ${objectId} has no source`);
        throw new errors_js_1.NoDocumentFound(`Document ${objectId} has no source`, [objectId]);
    }
    // Only PDF sources are accepted; a missing type is rejected as well.
    if (!inputObject.content.type?.startsWith('application/pdf')) {
        activity_1.log.error(`Document ${objectId} is not a PDF`);
        throw new errors_js_1.NoDocumentFound(`Document ${objectId} is not a PDF: ${inputObject.content.type}`, [objectId]);
    }
    const targetType = await client.types.getTypeByName(params.target_object_type);
    if (!targetType) {
        activity_1.log.error(`Type ${params.target_object_type} not found`);
        throw new errors_js_1.NoDocumentFound(`Type ${params.target_object_type} not found`);
    }
    // NOTE(review): neither `tmpFile` nor `newPdf` is removed here; confirm
    // whether the helpers or the worker environment clean them up.
    const tmpFile = await (0, blobs_js_1.saveBlobToTempFile)(client, inputObject.content.source, ".pdf");
    const newPdf = await (0, mutool_js_1.pdfExtractPages)(tmpFile, pages);
    activity_1.log.info(`PDF created from pages ${pages.join(', ')} `, { newPdf });
    const name = `pages-${pages.join('-')}.pdf`;
    const sourceToUpload = new memory_js_1.NodeStreamSource(fs_1.default.createReadStream(newPdf), name, "application/pdf");
    activity_1.log.info(`Uploading file ${newPdf} `);
    const upload = await client.objects.upload(sourceToUpload);
    activity_1.log.info(`File uploaded ${upload.source} `);
    const newObject = await client.objects.create({
        type: targetType.id,
        // Fall back to the target type's name when no title was provided.
        name: title || targetType.name,
        parent: objectId,
        content: {
            source: upload.source,
            name: upload.name,
            type: 'application/pdf'
        }
    });
    return { newObjectId: newObject.id, uploadedFile: upload.name };
}
|
64
|
+
//# sourceMappingURL=createDocumentFromOther.js.map
|
@@ -0,0 +1 @@
|
|
1
|
+
{"version":3,"file":"createDocumentFromOther.js","sourceRoot":"","sources":["../../../src/activities/createDocumentFromOther.ts"],"names":[],"mappings":";;;;;AA6BA,kEA8DC;AA1FD,mDAA2C;AAC3C,4CAAoB;AACpB,uDAA0D;AAC1D,wEAAgE;AAChE,4CAA+C;AAC/C,gDAAuD;AACvD,kDAAsD;AAkBtD;;;GAGG;AACI,KAAK,UAAU,2BAA2B,CAAC,OAAoC;IAClF,MAAM,EAAE,MAAM,EAAE,QAAQ,EAAE,MAAM,EAAE,GAAG,MAAM,IAAA,kCAAa,EAAoC,OAAO,CAAC,CAAC;IACrG,MAAM,WAAW,GAAG,MAAM,MAAM,CAAC,OAAO,CAAC,QAAQ,CAAC,QAAQ,CAAC,CAAC;IAE5D,MAAM,EAAE,KAAK,EAAE,QAAQ,EAAE,KAAK,EAAE,GAAG,MAAM,CAAC;IAC1C,cAAG,CAAC,IAAI,CAAC,0BAA0B,EAAE,EAAE,QAAQ,EAAE,KAAK,EAAE,QAAQ,EAAE,KAAK,EAAE,CAAC,CAAC;IAE3E,IAAI,CAAC,KAAK,IAAI,KAAK,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;QAC/B,cAAG,CAAC,KAAK,CAAC,mBAAmB,CAAC,CAAC;QAC/B,MAAM,IAAI,KAAK,CAAC,mBAAmB,CAAC,CAAC;IACzC,CAAC;IAED,IAAI,CAAC,WAAW,EAAE,CAAC;QACf,cAAG,CAAC,KAAK,CAAC,YAAY,QAAQ,YAAY,CAAC,CAAC;QAC5C,MAAM,IAAI,2BAAe,CAAC,YAAY,QAAQ,YAAY,EAAE,CAAC,QAAQ,CAAC,CAAC,CAAC;IAC5E,CAAC;IAED,IAAI,CAAC,WAAW,CAAC,OAAO,EAAE,MAAM,EAAE,CAAC;QAC/B,cAAG,CAAC,KAAK,CAAC,YAAY,QAAQ,gBAAgB,CAAC,CAAC;QAChD,MAAM,IAAI,2BAAe,CAAC,YAAY,QAAQ,gBAAgB,EAAE,CAAC,QAAQ,CAAC,CAAC,CAAC;IAChF,CAAC;IAED,IAAI,CAAC,WAAW,CAAC,OAAO,CAAC,IAAI,IAAI,CAAC,CAAC,WAAW,CAAC,OAAO,CAAC,IAAI,EAAE,UAAU,CAAC,iBAAiB,CAAC,CAAC,EAAE,CAAC;QAC1F,cAAG,CAAC,KAAK,CAAC,YAAY,QAAQ,kBAAkB,CAAC,CAAC;QAClD,MAAM,IAAI,2BAAe,CAAC,YAAY,QAAQ,4BAA4B,WAAW,CAAC,OAAO,CAAC,IAAI,EAAE,EAAE,CAAC,QAAQ,CAAC,CAAC,CAAC;IACtH,CAAC;IAED,MAAM,UAAU,GAAG,MAAM,MAAM,CAAC,KAAK,CAAC,aAAa,CAAC,MAAM,CAAC,kBAAkB,CAAC,CAAC;IAC/E,IAAI,CAAC,UAAU,EAAE,CAAC;QACd,cAAG,CAAC,KAAK,CAAC,QAAQ,MAAM,CAAC,kBAAkB,YAAY,CAAC,CAAC;QACzD,MAAM,IAAI,2BAAe,CAAC,QAAQ,MAAM,CAAC,kBAAkB,YAAY,CAAC,CAAC;IAC7E,CAAC;IAED,MAAM,OAAO,GAAG,MAAM,IAAA,6BAAkB,EAAC,MAAM,EAAE,WAAW,CAAC,OAAO,CAAC,MAAM,EAAE,MAAM,CAAC,CAAC;IACrF,MAAM,MAAM,GAAG,MAAM,IAAA,2BAAe,EAAC,OAAO,EAAE,KAAK,CAAC,CAAC;IACrD,cAAG,CAAC,IAAI,CAAC,0BAA0B,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,GAAG,EAAE,EAAE,MAAM,EAAE,CAAC,CAAC;IACpE,MAAM,IAAI,GAAG,SAAS,KAAK,CAAC,IAAI,CAAC,GAAG,CAAC,MAAM,CAAC;I
AE5C,MAAM,cAAc,GAAG,IAAI,4BAAgB,CACvC,YAAE,CAAC,gBAAgB,CAAC,MAAM,CAAC,EAC3B,IAAI,EACJ,iBAAiB,CACpB,CAAA;IAED,cAAG,CAAC,IAAI,CAAC,kBAAkB,MAAM,GAAG,CAAC,CAAC;IACtC,MAAM,MAAM,GAAG,MAAM,MAAM,CAAC,OAAO,CAAC,MAAM,CAAC,cAAc,CAAC,CAAC;IAC3D,cAAG,CAAC,IAAI,CAAC,iBAAiB,MAAM,CAAC,MAAM,GAAG,CAAC,CAAC;IAE5C,MAAM,SAAS,GAAG,MAAM,MAAM,CAAC,OAAO,CAAC,MAAM,CAAC;QAC1C,IAAI,EAAE,UAAU,CAAC,EAAE;QACnB,IAAI,EAAE,KAAK,IAAI,UAAU,CAAC,IAAI;QAC9B,MAAM,EAAE,QAAQ;QAChB,OAAO,EAAE;YACL,MAAM,EAAE,MAAM,CAAC,MAAM;YACrB,IAAI,EAAE,MAAM,CAAC,IAAI;YACjB,IAAI,EAAE,iBAAiB;SAC1B;KACJ,CAAC,CAAC;IAEH,OAAO,EAAE,WAAW,EAAE,SAAS,CAAC,EAAE,EAAE,YAAY,EAAE,MAAM,CAAC,IAAI,EAAE,CAAC;AAGpE,CAAC"}
|
@@ -0,0 +1,135 @@
|
|
1
|
+
"use strict";
|
2
|
+
Object.defineProperty(exports, "__esModule", { value: true });
|
3
|
+
exports.executeInteraction = executeInteraction;
|
4
|
+
exports.executeInteractionFromActivity = executeInteractionFromActivity;
|
5
|
+
const common_1 = require("@vertesia/common");
|
6
|
+
const activity_1 = require("@temporalio/activity");
|
7
|
+
const projections_js_1 = require("../dsl/projections.js");
|
8
|
+
const ActivityContext_js_1 = require("../dsl/setup/ActivityContext.js");
|
9
|
+
const tokens_js_1 = require("../utils/tokens.js");
|
10
|
+
// Example of an activity definition for `executeInteraction`.
// It is not referenced by the functions in this module. Note that this
// module-level binding shadows the global `JSON` object for the whole file.
// The "${...}" values are ordinary double-quoted strings, not template
// literals; presumably they are placeholders resolved by the workflow DSL
// (TODO confirm).
//@ts-ignore
const JSON = {
    name: 'executeInteraction',
    // Names listed for import; they line up with the "${...}" references used below.
    import: ["defaultModel", "guidlineId", "docTypeId"],
    params: {
        defaultModel: "${model}",
        interactionName: "GenerateSummary",
        model: "${defaultModel ?? 'gpt4'}",
        environment: "13456",
        max_tokens: 100,
        temperature: 0.5,
        tags: ["test"],
        result_schema: "${docType.object_schema}",
        prompt_data: {
            documents: "${documents}",
            guidline: "${guidline.text}"
        }
    },
    // Named fetch entries; the keys match the names referenced from `params`
    // (`documents`, `guidline`, `docType`).
    fetch: {
        documents: {
            type: "document",
            query: {
                id: { $in: "${objectIds}" },
            },
            select: "+text",
        },
        guidline: {
            type: "document",
            limit: 1,
            query: {
                id: "${guidlineId}",
            },
            select: "+text",
            on_not_found: "throw"
        },
        docType: {
            type: "document_type",
            limit: 1,
            query: {
                id: "${docTypeId}",
            },
            select: "+object_schema",
        }
    }
};
|
56
|
+
/**
 * Activity entry point that runs an interaction and projects its outcome.
 *
 * When `params.truncate` is set, every `[key, value]` entry in it replaces
 * `prompt_data[key]` with `truncByMaxTokens(prompt_data[key], value)` before
 * the interaction is executed (the `prompt_data` object is modified in place).
 *
 * @param payload activity payload handed to `setupActivity`; its `debug_mode`
 * flag is forwarded to `executeInteractionFromActivity`.
 * @returns whatever `projectResult` returns for the run; it receives the
 * payload, the params, the run and a `{ runId, status, result }` summary.
 */
async function executeInteraction(payload) {
    const activity = await (0, ActivityContext_js_1.setupActivity)(payload);
    const params = activity.params;
    const interactionName = params.interactionName;
    const promptData = params.prompt_data;
    const limits = params.truncate;
    if (limits) {
        Object.entries(limits).forEach(([field, maxTokens]) => {
            promptData[field] = (0, tokens_js_1.truncByMaxTokens)(promptData[field], maxTokens);
        });
    }
    const run = await executeInteractionFromActivity(activity.client, interactionName, params, promptData, payload.debug_mode);
    const summary = {
        runId: run.id,
        status: run.status,
        result: run.result,
    };
    return (0, projections_js_1.projectResult)(payload, params, run, summary);
}
|
72
|
+
/**
 * Executes an interaction by name from within an activity.
 *
 * The run is tagged with "workflow", `tmpRunId:<workflow run id>` and any
 * tags from `params.tags`. When `params.include_previous_error` is set and
 * this is a retry (`attempt > 1`), the first run found for the same
 * `tmpRunId` tag is retrieved and its `error` is passed to the interaction as
 * `previous_error` in the prompt data.
 *
 * @param client client exposing `runs.search`, `runs.retrieve` and
 * `interactions.executeByName`.
 * @param interactionName name of the interaction to execute.
 * @param params activity params; read for `tags`, `include_previous_error`,
 * `environment`, `model`, `max_tokens`, `temperature` and `result_schema`.
 * @param prompt_data data spread into the interaction input.
 * @param debug when truthy, extra details are logged before and after the call.
 * @returns the run returned by `executeByName`.
 * @throws Error when the call fails, or when the run carries an `error` or
 * has the failed status; the underlying error is attached as `cause`.
 */
async function executeInteractionFromActivity(client, interactionName, params, prompt_data, debug) {
    const userTags = params.tags;
    const info = (0, activity_1.activityInfo)();
    const runTag = `tmpRunId:${info.workflowExecution.runId}`;
    let tags = ["workflow", runTag]; //TODO use wf:wfName
    if (userTags) {
        tags = tags.concat(userTags);
    }
    let previousStudioExecutionRun = undefined;
    //retrieve last failed run if any
    if (params.include_previous_error && info.attempt > 1) {
        activity_1.log.info("Retrying, searching for previous run", { tags: [runTag] });
        const searchResults = await client.runs.search({
            query: { tags: [runTag] },
            limit: 1,
        });
        activity_1.log.info("Search results", { results: searchResults });
        const previousRun = searchResults?.[0];
        if (previousRun) {
            activity_1.log.info("Found previous run", { previousRun });
            previousStudioExecutionRun = await client.runs.retrieve(previousRun.id);
        }
    }
    if (debug && previousStudioExecutionRun?.error) {
        activity_1.log.info(`Found previous run error`, { error: previousStudioExecutionRun?.error });
    }
    const config = {
        environment: params.environment,
        model: params.model,
        max_tokens: params.max_tokens,
        temperature: params.temperature
    };
    const data = {
        ...prompt_data,
        previous_error: previousStudioExecutionRun?.error,
    };
    const result_schema = params.result_schema;
    if (debug) {
        activity_1.log.info(`About to execute interaction ${interactionName}`, { config, data, result_schema, tags });
    }
    let res;
    try {
        res = await client.interactions.executeByName(interactionName, {
            config,
            data,
            result_schema,
            tags,
            stream: false,
        });
    }
    catch (err) {
        activity_1.log.error(`Error executing interaction ${interactionName}`, { err });
        // Keep the original failure reachable through `cause` instead of dropping it.
        throw new Error(`Interaction Execution failed ${interactionName}: ${err?.message ?? err}`, { cause: err });
    }
    if (debug) {
        activity_1.log.info(`Interaction executed ${interactionName}`, res);
    }
    if (res.error || res.status === common_1.ExecutionRunStatus.failed) {
        activity_1.log.error(`Error executing interaction ${interactionName}`, { error: res.error });
        throw new Error(`Interaction Execution failed ${interactionName}: ${res.error}`, { cause: res.error });
    }
    return res;
}
|
135
|
+
//# sourceMappingURL=executeInteraction.js.map
|
@@ -0,0 +1 @@
|
|
1
|
+
{"version":3,"file":"executeInteraction.js","sourceRoot":"","sources":["../../../src/activities/executeInteraction.ts"],"names":[],"mappings":";;AA+FA,gDAsBC;AAED,wEAuEC;AA7LD,6CAAuK;AACvK,mDAAyD;AACzD,0DAAsD;AACtD,wEAAgE;AAChE,kDAAoE;AAGpE,UAAU;AACV,YAAY;AACZ,MAAM,IAAI,GAAoB;IAC1B,IAAI,EAAE,oBAAoB;IAC1B,MAAM,EAAE,CAAC,cAAc,EAAE,YAAY,EAAE,WAAW,CAAC;IACnD,MAAM,EAAE;QACJ,YAAY,EAAE,UAAU;QACxB,eAAe,EAAE,iBAAiB;QAClC,KAAK,EAAE,2BAA2B;QAClC,WAAW,EAAE,OAAO;QACpB,UAAU,EAAE,GAAG;QACf,WAAW,EAAE,GAAG;QAChB,IAAI,EAAE,CAAC,MAAM,CAAC;QACd,aAAa,EAAE,0BAA0B;QACzC,WAAW,EAAE;YACT,SAAS,EAAE,cAAc;YACzB,QAAQ,EAAE,kBAAkB;SAC/B;KACJ;IACD,KAAK,EAAE;QACH,SAAS,EAAE;YACP,IAAI,EAAE,UAAU;YAChB,KAAK,EAAE;gBACH,EAAE,EAAE,EAAE,GAAG,EAAE,cAAc,EAAE;aAC9B;YACD,MAAM,EAAE,OAAO;SAClB;QACD,QAAQ,EAAE;YACN,IAAI,EAAE,UAAU;YAChB,KAAK,EAAE,CAAC;YACR,KAAK,EAAE;gBACH,EAAE,EAAE,eAAe;aACtB;YACD,MAAM,EAAE,OAAO;YACf,YAAY,EAAE,OAAO;SACxB;QACD,OAAO,EAAE;YACL,IAAI,EAAE,eAAe;YACrB,KAAK,EAAE,CAAC;YACR,KAAK,EAAE;gBACH,EAAE,EAAE,cAAc;aACrB;YACD,MAAM,EAAE,gBAAgB;SAC3B;KACJ;CACJ,CAAA;AA0CM,KAAK,UAAU,kBAAkB,CAAC,OAAoC;IACzE,MAAM,EACF,MAAM,EAAE,MAAM,EACjB,GAAG,MAAM,IAAA,kCAAa,EAA2B,OAAO,CAAC,CAAC;IAE3D,MAAM,EAAE,eAAe,EAAE,WAAW,EAAE,GAAG,MAAM,CAAC;IAEhD,IAAI,MAAM,CAAC,QAAQ,EAAE,CAAC;QAClB,MAAM,QAAQ,GAAG,MAAM,CAAC,QAAQ,CAAC;QACjC,KAAK,MAAM,CAAC,GAAG,EAAE,KAAK,CAAC,IAAI,MAAM,CAAC,OAAO,CAAC,QAAQ,CAAC,EAAE,CAAC;YAClD,WAAW,CAAC,GAAG,CAAC,GAAG,IAAA,4BAAgB,EAAC,WAAW,CAAC,GAAG,CAAC,EAAE,KAAK,CAAC,CAAC;QACjE,CAAC;IACL,CAAC;IAED,MAAM,GAAG,GAAG,MAAM,8BAA8B,CAAC,MAAM,EAAE,eAAe,EAAE,MAAM,EAAE,WAAW,EAAE,OAAO,CAAC,UAAU,CAAC,CAAC;IAEnH,OAAO,IAAA,8BAAa,EAAC,OAAO,EAAE,MAAM,EAAE,GAAG,EAAE;QACvC,KAAK,EAAE,GAAG,CAAC,EAAE;QACb,MAAM,EAAE,GAAG,CAAC,MAAM;QAClB,MAAM,EAAE,GAAG,CAAC,MAAM;KACrB,CAAC,CAAC;AAEP,CAAC;AAEM,KAAK,UAAU,8BAA8B,CAAC,MAAwB,EAAE,eAAuB,EAAE,MAAkC,EAAE,WAAgB,EAAE,KAAe;IACzK,MAAM,QAAQ,GAAG,MAAM,CAAC,IAAI,CAAC;IAC7B,MAAM,IAAI,GAAG,IAAA,uBAAY,GAAE,CAAC;IAC5B,MAAM,KAAK,GAAG,IAAI,CAAC,iBAAiB,CAAC,KAAK,CAAC;IAC3C,IAAI,IAAI,GAAG,CAAC,UAAU,EA
AE,YAAY,KAAK,EAAE,CAAC,CAAC,CAAC,oBAAoB;IAClE,IAAI,QAAQ,EAAE,CAAC;QACX,IAAI,GAAG,IAAI,CAAC,MAAM,CAAC,QAAQ,CAAC,CAAC;IACjC,CAAC;IAED,IAAI,0BAA0B,GAA6B,SAAS,CAAC;IACrE,IAAI,MAAM,CAAC,sBAAsB,EAAE,CAAC;QAChC,iCAAiC;QACjC,IAAI,IAAI,CAAC,OAAO,GAAG,CAAC,EAAE,CAAC;YACnB,cAAG,CAAC,IAAI,CAAC,sCAAsC,EAAE,EAAE,IAAI,EAAE,CAAC,WAAW,GAAG,KAAK,CAAC,EAAE,CAAC,CAAC;YAClF,MAAM,OAAO,GAAqB;gBAC9B,KAAK,EAAE,EAAE,IAAI,EAAE,CAAC,WAAW,GAAG,IAAI,CAAC,iBAAiB,CAAC,KAAK,CAAC,EAAE;gBAC7D,KAAK,EAAE,CAAC;aACX,CAAC;YACF,MAAM,WAAW,GAAG,MAAM,MAAM,CAAC,IAAI,CAAC,MAAM,CAAC,OAAO,CAAC,CAAC,IAAI,CAAC,CAAC,GAAG,EAAE,EAAE;gBAC/D,cAAG,CAAC,IAAI,CAAC,gBAAgB,EAAE,EAAE,OAAO,EAAE,GAAG,EAAE,CAAC,CAAC;gBAC7C,OAAO,GAAG,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,IAAI,SAAS,CAAC,CAAC,CAAC,SAAS,CAAA;YAChD,CAAC,CAAC,CAAC;YAEH,IAAI,WAAW,EAAE,CAAC;gBACd,cAAG,CAAC,IAAI,CAAC,oBAAoB,EAAE,EAAE,WAAW,EAAE,CAAC,CAAC;gBAChD,0BAA0B,GAAG,MAAM,MAAM,CAAC,IAAI,CAAC,QAAQ,CAAC,WAAW,CAAC,EAAE,CAAC,CAAC;YAC5E,CAAC;QACL,CAAC;IACL,CAAC;IACD,IAAI,KAAK,IAAI,0BAA0B,EAAE,KAAK,EAAE,CAAC;QAC7C,cAAG,CAAC,IAAI,CAAC,2BAA2B,EAAE,EAAE,KAAK,EAAE,0BAA0B,EAAE,KAAK,EAAE,CAAC,CAAC;IACxF,CAAC;IAED,MAAM,MAAM,GAAsC;QAC9C,WAAW,EAAE,MAAM,CAAC,WAAW;QAC/B,KAAK,EAAE,MAAM,CAAC,KAAK;QACnB,UAAU,EAAE,MAAM,CAAC,UAAU;QAC7B,WAAW,EAAE,MAAM,CAAC,WAAW;KAClC,CAAA;IACD,MAAM,IAAI,GAAG;QACT,GAAG,WAAW;QACd,cAAc,EAAE,0BAA0B,EAAE,KAAK;KACpD,CAAA;IAED,MAAM,aAAa,GAAG,MAAM,CAAC,aAAa,CAAC;IAE3C,IAAI,KAAK,EAAE,CAAC;QACR,cAAG,CAAC,IAAI,CAAC,gCAAgC,eAAe,EAAE,EAAE,EAAE,MAAM,EAAE,IAAI,EAAE,aAAa,EAAE,IAAI,EAAE,CAAC,CAAC;IACvG,CAAC;IAED,MAAM,GAAG,GAAG,MAAM,MAAM,CAAC,YAAY,CAAC,aAAa,CAAC,eAAe,EAAE;QACjE,MAAM;QACN,IAAI;QACJ,aAAa;QACb,IAAI;QACJ,MAAM,EAAE,KAAK;KAChB,CAAC,CAAC,KAAK,CAAC,CAAC,GAAG,EAAE,EAAE;QACb,cAAG,CAAC,KAAK,CAAC,+BAA+B,eAAe,EAAE,EAAE,EAAE,GAAG,EAAE,CAAC,CAAC;QACrE,MAAM,IAAI,KAAK,CAAC,gCAAgC,eAAe,KAAK,GAAG,CAAC,OAAO,EAAE,CAAC,CAAC;IACvF,CAAC,CAAC,CAAC;IAEH,IAAI,KAAK,EAAE,CAAC;QACR,cAAG,CAAC,IAAI,CAAC,wBAAwB,eAAe,EAAE,EAAE,GAAG,CAAC,CAAC;IAC7D,CAAC;IAED,IAAI,GAAG,CAAC,KAAK,IAAI,GAAG,CAAC,
MAAM,KAAK,2BAAkB,CAAC,MAAM,EAAE,CAAC;QACxD,cAAG,CAAC,KAAK,CAAC,+BAA+B,eAAe,EAAE,EAAE,EAAE,KAAK,EAAE,GAAG,CAAC,KAAK,EAAE,CAAC,CAAC;QAClF,MAAM,IAAI,KAAK,CAAC,gCAAgC,eAAe,KAAK,GAAG,CAAC,KAAK,EAAE,CAAC,CAAC;IACrF,CAAC;IAED,OAAO,GAAG,CAAC;AACf,CAAC"}
|
@@ -0,0 +1,140 @@
|
|
1
|
+
"use strict";
|
2
|
+
Object.defineProperty(exports, "__esModule", { value: true });
|
3
|
+
exports.extractDocumentText = extractDocumentText;
|
4
|
+
const activity_1 = require("@temporalio/activity");
|
5
|
+
const mutool_js_1 = require("../conversion/mutool.js");
|
6
|
+
const pandoc_js_1 = require("../conversion/pandoc.js");
|
7
|
+
const pdf_js_1 = require("../conversion/pdf.js");
|
8
|
+
const ActivityContext_js_1 = require("../dsl/setup/ActivityContext.js");
|
9
|
+
const errors_js_1 = require("../errors.js");
|
10
|
+
const result_types_js_1 = require("../result-types.js");
|
11
|
+
const blobs_js_1 = require("../utils/blobs.js");
|
12
|
+
const tokens_js_1 = require("../utils/tokens.js");
|
13
|
+
// Minimal activity descriptor carrying only the activity name. It is not
// referenced by the functions in this module, and this module-level binding
// shadows the global `JSON` object for the whole file.
//@ts-ignore
const JSON = {
    name: 'extractDocumentText',
};
|
17
|
+
/**
 * Extracts the text of a document from its content source and stores it,
 * together with token data and an etag, on the object.
 *
 * Behaviour by case:
 *  - no content type or source: "skipped" when text is already present,
 *    "error" otherwise;
 *  - text present and `text_etag` equal to the content etag: "skipped";
 *  - the source cannot be fetched: "error" with the failure message;
 *  - PDF: converted with `mutoolPdfToText` above 2MB, `trasformPdfToMarkdown`
 *    otherwise; docx/html/odt/rtf: converted with `manyToMarkdown`;
 *  - plain text, markdown, csv, typescript, javascript, json: decoded as UTF-8;
 *  - any other type: decoded as UTF-8 when `sniffIfText` accepts the buffer,
 *    "skipped" otherwise.
 *
 * @param payload activity payload handed to `setupActivity`.
 * @returns the object built by `createResponse`; on success its `tokens`
 * field carries the token data that was just computed and stored.
 * @throws NoDocumentFound when no object matches `objectId`.
 */
async function extractDocumentText(payload) {
    const { client, objectId } = await (0, ActivityContext_js_1.setupActivity)(payload);
    const r = await client.objects.find({
        query: { _id: objectId },
        limit: 1,
        select: "+text"
    });
    const doc = r[0];
    if (!doc) {
        activity_1.log.error(`Document ${objectId} not found`);
        throw new errors_js_1.NoDocumentFound(`Document ${objectId} not found`, payload.objectIds);
    }
    activity_1.log.info(`Extracting text for object ${doc.id}`);
    if (!doc.content?.type || !doc.content?.source) {
        return doc.text
            ? createResponse(doc, doc.text, result_types_js_1.TextExtractionStatus.skipped, "Text present and no source or type")
            : createResponse(doc, "", result_types_js_1.TextExtractionStatus.error, "No source or type found");
    }
    //skip if text already extracted and proper etag
    if (doc.text && doc.text.length > 0 && doc.text_etag === doc.content.etag) {
        return createResponse(doc, doc.text, result_types_js_1.TextExtractionStatus.skipped, "Text already extracted");
    }
    let fileBuffer;
    try {
        fileBuffer = await (0, blobs_js_1.fetchBlobAsBuffer)(client, doc.content.source);
    }
    catch (e) {
        activity_1.log.error(`Error reading file: ${e}`);
        // The rejection value is not guaranteed to be an Error instance.
        const reason = e instanceof Error ? e.message : String(e);
        return createResponse(doc, "", result_types_js_1.TextExtractionStatus.error, reason);
    }
    let txt;
    switch (doc.content.type) {
        case 'application/pdf':
            //if pdf is more than 2MB, use mutool
            if (fileBuffer.length > 2 * 1024 * 1024) {
                txt = await (0, mutool_js_1.mutoolPdfToText)(fileBuffer);
            }
            else {
                txt = await (0, pdf_js_1.trasformPdfToMarkdown)(fileBuffer);
            }
            break;
        //docx
        case 'application/vnd.openxmlformats-officedocument.wordprocessingml.document':
            txt = await (0, pandoc_js_1.manyToMarkdown)(fileBuffer, 'docx');
            break;
        //html
        case 'text/html':
            txt = await (0, pandoc_js_1.manyToMarkdown)(fileBuffer, 'html');
            break;
        //opendocument
        case 'application/vnd.oasis.opendocument.text':
            txt = await (0, pandoc_js_1.manyToMarkdown)(fileBuffer, 'odt');
            break;
        //rtf
        case 'application/rtf':
            txt = await (0, pandoc_js_1.manyToMarkdown)(fileBuffer, 'rtf');
            break;
        //formats that are already text: decode as-is
        case 'text/plain':
        case 'text/markdown':
        case 'text/csv':
        case 'application/typescript':
        case 'application/javascript':
        case 'application/json':
            txt = fileBuffer.toString('utf8');
            break;
        default:
            if (sniffIfText(fileBuffer)) {
                txt = fileBuffer.toString('utf8'); //TODO: add charset detection
                break;
            }
            return createResponse(doc, doc.text ?? '', result_types_js_1.TextExtractionStatus.skipped, `Unsupported mime type: ${doc.content.type}`);
    }
    const tokensData = (0, tokens_js_1.countTokens)(txt);
    // Fall back to a hash of the extracted text when the content has no etag.
    const etag = doc.content.etag ?? (0, blobs_js_1.md5)(txt);
    const updateData = {
        text: txt,
        text_etag: etag,
        tokens: {
            ...tokensData,
            etag: etag,
        }
    };
    await client.objects.update(doc.id, updateData);
    // Report the token data that was just stored rather than the value fetched before extraction.
    return createResponse({ ...doc, tokens: updateData.tokens }, txt, result_types_js_1.TextExtractionStatus.success);
}
|
120
|
+
/**
 * Assembles the result object returned by the text extraction activity.
 *
 * @param doc object providing `id` and `tokens`.
 * @param text text used to compute `len` (its length) and `hasText`.
 * @param status extraction status copied into the result.
 * @param message optional message copied into the result.
 * @returns `{ status, message, tokens, len, objectId, hasText }`.
 */
function createResponse(doc, text, status, message) {
    const response = { status, message };
    response.tokens = doc.tokens;
    response.len = text.length;
    response.objectId = doc.id;
    // An empty string counts as "no text".
    response.hasText = Boolean(text);
    return response;
}
|
130
|
+
/**
 * Heuristic check for whether a buffer looks like text.
 *
 * Only non-empty buffers smaller than 100KB are considered. A buffer that
 * contains a NUL byte is treated as binary, since NUL does not occur in
 * ordinary UTF-8 text; previously every non-empty small buffer was accepted,
 * so binary content ended up stored as document text.
 *
 * @param buf buffer holding the file content.
 * @returns true when the buffer is small enough, non-empty and free of NUL bytes.
 */
function sniffIfText(buf) {
    const MAX_SNIFF_SIZE = 100 * 1024;
    if (buf.length === 0 || buf.length >= MAX_SNIFF_SIZE) {
        return false;
    }
    return !buf.includes(0);
}
|
140
|
+
//# sourceMappingURL=extractDocumentText.js.map
|