@vertesia/workflow 1.0.0-dev.20260203.130115Z → 1.0.0-dev.20260227.112605Z

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (449) hide show
  1. package/lib/cjs/activities/advanced/createDocumentTypeFromInteractionRun.js +33 -0
  2. package/lib/cjs/activities/advanced/createDocumentTypeFromInteractionRun.js.map +1 -0
  3. package/lib/cjs/activities/advanced/createOrUpdateDocumentFromInteractionRun.js +73 -0
  4. package/lib/cjs/activities/advanced/createOrUpdateDocumentFromInteractionRun.js.map +1 -0
  5. package/lib/cjs/activities/advanced/updateDocumentFromInteractionRun.js +19 -0
  6. package/lib/cjs/activities/advanced/updateDocumentFromInteractionRun.js.map +1 -0
  7. package/lib/cjs/activities/chunkDocument.js +113 -0
  8. package/lib/cjs/activities/chunkDocument.js.map +1 -0
  9. package/lib/cjs/activities/copyParentArtifacts.js +127 -0
  10. package/lib/cjs/activities/copyParentArtifacts.js.map +1 -0
  11. package/lib/cjs/activities/createDocumentFromOther.js +64 -0
  12. package/lib/cjs/activities/createDocumentFromOther.js.map +1 -0
  13. package/lib/cjs/activities/executeInteraction.js +221 -0
  14. package/lib/cjs/activities/executeInteraction.js.map +1 -0
  15. package/lib/cjs/activities/extractDocumentText.js +196 -0
  16. package/lib/cjs/activities/extractDocumentText.js.map +1 -0
  17. package/lib/cjs/activities/generateDocumentProperties.js +109 -0
  18. package/lib/cjs/activities/generateDocumentProperties.js.map +1 -0
  19. package/lib/cjs/activities/generateEmbeddings.js +267 -0
  20. package/lib/cjs/activities/generateEmbeddings.js.map +1 -0
  21. package/lib/cjs/activities/generateOrAssignContentType.js +173 -0
  22. package/lib/cjs/activities/generateOrAssignContentType.js.map +1 -0
  23. package/lib/cjs/activities/getObjectFromStore.js +20 -0
  24. package/lib/cjs/activities/getObjectFromStore.js.map +1 -0
  25. package/lib/cjs/activities/handleError.js +22 -0
  26. package/lib/cjs/activities/handleError.js.map +1 -0
  27. package/lib/cjs/activities/index-dsl.js +53 -0
  28. package/lib/cjs/activities/index-dsl.js.map +1 -0
  29. package/lib/cjs/activities/index.js +21 -0
  30. package/lib/cjs/activities/index.js.map +1 -0
  31. package/lib/cjs/activities/media/prepareAudio.js +239 -0
  32. package/lib/cjs/activities/media/prepareAudio.js.map +1 -0
  33. package/lib/cjs/activities/media/prepareVideo.js +429 -0
  34. package/lib/cjs/activities/media/prepareVideo.js.map +1 -0
  35. package/lib/cjs/activities/media/processPdfWithTextract.js +103 -0
  36. package/lib/cjs/activities/media/processPdfWithTextract.js.map +1 -0
  37. package/lib/cjs/activities/media/saveGladiaTranscription.js +95 -0
  38. package/lib/cjs/activities/media/saveGladiaTranscription.js.map +1 -0
  39. package/lib/cjs/activities/media/transcribeMediaWithGladia.js +99 -0
  40. package/lib/cjs/activities/media/transcribeMediaWithGladia.js.map +1 -0
  41. package/lib/cjs/activities/mergeChildArtifacts.js +150 -0
  42. package/lib/cjs/activities/mergeChildArtifacts.js.map +1 -0
  43. package/lib/cjs/activities/notifyWebhook.js +167 -0
  44. package/lib/cjs/activities/notifyWebhook.js.map +1 -0
  45. package/lib/cjs/activities/rateLimiter.js +30 -0
  46. package/lib/cjs/activities/rateLimiter.js.map +1 -0
  47. package/lib/cjs/activities/renditions/generateImageRendition.js +66 -0
  48. package/lib/cjs/activities/renditions/generateImageRendition.js.map +1 -0
  49. package/lib/cjs/activities/renditions/generateVideoRendition.js +200 -0
  50. package/lib/cjs/activities/renditions/generateVideoRendition.js.map +1 -0
  51. package/lib/cjs/activities/setDocumentStatus.js +26 -0
  52. package/lib/cjs/activities/setDocumentStatus.js.map +1 -0
  53. package/lib/cjs/conversion/TextractProcessor.js +417 -0
  54. package/lib/cjs/conversion/TextractProcessor.js.map +1 -0
  55. package/lib/cjs/conversion/image.js +149 -0
  56. package/lib/cjs/conversion/image.js.map +1 -0
  57. package/lib/cjs/conversion/markitdown.js +42 -0
  58. package/lib/cjs/conversion/markitdown.js.map +1 -0
  59. package/lib/cjs/conversion/mutool.js +147 -0
  60. package/lib/cjs/conversion/mutool.js.map +1 -0
  61. package/lib/cjs/conversion/pandoc.js +39 -0
  62. package/lib/cjs/conversion/pandoc.js.map +1 -0
  63. package/lib/cjs/dsl/conditions.js +81 -0
  64. package/lib/cjs/dsl/conditions.js.map +1 -0
  65. package/lib/cjs/dsl/dsl-workflow.js +380 -0
  66. package/lib/cjs/dsl/dsl-workflow.js.map +1 -0
  67. package/lib/cjs/dsl/dslProxyActivities.js +23 -0
  68. package/lib/cjs/dsl/dslProxyActivities.js.map +1 -0
  69. package/lib/cjs/dsl/projections.js +59 -0
  70. package/lib/cjs/dsl/projections.js.map +1 -0
  71. package/lib/cjs/dsl/setup/ActivityContext.js +178 -0
  72. package/lib/cjs/dsl/setup/ActivityContext.js.map +1 -0
  73. package/lib/cjs/dsl/setup/fetch/DataProvider.js +51 -0
  74. package/lib/cjs/dsl/setup/fetch/DataProvider.js.map +1 -0
  75. package/lib/cjs/dsl/setup/fetch/index.js +16 -0
  76. package/lib/cjs/dsl/setup/fetch/index.js.map +1 -0
  77. package/lib/cjs/dsl/setup/fetch/providers.js +67 -0
  78. package/lib/cjs/dsl/setup/fetch/providers.js.map +1 -0
  79. package/lib/cjs/dsl/test/test-child-workflow.js +10 -0
  80. package/lib/cjs/dsl/test/test-child-workflow.js.map +1 -0
  81. package/lib/cjs/dsl/validation.js +122 -0
  82. package/lib/cjs/dsl/validation.js.map +1 -0
  83. package/lib/cjs/dsl/vars.js +341 -0
  84. package/lib/cjs/dsl/vars.js.map +1 -0
  85. package/lib/cjs/dsl/walk.js +100 -0
  86. package/lib/cjs/dsl/walk.js.map +1 -0
  87. package/lib/cjs/dsl.js +20 -0
  88. package/lib/cjs/dsl.js.map +1 -0
  89. package/lib/cjs/errors.js +89 -0
  90. package/lib/cjs/errors.js.map +1 -0
  91. package/lib/cjs/index.js +57 -0
  92. package/lib/cjs/index.js.map +1 -0
  93. package/lib/cjs/iterative-generation/activities/extractToc.js +47 -0
  94. package/lib/cjs/iterative-generation/activities/extractToc.js.map +1 -0
  95. package/lib/cjs/iterative-generation/activities/finalizeOutput.js +72 -0
  96. package/lib/cjs/iterative-generation/activities/finalizeOutput.js.map +1 -0
  97. package/lib/cjs/iterative-generation/activities/generatePart.js +78 -0
  98. package/lib/cjs/iterative-generation/activities/generatePart.js.map +1 -0
  99. package/lib/cjs/iterative-generation/activities/generateToc.js +86 -0
  100. package/lib/cjs/iterative-generation/activities/generateToc.js.map +1 -0
  101. package/lib/cjs/iterative-generation/activities/index.js +12 -0
  102. package/lib/cjs/iterative-generation/activities/index.js.map +1 -0
  103. package/lib/cjs/iterative-generation/iterativeGenerationWorkflow.js +56 -0
  104. package/lib/cjs/iterative-generation/iterativeGenerationWorkflow.js.map +1 -0
  105. package/lib/cjs/iterative-generation/types.js +5 -0
  106. package/lib/cjs/iterative-generation/types.js.map +1 -0
  107. package/lib/cjs/iterative-generation/utils.js +121 -0
  108. package/lib/cjs/iterative-generation/utils.js.map +1 -0
  109. package/lib/cjs/package.json +3 -0
  110. package/lib/cjs/result-types.js +10 -0
  111. package/lib/cjs/result-types.js.map +1 -0
  112. package/lib/cjs/system/notifyWebhookWorkflow.js +53 -0
  113. package/lib/cjs/system/notifyWebhookWorkflow.js.map +1 -0
  114. package/lib/cjs/system/recalculateEmbeddingsWorkflow.js +33 -0
  115. package/lib/cjs/system/recalculateEmbeddingsWorkflow.js.map +1 -0
  116. package/lib/cjs/utils/auth.js +15 -0
  117. package/lib/cjs/utils/auth.js.map +1 -0
  118. package/lib/cjs/utils/blobs.js +64 -0
  119. package/lib/cjs/utils/blobs.js.map +1 -0
  120. package/lib/cjs/utils/chunks.js +14 -0
  121. package/lib/cjs/utils/chunks.js.map +1 -0
  122. package/lib/cjs/utils/client.js +31 -0
  123. package/lib/cjs/utils/client.js.map +1 -0
  124. package/lib/cjs/utils/expand-vars.js +33 -0
  125. package/lib/cjs/utils/expand-vars.js.map +1 -0
  126. package/lib/cjs/utils/memory.js +65 -0
  127. package/lib/cjs/utils/memory.js.map +1 -0
  128. package/lib/cjs/utils/renditions.js +92 -0
  129. package/lib/cjs/utils/renditions.js.map +1 -0
  130. package/lib/cjs/utils/storage.js +54 -0
  131. package/lib/cjs/utils/storage.js.map +1 -0
  132. package/lib/cjs/utils/text-preview-utils.js +43 -0
  133. package/lib/cjs/utils/text-preview-utils.js.map +1 -0
  134. package/lib/cjs/utils/tokens.js +38 -0
  135. package/lib/cjs/utils/tokens.js.map +1 -0
  136. package/lib/cjs/vars.js +20 -0
  137. package/lib/cjs/vars.js.map +1 -0
  138. package/lib/cjs/workflows.js +15 -0
  139. package/lib/cjs/workflows.js.map +1 -0
  140. package/lib/esm/activities/advanced/createDocumentTypeFromInteractionRun.js +30 -0
  141. package/lib/esm/activities/advanced/createDocumentTypeFromInteractionRun.js.map +1 -0
  142. package/lib/esm/activities/advanced/createOrUpdateDocumentFromInteractionRun.js +70 -0
  143. package/lib/esm/activities/advanced/createOrUpdateDocumentFromInteractionRun.js.map +1 -0
  144. package/lib/esm/activities/advanced/updateDocumentFromInteractionRun.js +16 -0
  145. package/lib/esm/activities/advanced/updateDocumentFromInteractionRun.js.map +1 -0
  146. package/lib/esm/activities/chunkDocument.js +110 -0
  147. package/lib/esm/activities/chunkDocument.js.map +1 -0
  148. package/lib/esm/activities/copyParentArtifacts.js +124 -0
  149. package/lib/esm/activities/copyParentArtifacts.js.map +1 -0
  150. package/lib/esm/activities/createDocumentFromOther.js +58 -0
  151. package/lib/esm/activities/createDocumentFromOther.js.map +1 -0
  152. package/lib/esm/activities/executeInteraction.js +217 -0
  153. package/lib/esm/activities/executeInteraction.js.map +1 -0
  154. package/lib/esm/activities/extractDocumentText.js +193 -0
  155. package/lib/esm/activities/extractDocumentText.js.map +1 -0
  156. package/lib/esm/activities/generateDocumentProperties.js +106 -0
  157. package/lib/esm/activities/generateDocumentProperties.js.map +1 -0
  158. package/lib/esm/activities/generateEmbeddings.js +264 -0
  159. package/lib/esm/activities/generateEmbeddings.js.map +1 -0
  160. package/lib/esm/activities/generateOrAssignContentType.js +170 -0
  161. package/lib/esm/activities/generateOrAssignContentType.js.map +1 -0
  162. package/lib/esm/activities/getObjectFromStore.js +17 -0
  163. package/lib/esm/activities/getObjectFromStore.js.map +1 -0
  164. package/lib/esm/activities/handleError.js +19 -0
  165. package/lib/esm/activities/handleError.js.map +1 -0
  166. package/lib/esm/activities/index-dsl.js +26 -0
  167. package/lib/esm/activities/index-dsl.js.map +1 -0
  168. package/lib/esm/activities/index.js +5 -0
  169. package/lib/esm/activities/index.js.map +1 -0
  170. package/lib/esm/activities/media/prepareAudio.js +200 -0
  171. package/lib/esm/activities/media/prepareAudio.js.map +1 -0
  172. package/lib/esm/activities/media/prepareVideo.js +390 -0
  173. package/lib/esm/activities/media/prepareVideo.js.map +1 -0
  174. package/lib/esm/activities/media/processPdfWithTextract.js +99 -0
  175. package/lib/esm/activities/media/processPdfWithTextract.js.map +1 -0
  176. package/lib/esm/activities/media/saveGladiaTranscription.js +92 -0
  177. package/lib/esm/activities/media/saveGladiaTranscription.js.map +1 -0
  178. package/lib/esm/activities/media/transcribeMediaWithGladia.js +96 -0
  179. package/lib/esm/activities/media/transcribeMediaWithGladia.js.map +1 -0
  180. package/lib/esm/activities/mergeChildArtifacts.js +147 -0
  181. package/lib/esm/activities/mergeChildArtifacts.js.map +1 -0
  182. package/lib/esm/activities/notifyWebhook.js +164 -0
  183. package/lib/esm/activities/notifyWebhook.js.map +1 -0
  184. package/lib/esm/activities/rateLimiter.js +27 -0
  185. package/lib/esm/activities/rateLimiter.js.map +1 -0
  186. package/lib/esm/activities/renditions/generateImageRendition.js +63 -0
  187. package/lib/esm/activities/renditions/generateImageRendition.js.map +1 -0
  188. package/lib/esm/activities/renditions/generateVideoRendition.js +194 -0
  189. package/lib/esm/activities/renditions/generateVideoRendition.js.map +1 -0
  190. package/lib/esm/activities/setDocumentStatus.js +23 -0
  191. package/lib/esm/activities/setDocumentStatus.js.map +1 -0
  192. package/lib/esm/conversion/TextractProcessor.js +410 -0
  193. package/lib/esm/conversion/TextractProcessor.js.map +1 -0
  194. package/lib/esm/conversion/image.js +143 -0
  195. package/lib/esm/conversion/image.js.map +1 -0
  196. package/lib/esm/conversion/markitdown.js +36 -0
  197. package/lib/esm/conversion/markitdown.js.map +1 -0
  198. package/lib/esm/conversion/mutool.js +139 -0
  199. package/lib/esm/conversion/mutool.js.map +1 -0
  200. package/lib/esm/conversion/pandoc.js +36 -0
  201. package/lib/esm/conversion/pandoc.js.map +1 -0
  202. package/lib/esm/dsl/conditions.js +75 -0
  203. package/lib/esm/dsl/conditions.js.map +1 -0
  204. package/lib/esm/dsl/dsl-workflow.js +373 -0
  205. package/lib/esm/dsl/dsl-workflow.js.map +1 -0
  206. package/lib/esm/dsl/dslProxyActivities.js +20 -0
  207. package/lib/esm/dsl/dslProxyActivities.js.map +1 -0
  208. package/lib/esm/dsl/projections.js +55 -0
  209. package/lib/esm/dsl/projections.js.map +1 -0
  210. package/lib/esm/dsl/setup/ActivityContext.js +173 -0
  211. package/lib/esm/dsl/setup/ActivityContext.js.map +1 -0
  212. package/lib/esm/dsl/setup/fetch/DataProvider.js +47 -0
  213. package/lib/esm/dsl/setup/fetch/DataProvider.js.map +1 -0
  214. package/lib/esm/dsl/setup/fetch/index.js +12 -0
  215. package/lib/esm/dsl/setup/fetch/index.js.map +1 -0
  216. package/lib/esm/dsl/setup/fetch/providers.js +61 -0
  217. package/lib/esm/dsl/setup/fetch/providers.js.map +1 -0
  218. package/lib/esm/dsl/test/test-child-workflow.js +5 -0
  219. package/lib/esm/dsl/test/test-child-workflow.js.map +1 -0
  220. package/lib/esm/dsl/validation.js +118 -0
  221. package/lib/esm/dsl/validation.js.map +1 -0
  222. package/lib/esm/dsl/vars.js +335 -0
  223. package/lib/esm/dsl/vars.js.map +1 -0
  224. package/lib/esm/dsl/walk.js +96 -0
  225. package/lib/esm/dsl/walk.js.map +1 -0
  226. package/lib/esm/dsl.js +4 -0
  227. package/lib/esm/dsl.js.map +1 -0
  228. package/lib/esm/errors.js +78 -0
  229. package/lib/esm/errors.js.map +1 -0
  230. package/lib/esm/index.js +39 -0
  231. package/lib/esm/index.js.map +1 -0
  232. package/lib/esm/iterative-generation/activities/extractToc.js +44 -0
  233. package/lib/esm/iterative-generation/activities/extractToc.js.map +1 -0
  234. package/lib/esm/iterative-generation/activities/finalizeOutput.js +69 -0
  235. package/lib/esm/iterative-generation/activities/finalizeOutput.js.map +1 -0
  236. package/lib/esm/iterative-generation/activities/generatePart.js +75 -0
  237. package/lib/esm/iterative-generation/activities/generatePart.js.map +1 -0
  238. package/lib/esm/iterative-generation/activities/generateToc.js +83 -0
  239. package/lib/esm/iterative-generation/activities/generateToc.js.map +1 -0
  240. package/lib/esm/iterative-generation/activities/index.js +5 -0
  241. package/lib/esm/iterative-generation/activities/index.js.map +1 -0
  242. package/lib/esm/iterative-generation/iterativeGenerationWorkflow.js +53 -0
  243. package/lib/esm/iterative-generation/iterativeGenerationWorkflow.js.map +1 -0
  244. package/lib/esm/iterative-generation/types.js +2 -0
  245. package/lib/esm/iterative-generation/types.js.map +1 -0
  246. package/lib/esm/iterative-generation/utils.js +112 -0
  247. package/lib/esm/iterative-generation/utils.js.map +1 -0
  248. package/lib/esm/result-types.js +7 -0
  249. package/lib/esm/result-types.js.map +1 -0
  250. package/lib/esm/system/notifyWebhookWorkflow.js +50 -0
  251. package/lib/esm/system/notifyWebhookWorkflow.js.map +1 -0
  252. package/lib/esm/system/recalculateEmbeddingsWorkflow.js +30 -0
  253. package/lib/esm/system/recalculateEmbeddingsWorkflow.js.map +1 -0
  254. package/lib/esm/utils/auth.js +8 -0
  255. package/lib/esm/utils/auth.js.map +1 -0
  256. package/lib/esm/utils/blobs.js +54 -0
  257. package/lib/esm/utils/blobs.js.map +1 -0
  258. package/lib/esm/utils/chunks.js +9 -0
  259. package/lib/esm/utils/chunks.js.map +1 -0
  260. package/lib/esm/utils/client.js +27 -0
  261. package/lib/esm/utils/client.js.map +1 -0
  262. package/lib/esm/utils/expand-vars.js +30 -0
  263. package/lib/esm/utils/expand-vars.js.map +1 -0
  264. package/lib/esm/utils/memory.js +55 -0
  265. package/lib/esm/utils/memory.js.map +1 -0
  266. package/lib/esm/utils/renditions.js +84 -0
  267. package/lib/esm/utils/renditions.js.map +1 -0
  268. package/lib/esm/utils/storage.js +45 -0
  269. package/lib/esm/utils/storage.js.map +1 -0
  270. package/lib/esm/utils/text-preview-utils.js +38 -0
  271. package/lib/esm/utils/text-preview-utils.js.map +1 -0
  272. package/lib/esm/utils/tokens.js +34 -0
  273. package/lib/esm/utils/tokens.js.map +1 -0
  274. package/lib/esm/vars.js +4 -0
  275. package/lib/esm/vars.js.map +1 -0
  276. package/lib/esm/workflows.js +8 -0
  277. package/lib/esm/workflows.js.map +1 -0
  278. package/lib/tsconfig.tsbuildinfo +1 -0
  279. package/lib/types/activities/advanced/createDocumentTypeFromInteractionRun.d.ts +17 -0
  280. package/lib/types/activities/advanced/createDocumentTypeFromInteractionRun.d.ts.map +1 -0
  281. package/lib/types/activities/advanced/createOrUpdateDocumentFromInteractionRun.d.ts +39 -0
  282. package/lib/types/activities/advanced/createOrUpdateDocumentFromInteractionRun.d.ts.map +1 -0
  283. package/lib/types/activities/advanced/updateDocumentFromInteractionRun.d.ts +19 -0
  284. package/lib/types/activities/advanced/updateDocumentFromInteractionRun.d.ts.map +1 -0
  285. package/lib/types/activities/chunkDocument.d.ts +33 -0
  286. package/lib/types/activities/chunkDocument.d.ts.map +1 -0
  287. package/lib/types/activities/copyParentArtifacts.d.ts +19 -0
  288. package/lib/types/activities/copyParentArtifacts.d.ts.map +1 -0
  289. package/lib/types/activities/createDocumentFromOther.d.ts +21 -0
  290. package/lib/types/activities/createDocumentFromOther.d.ts.map +1 -0
  291. package/lib/types/activities/executeInteraction.d.ts +61 -0
  292. package/lib/types/activities/executeInteraction.d.ts.map +1 -0
  293. package/lib/types/activities/extractDocumentText.d.ts +11 -0
  294. package/lib/types/activities/extractDocumentText.d.ts.map +1 -0
  295. package/lib/types/activities/generateDocumentProperties.d.ts +32 -0
  296. package/lib/types/activities/generateDocumentProperties.d.ts.map +1 -0
  297. package/lib/types/activities/generateEmbeddings.d.ts +53 -0
  298. package/lib/types/activities/generateEmbeddings.d.ts.map +1 -0
  299. package/lib/types/activities/generateOrAssignContentType.d.ts +44 -0
  300. package/lib/types/activities/generateOrAssignContentType.d.ts.map +1 -0
  301. package/lib/types/activities/getObjectFromStore.d.ts +14 -0
  302. package/lib/types/activities/getObjectFromStore.d.ts.map +1 -0
  303. package/lib/types/activities/handleError.d.ts +6 -0
  304. package/lib/types/activities/handleError.d.ts.map +1 -0
  305. package/lib/types/activities/index-dsl.d.ts +26 -0
  306. package/lib/types/activities/index-dsl.d.ts.map +1 -0
  307. package/lib/types/activities/index.d.ts +5 -0
  308. package/lib/types/activities/index.d.ts.map +1 -0
  309. package/lib/types/activities/media/prepareAudio.d.ts +25 -0
  310. package/lib/types/activities/media/prepareAudio.d.ts.map +1 -0
  311. package/lib/types/activities/media/prepareVideo.d.ts +30 -0
  312. package/lib/types/activities/media/prepareVideo.d.ts.map +1 -0
  313. package/lib/types/activities/media/processPdfWithTextract.d.ts +26 -0
  314. package/lib/types/activities/media/processPdfWithTextract.d.ts.map +1 -0
  315. package/lib/types/activities/media/saveGladiaTranscription.d.ts +15 -0
  316. package/lib/types/activities/media/saveGladiaTranscription.d.ts.map +1 -0
  317. package/lib/types/activities/media/transcribeMediaWithGladia.d.ts +20 -0
  318. package/lib/types/activities/media/transcribeMediaWithGladia.d.ts.map +1 -0
  319. package/lib/types/activities/mergeChildArtifacts.d.ts +24 -0
  320. package/lib/types/activities/mergeChildArtifacts.d.ts.map +1 -0
  321. package/lib/types/activities/notifyWebhook.d.ts +27 -0
  322. package/lib/types/activities/notifyWebhook.d.ts.map +1 -0
  323. package/lib/types/activities/rateLimiter.d.ts +11 -0
  324. package/lib/types/activities/rateLimiter.d.ts.map +1 -0
  325. package/lib/types/activities/renditions/generateImageRendition.d.ts +14 -0
  326. package/lib/types/activities/renditions/generateImageRendition.d.ts.map +1 -0
  327. package/lib/types/activities/renditions/generateVideoRendition.d.ts +15 -0
  328. package/lib/types/activities/renditions/generateVideoRendition.d.ts.map +1 -0
  329. package/lib/types/activities/setDocumentStatus.d.ts +15 -0
  330. package/lib/types/activities/setDocumentStatus.d.ts.map +1 -0
  331. package/lib/types/conversion/TextractProcessor.d.ts +45 -0
  332. package/lib/types/conversion/TextractProcessor.d.ts.map +1 -0
  333. package/lib/types/conversion/image.d.ts +13 -0
  334. package/lib/types/conversion/image.d.ts.map +1 -0
  335. package/lib/types/conversion/markitdown.d.ts +2 -0
  336. package/lib/types/conversion/markitdown.d.ts.map +1 -0
  337. package/lib/types/conversion/mutool.d.ts +19 -0
  338. package/lib/types/conversion/mutool.d.ts.map +1 -0
  339. package/lib/types/conversion/pandoc.d.ts +2 -0
  340. package/lib/types/conversion/pandoc.d.ts.map +1 -0
  341. package/lib/types/dsl/conditions.d.ts +2 -0
  342. package/lib/types/dsl/conditions.d.ts.map +1 -0
  343. package/lib/types/dsl/dsl-workflow.d.ts +5 -0
  344. package/lib/types/dsl/dsl-workflow.d.ts.map +1 -0
  345. package/lib/types/dsl/dslProxyActivities.d.ts +10 -0
  346. package/lib/types/dsl/dslProxyActivities.d.ts.map +1 -0
  347. package/lib/types/dsl/projections.d.ts +4 -0
  348. package/lib/types/dsl/projections.d.ts.map +1 -0
  349. package/lib/types/dsl/setup/ActivityContext.d.ts +47 -0
  350. package/lib/types/dsl/setup/ActivityContext.d.ts.map +1 -0
  351. package/lib/types/dsl/setup/fetch/DataProvider.d.ts +9 -0
  352. package/lib/types/dsl/setup/fetch/DataProvider.d.ts.map +1 -0
  353. package/lib/types/dsl/setup/fetch/index.d.ts +6 -0
  354. package/lib/types/dsl/setup/fetch/index.d.ts.map +1 -0
  355. package/lib/types/dsl/setup/fetch/providers.d.ts +25 -0
  356. package/lib/types/dsl/setup/fetch/providers.d.ts.map +1 -0
  357. package/lib/types/dsl/test/test-child-workflow.d.ts +4 -0
  358. package/lib/types/dsl/test/test-child-workflow.d.ts.map +1 -0
  359. package/lib/types/dsl/validation.d.ts +4 -0
  360. package/lib/types/dsl/validation.d.ts.map +1 -0
  361. package/lib/types/dsl/vars.d.ts +48 -0
  362. package/lib/types/dsl/vars.d.ts.map +1 -0
  363. package/lib/types/dsl/walk.d.ts +18 -0
  364. package/lib/types/dsl/walk.d.ts.map +1 -0
  365. package/lib/types/dsl.d.ts +4 -0
  366. package/lib/types/dsl.d.ts.map +1 -0
  367. package/lib/types/errors.d.ts +41 -0
  368. package/lib/types/errors.d.ts.map +1 -0
  369. package/lib/types/index.d.ts +38 -0
  370. package/lib/types/index.d.ts.map +1 -0
  371. package/lib/types/iterative-generation/activities/extractToc.d.ts +10 -0
  372. package/lib/types/iterative-generation/activities/extractToc.d.ts.map +1 -0
  373. package/lib/types/iterative-generation/activities/finalizeOutput.d.ts +3 -0
  374. package/lib/types/iterative-generation/activities/finalizeOutput.d.ts.map +1 -0
  375. package/lib/types/iterative-generation/activities/generatePart.d.ts +3 -0
  376. package/lib/types/iterative-generation/activities/generatePart.d.ts.map +1 -0
  377. package/lib/types/iterative-generation/activities/generateToc.d.ts +4 -0
  378. package/lib/types/iterative-generation/activities/generateToc.d.ts.map +1 -0
  379. package/lib/types/iterative-generation/activities/index.d.ts +5 -0
  380. package/lib/types/iterative-generation/activities/index.d.ts.map +1 -0
  381. package/lib/types/iterative-generation/iterativeGenerationWorkflow.d.ts +3 -0
  382. package/lib/types/iterative-generation/iterativeGenerationWorkflow.d.ts.map +1 -0
  383. package/lib/types/iterative-generation/types.d.ts +79 -0
  384. package/lib/types/iterative-generation/types.d.ts.map +1 -0
  385. package/lib/types/iterative-generation/utils.d.ts +26 -0
  386. package/lib/types/iterative-generation/utils.d.ts.map +1 -0
  387. package/lib/types/result-types.d.ts +26 -0
  388. package/lib/types/result-types.d.ts.map +1 -0
  389. package/lib/types/system/notifyWebhookWorkflow.d.ts +8 -0
  390. package/lib/types/system/notifyWebhookWorkflow.d.ts.map +1 -0
  391. package/lib/types/system/recalculateEmbeddingsWorkflow.d.ts +25 -0
  392. package/lib/types/system/recalculateEmbeddingsWorkflow.d.ts.map +1 -0
  393. package/lib/types/utils/auth.d.ts +4 -0
  394. package/lib/types/utils/auth.d.ts.map +1 -0
  395. package/lib/types/utils/blobs.d.ts +7 -0
  396. package/lib/types/utils/blobs.d.ts.map +1 -0
  397. package/lib/types/utils/chunks.d.ts +9 -0
  398. package/lib/types/utils/chunks.d.ts.map +1 -0
  399. package/lib/types/utils/client.d.ts +8 -0
  400. package/lib/types/utils/client.d.ts.map +1 -0
  401. package/lib/types/utils/expand-vars.d.ts +8 -0
  402. package/lib/types/utils/expand-vars.d.ts.map +1 -0
  403. package/lib/types/utils/memory.d.ts +8 -0
  404. package/lib/types/utils/memory.d.ts.map +1 -0
  405. package/lib/types/utils/renditions.d.ts +25 -0
  406. package/lib/types/utils/renditions.d.ts.map +1 -0
  407. package/lib/types/utils/storage.d.ts +16 -0
  408. package/lib/types/utils/storage.d.ts.map +1 -0
  409. package/lib/types/utils/text-preview-utils.d.ts +15 -0
  410. package/lib/types/utils/text-preview-utils.d.ts.map +1 -0
  411. package/lib/types/utils/tokens.d.ts +11 -0
  412. package/lib/types/utils/tokens.d.ts.map +1 -0
  413. package/lib/types/vars.d.ts +3 -0
  414. package/lib/types/vars.d.ts.map +1 -0
  415. package/lib/types/workflows.d.ts +8 -0
  416. package/lib/types/workflows.d.ts.map +1 -0
  417. package/lib/workflows-bundle.js +18083 -0
  418. package/package.json +6 -7
  419. package/src/activities/advanced/createOrUpdateDocumentFromInteractionRun.ts +1 -1
  420. package/src/activities/chunkDocument.ts +35 -6
  421. package/src/activities/executeInteraction.ts +37 -5
  422. package/src/activities/extractDocumentText.ts +84 -28
  423. package/src/activities/generateDocumentProperties.ts +42 -15
  424. package/src/activities/generateEmbeddings.ts +9 -9
  425. package/src/activities/generateOrAssignContentType.ts +74 -24
  426. package/src/activities/index-dsl.ts +4 -3
  427. package/src/activities/media/saveGladiaTranscription.test.ts +406 -0
  428. package/src/activities/media/saveGladiaTranscription.ts +41 -26
  429. package/src/activities/media/transcribeMediaWithGladia.test.ts +583 -0
  430. package/src/activities/media/transcribeMediaWithGladia.ts +46 -25
  431. package/src/activities/notifyWebhook.test.ts +121 -8
  432. package/src/activities/notifyWebhook.ts +10 -2
  433. package/src/activities/renditions/generateImageRendition.ts +2 -2
  434. package/src/conversion/image.test.ts +1 -0
  435. package/src/conversion/image.ts +10 -10
  436. package/src/conversion/mutool.test.ts +1 -4
  437. package/src/conversion/pandoc.test.ts +1 -4
  438. package/src/dsl/dsl-workflow.ts +49 -9
  439. package/src/dsl/setup/ActivityContext.ts +73 -0
  440. package/src/dsl/workflow-exec-child.test.ts +12 -8
  441. package/src/dsl/workflow-fetch.test.ts +9 -6
  442. package/src/dsl/workflow-import.test.ts +10 -7
  443. package/src/dsl/workflow.test.ts +11 -8
  444. package/src/dsl.ts +1 -0
  445. package/src/errors.ts +14 -0
  446. package/src/index.ts +6 -5
  447. package/src/result-types.ts +5 -1
  448. package/src/utils/renditions.ts +11 -5
  449. package/src/utils/text-preview-utils.ts +62 -0
@@ -0,0 +1,221 @@
1
+ "use strict";
2
+ Object.defineProperty(exports, "__esModule", { value: true });
3
+ exports.executeInteraction = executeInteraction;
4
+ exports.executeInteractionFromActivity = executeInteractionFromActivity;
5
+ const common_1 = require("@llumiverse/common");
6
+ const activity_1 = require("@temporalio/activity");
7
+ const node_1 = require("@vertesia/client/node");
8
+ const common_2 = require("@vertesia/common");
9
+ const projections_js_1 = require("../dsl/projections.js");
10
+ const ActivityContext_js_1 = require("../dsl/setup/ActivityContext.js");
11
+ const errors_js_1 = require("../errors.js");
12
+ const tokens_js_1 = require("../utils/tokens.js");
13
+ const stream_1 = require("stream");
14
+ //Example:
15
+ //@ts-ignore
16
+ const JSON = {
17
+ name: "executeInteraction",
18
+ import: ["defaultModel", "guidlineId", "docTypeId"],
19
+ params: {
20
+ defaultModel: "${model}",
21
+ interactionName: "GenerateSummary",
22
+ model: "${defaultModel ?? 'gpt4'}",
23
+ environment: "13456",
24
+ max_tokens: 100,
25
+ temperature: 0.5,
26
+ tags: ["test"],
27
+ result_schema: "${docType.object_schema}",
28
+ prompt_data: {
29
+ documents: "${documents}",
30
+ guidline: "${guidline.text}",
31
+ },
32
+ },
33
+ fetch: {
34
+ documents: {
35
+ type: "document",
36
+ query: {
37
+ id: { $in: "${objectIds}" },
38
+ },
39
+ select: "+text",
40
+ },
41
+ guidline: {
42
+ type: "document",
43
+ limit: 1,
44
+ query: {
45
+ id: "${guidlineId}",
46
+ },
47
+ select: "+text",
48
+ on_not_found: "throw",
49
+ },
50
+ docType: {
51
+ type: "document_type",
52
+ limit: 1,
53
+ query: {
54
+ id: "${docTypeId}",
55
+ },
56
+ select: "+object_schema",
57
+ },
58
+ },
59
+ };
60
+ async function executeInteraction(payload) {
61
+ const { client, params } = await (0, ActivityContext_js_1.setupActivity)(payload);
62
+ const { interactionName, prompt_data, static_prompt_data: wf_prompt_data } = params;
63
+ if (wf_prompt_data) {
64
+ Object.assign(prompt_data, wf_prompt_data);
65
+ }
66
+ if (!interactionName) {
67
+ activity_1.log.error("Missing interactionName", { params });
68
+ throw new errors_js_1.ActivityParamNotFoundError("interactionName", payload.activity);
69
+ }
70
+ if (params.truncate) {
71
+ const truncate = params.truncate;
72
+ for (const [key, value] of Object.entries(truncate)) {
73
+ prompt_data[key] = (0, tokens_js_1.truncByMaxTokens)(prompt_data[key], value);
74
+ }
75
+ }
76
+ try {
77
+ const res = await executeInteractionFromActivity(client, interactionName, params, prompt_data, payload.debug_mode);
78
+ let completionResult = res.result;
79
+ // Handle image uploads if the result contains base64 images
80
+ const imageResults = completionResult.filter(r => r.type === "image");
81
+ if (imageResults.length > 0) {
82
+ const uploadedImages = await Promise.all(completionResult.map(async (item, index) => {
83
+ if (item.type === "image") {
84
+ const image = item.value;
85
+ // Extract base64 data and create buffer
86
+ const base64Data = image.replace(/^data:image\/[a-z]+;base64,/, "");
87
+ const buffer = Buffer.from(base64Data, 'base64');
88
+ // Generate filename
89
+ const { runId } = (0, activity_1.activityInfo)().workflowExecution;
90
+ const { activityId } = (0, activity_1.activityInfo)();
91
+ const filename = `generated-image-${runId}-${activityId}-${index}.png`;
92
+ // Create a readable stream from the buffer
93
+ const stream = stream_1.Readable.from(buffer);
94
+ const source = new node_1.NodeStreamSource(stream, filename, "image/png");
95
+ const file = await client.files.uploadFile(source);
96
+ return { type: "image", value: file };
97
+ }
98
+ return item;
99
+ }));
100
+ completionResult = uploadedImages;
101
+ }
102
+ return (0, projections_js_1.projectResult)(payload, params, res, {
103
+ runId: res.id,
104
+ status: res.status,
105
+ result: completionResult,
106
+ });
107
+ }
108
+ catch (error) {
109
+ activity_1.log.error(`Failed to execute interaction ${interactionName}`, { error });
110
+ if (error.statusCode === 429 && params.exit_on_resource_exhaustion) {
111
+ throw new errors_js_1.ResourceExhaustedError(error.statusCode, "Resource exhausted - rate limit exceeded");
112
+ }
113
+ else if (error.message.includes("Failed to validate merged prompt schema")) {
114
+ //issue with the input data, don't retry
115
+ throw new errors_js_1.ActivityParamInvalidError("prompt_data", payload.activity, error.message);
116
+ }
117
+ else if (error.message.includes("modelId: Path `modelId` is required")) {
118
+ //issue with the input data, don't retry
119
+ throw new errors_js_1.ActivityParamInvalidError("model", payload.activity, error.message);
120
+ }
121
+ // Check retryability from error object (set by executeInteractionFromActivity)
122
+ // or from LlumiverseError instance (direct driver errors in some paths)
123
+ const isRetryable = error.retryable !== undefined
124
+ ? error.retryable !== false // Treat undefined as retryable
125
+ : (error instanceof common_1.LlumiverseError ? error.retryable !== false : undefined);
126
+ if (isRetryable !== undefined) {
127
+ if (isRetryable) {
128
+ activity_1.log.debug('Marking error as retryable', { interactionName, errorCode: error.errorCode });
129
+ throw activity_1.ApplicationFailure.create({
130
+ message: `Interaction Execution failed ${interactionName}: ${error.message}`,
131
+ nonRetryable: false,
132
+ });
133
+ }
134
+ else {
135
+ activity_1.log.debug('Marking error as non-retryable', { interactionName, errorCode: error.errorCode });
136
+ throw activity_1.ApplicationFailure.create({
137
+ message: `Non-retryable Interaction Execution failed ${interactionName}: ${error.message}`,
138
+ nonRetryable: true,
139
+ });
140
+ }
141
+ }
142
+ // Unknown retryability - rethrow as generic error (Temporal will use default retry policy)
143
+ throw new Error(`Interaction Execution failed ${interactionName}: ${error.message}`);
144
+ }
145
+ }
146
+ async function executeInteractionFromActivity(client, interactionName, params, prompt_data, debug) {
147
+ const userTags = params.tags;
148
+ const info = (0, activity_1.activityInfo)();
149
+ const runId = info.workflowExecution.runId;
150
+ let tags = ["workflow"];
151
+ if (userTags) {
152
+ tags = tags.concat(userTags);
153
+ }
154
+ const workflow = {
155
+ run_id: info.workflowExecution.runId,
156
+ workflow_id: info.workflowExecution.workflowId,
157
+ activity_type: info.activityType,
158
+ };
159
+ let previousStudioExecutionRun = undefined;
160
+ if (params.include_previous_error) {
161
+ //retrieve last failed run if any
162
+ if (info.attempt > 1) {
163
+ activity_1.log.info("Retrying, searching for previous run", { prev_run_id: runId });
164
+ const payload = {
165
+ query: { workflow_run_ids: [runId] },
166
+ limit: 1,
167
+ };
168
+ const previousRun = await client.runs.search(payload).then((res) => {
169
+ activity_1.log.info("Search results", { results: res });
170
+ return res ? (res[0] ?? undefined) : undefined;
171
+ });
172
+ if (previousRun) {
173
+ activity_1.log.info("Found previous run", { previousRun });
174
+ previousStudioExecutionRun = await client.runs.retrieve(previousRun.id);
175
+ }
176
+ }
177
+ }
178
+ if (debug && previousStudioExecutionRun?.error) {
179
+ activity_1.log.info(`Found previous run error`, { error: previousStudioExecutionRun?.error });
180
+ }
181
+ const config = {
182
+ environment: params.environment,
183
+ model: params.model,
184
+ model_options: params.model_options,
185
+ do_validate: params.validate_result,
186
+ };
187
+ const data = {
188
+ ...prompt_data,
189
+ previous_error: previousStudioExecutionRun?.error,
190
+ };
191
+ const result_schema = params.result_schema;
192
+ activity_1.log.debug(`About to execute interaction ${interactionName}`, { config, data, result_schema, tags, workflow });
193
+ const res = await client.interactions
194
+ .executeByName(interactionName, {
195
+ config,
196
+ data,
197
+ result_schema,
198
+ tags,
199
+ stream: false,
200
+ workflow,
201
+ })
202
+ .catch((err) => {
203
+ activity_1.log.error(`Error executing interaction ${interactionName}`, { err });
204
+ throw err;
205
+ });
206
+ if (debug) {
207
+ activity_1.log.info(`Interaction executed ${interactionName}`, res);
208
+ }
209
+ if (res.error || res.status === common_2.ExecutionRunStatus.failed) {
210
+ activity_1.log.error(`Error executing interaction ${interactionName}`, { error: res.error });
211
+ // Create error with retryability information
212
+ const errorMessage = `Interaction Execution failed ${interactionName}: ${res.error?.message || 'Unknown error'}`;
213
+ const error = new Error(errorMessage);
214
+ // Attach retryable property so the catch block can access it
215
+ error.retryable = res.error?.retryable;
216
+ error.errorCode = res.error?.code;
217
+ throw error;
218
+ }
219
+ return res;
220
+ }
221
+ //# sourceMappingURL=executeInteraction.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"executeInteraction.js","sourceRoot":"","sources":["../../../src/activities/executeInteraction.ts"],"names":[],"mappings":";;AAiIA,gDA4GC;AAED,wEA4FC;AA3UD,+CAAqF;AACrF,mDAA6E;AAE7E,gDAAyD;AACzD,6CAQ0B;AAC1B,0DAAsD;AACtD,wEAAgE;AAChE,4CAA6G;AAC7G,kDAAoE;AACpE,mCAAkC;AAElC,UAAU;AACV,YAAY;AACZ,MAAM,IAAI,GAAoB;IAC1B,IAAI,EAAE,oBAAoB;IAC1B,MAAM,EAAE,CAAC,cAAc,EAAE,YAAY,EAAE,WAAW,CAAC;IACnD,MAAM,EAAE;QACJ,YAAY,EAAE,UAAU;QACxB,eAAe,EAAE,iBAAiB;QAClC,KAAK,EAAE,2BAA2B;QAClC,WAAW,EAAE,OAAO;QACpB,UAAU,EAAE,GAAG;QACf,WAAW,EAAE,GAAG;QAChB,IAAI,EAAE,CAAC,MAAM,CAAC;QACd,aAAa,EAAE,0BAA0B;QACzC,WAAW,EAAE;YACT,SAAS,EAAE,cAAc;YACzB,QAAQ,EAAE,kBAAkB;SAC/B;KACJ;IACD,KAAK,EAAE;QACH,SAAS,EAAE;YACP,IAAI,EAAE,UAAU;YAChB,KAAK,EAAE;gBACH,EAAE,EAAE,EAAE,GAAG,EAAE,cAAc,EAAE;aAC9B;YACD,MAAM,EAAE,OAAO;SAClB;QACD,QAAQ,EAAE;YACN,IAAI,EAAE,UAAU;YAChB,KAAK,EAAE,CAAC;YACR,KAAK,EAAE;gBACH,EAAE,EAAE,eAAe;aACtB;YACD,MAAM,EAAE,OAAO;YACf,YAAY,EAAE,OAAO;SACxB;QACD,OAAO,EAAE;YACL,IAAI,EAAE,eAAe;YACrB,KAAK,EAAE,CAAC;YACR,KAAK,EAAE;gBACH,EAAE,EAAE,cAAc;aACrB;YACD,MAAM,EAAE,gBAAgB;SAC3B;KACJ;CACJ,CAAC;AAiEK,KAAK,UAAU,kBAAkB,CAAC,OAA8D;IACnG,MAAM,EAAE,MAAM,EAAE,MAAM,EAAE,GAAG,MAAM,IAAA,kCAAa,EAA2B,OAAO,CAAC,CAAC;IAElF,MAAM,EAAE,eAAe,EAAE,WAAW,EAAE,kBAAkB,EAAE,cAAc,EAAE,GAAG,MAAM,CAAC;IACpF,IAAI,cAAc,EAAE,CAAC;QACjB,MAAM,CAAC,MAAM,CAAC,WAAW,EAAE,cAAc,CAAC,CAAC;IAC/C,CAAC;IAED,IAAI,CAAC,eAAe,EAAE,CAAC;QACnB,cAAG,CAAC,KAAK,CAAC,yBAAyB,EAAE,EAAE,MAAM,EAAE,CAAC,CAAC;QACjD,MAAM,IAAI,sCAA0B,CAAC,iBAAiB,EAAE,OAAO,CAAC,QAAQ,CAAC,CAAC;IAC9E,CAAC;IAED,IAAI,MAAM,CAAC,QAAQ,EAAE,CAAC;QAClB,MAAM,QAAQ,GAAG,MAAM,CAAC,QAAQ,CAAC;QACjC,KAAK,MAAM,CAAC,GAAG,EAAE,KAAK,CAAC,IAAI,MAAM,CAAC,OAAO,CAAC,QAAQ,CAAC,EAAE,CAAC;YAClD,WAAW,CAAC,GAAG,CAAC,GAAG,IAAA,4BAAgB,EAAC,WAAW,CAAC,GAAG,CAAC,EAAE,KAAK,CAAC,CAAC;QACjE,CAAC;IACL,CAAC;IAED,IAAI,CAAC;QACD,MAAM,GAAG,GAAG,MAAM,8BAA8B,CAC5C,MAAM,EACN,eAAe,EACf,MAAM,EACN,WAAW,EACX,OAAO,CAAC,UAAU,CACrB,CAAC;QAEF,IAAI,gBAAgB,GAAuB,GAAG,CAAC,MAAM,CAAC;QAEtD,4DAA4D;QAC5D,MAAM,YAAY,GAAG,gBAAgB,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,IAAI,KAAK,OAAO,CAAC,CAAC;QACtE,IAAI,YAAY,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;YAC1B,MAAM,cAAc,GAAG,MAAM,OAAO,CAAC,GAAG,CACpC,gBAAgB,CAAC,GAAG,CAAC,KAAK,EAAE,IAAI,EAAE,KAAK,EAAE,EAAE;gBACvC,IAAI,IAAI,CAAC,IAAI,KAAK,OAAO,EAAE,CAAC;oBACxB,MAAM,KAAK,GAAG,IAAI,CAAC,KAAK,CAAC;oBACzB,wCAAwC;oBACxC,MAAM,UAAU,GAAG,KAAK,CAAC,OAAO,CAAC,6BAA6B,EAAE,EAAE,CAAC,CAAC;oBACpE,MAAM,MAAM,GAAG,MAAM,CAAC,IAAI,CAAC,UAAU,EAAE,QAAQ,CAAC,CAAC;oBAEjD,oBAAoB;oBACpB,MAAM,EAAE,KAAK,EAAE,GAAG,IAAA,uBAAY,GAAE,CAAC,iBAAiB,CAAC;oBACnD,MAAM,EAAE,UAAU,EAAE,GAAG,IAAA,uBAAY,GAAE,CAAC;oBACtC,MAAM,QAAQ,GAAG,mBAAmB,KAAK,IAAI,UAAU,IAAI,KAAK,MAAM,CAAC;oBAEvE,2CAA2C;oBAC3C,MAAM,MAAM,GAAG,iBAAQ,CAAC,IAAI,CAAC,MAAM,CAAC,CAAC;oBAErC,MAAM,MAAM,GAAG,IAAI,uBAAgB,CAC/B,MAAM,EACN,QAAQ,EACR,WAAW,CACd,CAAC;oBAEF,MAAM,IAAI,GAAG,MAAM,MAAM,CAAC,KAAK,CAAC,UAAU,CAAC,MAAM,CAAC,CAAC;oBACnD,OAAO,EAAE,IAAI,EAAE,OAAO,EAAE,KAAK,EAAE,IAAI,EAAsB,CAAC;gBAC9D,CAAC;gBACD,OAAO,IAAI,CAAC;YAChB,CAAC,CAAC,CACL,CAAC;YACF,gBAAgB,GAAG,cAAc,CAAC;QACtC,CAAC;QAED,OAAO,IAAA,8BAAa,EAAC,OAAO,EAAE,MAAM,EAAE,GAAG,EAAE;YACvC,KAAK,EAAE,GAAG,CAAC,EAAE;YACb,MAAM,EAAE,GAAG,CAAC,MAAM;YAClB,MAAM,EAAE,gBAAgB;SAC3B,CAAC,CAAC;IAEP,CAAC;IAAC,OAAO,KAAU,EAAE,CAAC;QAClB,cAAG,CAAC,KAAK,CAAC,iCAAiC,eAAe,EAAE,EAAE,EAAE,KAAK,EAAE,CAAC,CAAC;QACzE,IAAI,KAAK,CAAC,UAAU,KAAK,GAAG,IAAI,MAAM,CAAC,2BAA2B,EAAE,CAAC;YACjE,MAAM,IAAI,kCAAsB,CAAC,KAAK,CAAC,UAAU,EAAE,0CAA0C,CAAC,CAAC;QACnG,CAAC;aAAM,IAAI,KAAK,CAAC,OAAO,CAAC,QAAQ,CAAC,yCAAyC,CAAC,EAAE,CAAC;YAC3E,wCAAwC;YACxC,MAAM,IAAI,qCAAyB,CAAC,aAAa,EAAE,OAAO,CAAC,QAAQ,EAAE,KAAK,CAAC,OAAO,CAAC,CAAC;QACxF,CAAC;aAAM,IAAI,KAAK,CAAC,OAAO,CAAC,QAAQ,CAAC,qCAAqC,CAAC,EAAE,CAAC;YACvE,wCAAwC;YACxC,MAAM,IAAI,qCAAyB,CAAC,OAAO,EAAE,OAAO,CAAC,QAAQ,EAAE,KAAK,CAAC,OAAO,CAAC,CAAC;QAClF,CAAC;QAED,+EAA+E;QAC/E,wEAAwE;QACxE,MAAM,WAAW,GAAG,KAAK,CAAC,SAAS,KAAK,SAAS;YAC7C,CAAC,CAAC,KAAK,CAAC,SAAS,KAAK,KAAK,CAAE,+BAA+B;YAC5D,CAAC,CAAC,CAAC,KAAK,YAAY,wBAAe,CAAC,CAAC,CAAC,KAAK,CAAC,SAAS,KAAK,KAAK,CAAC,CAAC,CAAC,SAAS,CAAC,CAAC;QAEjF,IAAI,WAAW,KAAK,SAAS,EAAE,CAAC;YAC5B,IAAI,WAAW,EAAE,CAAC;gBACd,cAAG,CAAC,KAAK,CAAC,4BAA4B,EAAE,EAAE,eAAe,EAAE,SAAS,EAAE,KAAK,CAAC,SAAS,EAAE,CAAC,CAAC;gBACzF,MAAM,6BAAkB,CAAC,MAAM,CAAC;oBAC5B,OAAO,EAAE,gCAAgC,eAAe,KAAK,KAAK,CAAC,OAAO,EAAE;oBAC5E,YAAY,EAAE,KAAK;iBACtB,CAAC,CAAC;YACP,CAAC;iBAAM,CAAC;gBACJ,cAAG,CAAC,KAAK,CAAC,gCAAgC,EAAE,EAAE,eAAe,EAAE,SAAS,EAAE,KAAK,CAAC,SAAS,EAAE,CAAC,CAAC;gBAC7F,MAAM,6BAAkB,CAAC,MAAM,CAAC;oBAC5B,OAAO,EAAE,8CAA8C,eAAe,KAAK,KAAK,CAAC,OAAO,EAAE;oBAC1F,YAAY,EAAE,IAAI;iBACrB,CAAC,CAAC;YACP,CAAC;QACL,CAAC;QAED,2FAA2F;QAC3F,MAAM,IAAI,KAAK,CAAC,gCAAgC,eAAe,KAAK,KAAK,CAAC,OAAO,EAAE,CAAC,CAAC;IACzF,CAAC;AACL,CAAC;AAEM,KAAK,UAAU,8BAA8B,CAChD,MAAsB,EACtB,eAAuB,EACvB,MAAkC,EAClC,WAAgB,EAChB,KAAe;IAEf,MAAM,QAAQ,GAAG,MAAM,CAAC,IAAI,CAAC;IAC7B,MAAM,IAAI,GAAG,IAAA,uBAAY,GAAE,CAAC;IAC5B,MAAM,KAAK,GAAG,IAAI,CAAC,iBAAiB,CAAC,KAAK,CAAC;IAC3C,IAAI,IAAI,GAAG,CAAC,UAAU,CAAC,CAAC;IACxB,IAAI,QAAQ,EAAE,CAAC;QACX,IAAI,GAAG,IAAI,CAAC,MAAM,CAAC,QAAQ,CAAC,CAAC;IACjC,CAAC;IACD,MAAM,QAAQ,GAAyB;QACnC,MAAM,EAAE,IAAI,CAAC,iBAAiB,CAAC,KAAK;QACpC,WAAW,EAAE,IAAI,CAAC,iBAAiB,CAAC,UAAU;QAC9C,aAAa,EAAE,IAAI,CAAC,YAAY;KACnC,CAAC;IAEF,IAAI,0BAA0B,GAA6B,SAAS,CAAC;IACrE,IAAI,MAAM,CAAC,sBAAsB,EAAE,CAAC;QAChC,iCAAiC;QACjC,IAAI,IAAI,CAAC,OAAO,GAAG,CAAC,EAAE,CAAC;YACnB,cAAG,CAAC,IAAI,CAAC,sCAAsC,EAAE,EAAE,WAAW,EAAE,KAAK,EAAE,CAAC,CAAC;YACzE,MAAM,OAAO,GAAqB;gBAC9B,KAAK,EAAE,EAAE,gBAAgB,EAAE,CAAC,KAAK,CAAC,EAAE;gBACpC,KAAK,EAAE,CAAC;aACX,CAAC;YACF,MAAM,WAAW,GAAG,MAAM,MAAM,CAAC,IAAI,CAAC,MAAM,CAAC,OAAO,CAAC,CAAC,IAAI,CAAC,CAAC,GAAG,EAAE,EAAE;gBAC/D,cAAG,CAAC,IAAI,CAAC,gBAAgB,EAAE,EAAE,OAAO,EAAE,GAAG,EAAE,CAAC,CAAC;gBAC7C,OAAO,GAAG,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,IAAI,SAAS,CAAC,CAAC,CAAC,CAAC,SAAS,CAAC;YACnD,CAAC,CAAC,CAAC;YAEH,IAAI,WAAW,EAAE,CAAC;gBACd,cAAG,CAAC,IAAI,CAAC,oBAAoB,EAAE,EAAE,WAAW,EAAE,CAAC,CAAC;gBAChD,0BAA0B,GAAG,MAAM,MAAM,CAAC,IAAI,CAAC,QAAQ,CAAC,WAAW,CAAC,EAAE,CAAC,CAAC;YAC5E,CAAC;QACL,CAAC;IACL,CAAC;IACD,IAAI,KAAK,IAAI,0BAA0B,EAAE,KAAK,EAAE,CAAC;QAC7C,cAAG,CAAC,IAAI,CAAC,2BAA2B,EAAE,EAAE,KAAK,EAAE,0BAA0B,EAAE,KAAK,EAAE,CAAC,CAAC;IACxF,CAAC;IAED,MAAM,MAAM,GAAsC;QAC9C,WAAW,EAAE,MAAM,CAAC,WAAW;QAC/B,KAAK,EAAE,MAAM,CAAC,KAAK;QACnB,aAAa,EAAE,MAAM,CAAC,aAAa;QACnC,WAAW,EAAE,MAAM,CAAC,eAAe;KACtC,CAAC;IACF,MAAM,IAAI,GAAG;QACT,GAAG,WAAW;QACd,cAAc,EAAE,0BAA0B,EAAE,KAAK;KACpD,CAAC;IAEF,MAAM,aAAa,GAAG,MAAM,CAAC,aAAa,CAAC;IAE3C,cAAG,CAAC,KAAK,CAAC,gCAAgC,eAAe,EAAE,EAAE,EAAE,MAAM,EAAE,IAAI,EAAE,aAAa,EAAE,IAAI,EAAE,QAAQ,EAAE,CAAC,CAAC;IAE9G,MAAM,GAAG,GAAG,MAAM,MAAM,CAAC,YAAY;SAChC,aAAa,CAAC,eAAe,EAAE;QAC5B,MAAM;QACN,IAAI;QACJ,aAAa;QACb,IAAI;QACJ,MAAM,EAAE,KAAK;QACb,QAAQ;KACX,CAAC;SACD,KAAK,CAAC,CAAC,GAAG,EAAE,EAAE;QACX,cAAG,CAAC,KAAK,CAAC,+BAA+B,eAAe,EAAE,EAAE,EAAE,GAAG,EAAE,CAAC,CAAC;QACrE,MAAM,GAAG,CAAC;IACd,CAAC,CAAC,CAAC;IAEP,IAAI,KAAK,EAAE,CAAC;QACR,cAAG,CAAC,IAAI,CAAC,wBAAwB,eAAe,EAAE,EAAE,GAAG,CAAC,CAAC;IAC7D,CAAC;IAED,IAAI,GAAG,CAAC,KAAK,IAAI,GAAG,CAAC,MAAM,KAAK,2BAAkB,CAAC,MAAM,EAAE,CAAC;QACxD,cAAG,CAAC,KAAK,CAAC,+BAA+B,eAAe,EAAE,EAAE,EAAE,KAAK,EAAE,GAAG,CAAC,KAAK,EAAE,CAAC,CAAC;QAElF,6CAA6C;QAC7C,MAAM,YAAY,GAAG,gCAAgC,eAAe,KAAK,GAAG,CAAC,KAAK,EAAE,OAAO,IAAI,eAAe,EAAE,CAAC;QACjH,MAAM,KAAK,GAAG,IAAI,KAAK,CAAC,YAAY,CAAC,CAAC;QAEtC,6DAA6D;QAC5D,KAAa,CAAC,SAAS,GAAG,GAAG,CAAC,KAAK,EAAE,SAAS,CAAC;QAC/C,KAAa,CAAC,SAAS,GAAG,GAAG,CAAC,KAAK,EAAE,IAAI,CAAC;QAE3C,MAAM,KAAK,CAAC;IAChB,CAAC;IAED,OAAO,GAAG,CAAC;AACf,CAAC"}
@@ -0,0 +1,196 @@
1
+ "use strict";
2
+ Object.defineProperty(exports, "__esModule", { value: true });
3
+ exports.extractDocumentText = extractDocumentText;
4
+ const activity_1 = require("@temporalio/activity");
5
+ const markitdown_js_1 = require("../conversion/markitdown.js");
6
+ const mutool_js_1 = require("../conversion/mutool.js");
7
+ const pandoc_js_1 = require("../conversion/pandoc.js");
8
+ const ActivityContext_js_1 = require("../dsl/setup/ActivityContext.js");
9
+ const errors_js_1 = require("../errors.js");
10
+ const result_types_js_1 = require("../result-types.js");
11
+ const blobs_js_1 = require("../utils/blobs.js");
12
+ const text_preview_utils_js_1 = require("../utils/text-preview-utils.js");
13
+ const tokens_js_1 = require("../utils/tokens.js");
14
+ //@ts-ignore
15
+ const JSON = {
16
+ name: "extractDocumentText",
17
+ };
18
+ async function extractDocumentText(payload) {
19
+ const context = await (0, ActivityContext_js_1.setupActivity)(payload);
20
+ const { client, inputType, params } = context;
21
+ const { output_storage_path } = params;
22
+ if (inputType === 'files') {
23
+ // File mode: extract from file source
24
+ if (!output_storage_path) {
25
+ throw new Error('output_storage_path is required when extracting text from file sources');
26
+ }
27
+ return extractFromFileSource(client, context.file, output_storage_path);
28
+ }
29
+ else {
30
+ // Object mode: fetch from object store
31
+ return extractFromObject(client, context.objectId, context.objectIds || []);
32
+ }
33
+ }
34
+ async function extractFromObject(client, objectId, objectIds) {
35
+ const r = await client.objects.find({
36
+ query: { _id: objectId },
37
+ limit: 1,
38
+ select: "+text",
39
+ });
40
+ const doc = r[0];
41
+ if (!doc) {
42
+ activity_1.log.error(`Document ${objectId} not found`);
43
+ throw new errors_js_1.DocumentNotFoundError(`Document ${objectId} not found`, objectIds);
44
+ }
45
+ activity_1.log.info(`Extracting text for object ${doc.id}`);
46
+ if (!doc.content?.type || !doc.content?.source) {
47
+ if (doc.text) {
48
+ return createResponse(doc, doc.text, result_types_js_1.TextExtractionStatus.skipped, "Text present and no source or type");
49
+ }
50
+ else {
51
+ return createResponse(doc, "", result_types_js_1.TextExtractionStatus.error, "No source or type found");
52
+ }
53
+ }
54
+ //skip if text already extracted and proper etag
55
+ if (doc.text && doc.text.length > 0 && doc.text_etag === doc.content.etag) {
56
+ return createResponse(doc, doc.text, result_types_js_1.TextExtractionStatus.skipped, "Text already extracted");
57
+ }
58
+ let fileBuffer;
59
+ try {
60
+ fileBuffer = await (0, blobs_js_1.fetchBlobAsBuffer)(client, doc.content.source);
61
+ }
62
+ catch (e) {
63
+ activity_1.log.error(`Error reading file: ${e}`);
64
+ return createResponse(doc, "", result_types_js_1.TextExtractionStatus.error, e.message);
65
+ }
66
+ const txt = await extractTextFromBuffer(fileBuffer, doc.content.type);
67
+ if (!txt) {
68
+ return createResponse(doc, doc.text ?? "", result_types_js_1.TextExtractionStatus.skipped, `Unsupported mime type: ${doc.content.type}`);
69
+ }
70
+ const tokensData = (0, tokens_js_1.countTokens)(txt);
71
+ const etag = doc.content.etag ?? (0, blobs_js_1.md5)(txt);
72
+ const updateData = {
73
+ text: txt,
74
+ text_etag: etag,
75
+ tokens: {
76
+ ...tokensData,
77
+ etag: etag,
78
+ },
79
+ };
80
+ await client.objects.update(doc.id, updateData);
81
+ return createResponse(doc, txt, result_types_js_1.TextExtractionStatus.success);
82
+ }
83
+ async function extractFromFileSource(client, input_file, output_storage_path) {
84
+ activity_1.log.info(`Extracting text from ${input_file}`);
85
+ let fileBuffer;
86
+ try {
87
+ fileBuffer = await (0, blobs_js_1.fetchBlobAsBuffer)(client, input_file.url);
88
+ }
89
+ catch (e) {
90
+ activity_1.log.error(`Error reading file: ${e}`);
91
+ return (0, text_preview_utils_js_1.createFileSourceResult)(input_file.url, output_storage_path, null);
92
+ }
93
+ const txt = await extractTextFromBuffer(fileBuffer, input_file.mimetype);
94
+ // Upload extracted text to storage
95
+ if (txt && output_storage_path) {
96
+ await (0, text_preview_utils_js_1.uploadTextPreviewToStorage)(client, txt, output_storage_path, "Document");
97
+ }
98
+ return (0, text_preview_utils_js_1.createFileSourceResult)(input_file.url, output_storage_path, txt);
99
+ }
100
+ async function extractTextFromBuffer(fileBuffer, mimeType) {
101
+ let txt;
102
+ switch (mimeType) {
103
+ case "application/pdf":
104
+ txt = await (0, mutool_js_1.mutoolPdfToText)(fileBuffer);
105
+ break;
106
+ case "text/plain":
107
+ txt = fileBuffer.toString("utf8");
108
+ break;
109
+ //docx
110
+ case "application/vnd.openxmlformats-officedocument.wordprocessingml.document":
111
+ txt = await (0, markitdown_js_1.markdownWithMarkitdown)(fileBuffer, "docx");
112
+ break;
113
+ //pptx
114
+ case "application/vnd.openxmlformats-officedocument.presentationml.presentation":
115
+ txt = await (0, markitdown_js_1.markdownWithMarkitdown)(fileBuffer, "pptx");
116
+ break;
117
+ //html
118
+ case "text/html":
119
+ txt = await (0, pandoc_js_1.markdownWithPandoc)(fileBuffer, "html");
120
+ break;
121
+ //opendocument
122
+ case "application/vnd.oasis.opendocument.text":
123
+ txt = await (0, pandoc_js_1.markdownWithPandoc)(fileBuffer, "odt");
124
+ break;
125
+ //rtf
126
+ case "application/rtf":
127
+ txt = await (0, pandoc_js_1.markdownWithPandoc)(fileBuffer, "rtf");
128
+ break;
129
+ //markdown
130
+ case "text/markdown":
131
+ txt = fileBuffer.toString("utf8");
132
+ break;
133
+ //csv
134
+ case "text/csv":
135
+ txt = fileBuffer.toString("utf8");
136
+ break;
137
+ //typescript
138
+ case "application/typescript":
139
+ txt = fileBuffer.toString("utf8");
140
+ break;
141
+ //javascript
142
+ case "application/javascript":
143
+ txt = fileBuffer.toString("utf8");
144
+ break;
145
+ //json
146
+ case "application/json":
147
+ txt = fileBuffer.toString("utf8");
148
+ break;
149
+ default:
150
+ if (sniffIfText(fileBuffer)) {
151
+ txt = fileBuffer.toString("utf8"); //TODO: add charset detection
152
+ break;
153
+ }
154
+ return null;
155
+ }
156
+ return txt;
157
+ }
158
+ function createResponse(doc, text, status, message) {
159
+ return {
160
+ status,
161
+ message,
162
+ tokens: doc.tokens,
163
+ len: text.length,
164
+ objectId: doc.id,
165
+ hasText: !!text,
166
+ };
167
+ }
168
+ function sniffIfText(buf) {
169
+ // If file is too large, don't even try
170
+ if (buf.length > 500 * 1024) {
171
+ return false;
172
+ }
173
+ // Count binary/control characters
174
+ let binaryCount = 0;
175
+ const sampleSize = Math.min(buf.length, 1000); // Check first 1000 bytes
176
+ for (let i = 0; i < sampleSize; i++) {
177
+ // Count control characters (except common whitespace)
178
+ const byte = buf[i];
179
+ if ((byte < 32 && ![9, 10, 13].includes(byte)) || byte === 0) {
180
+ binaryCount++;
181
+ }
182
+ }
183
+ // If more than 10% binary/control chars, probably not text
184
+ if (binaryCount / sampleSize > 0.1) {
185
+ return false;
186
+ }
187
+ // Additional check for valid UTF-8 encoding
188
+ try {
189
+ const s = buf.toString("utf8");
190
+ return s.length > 0 && !s.includes("\uFFFD"); // Replacement character
191
+ }
192
+ catch (e) {
193
+ return false;
194
+ }
195
+ }
196
+ //# sourceMappingURL=extractDocumentText.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"extractDocumentText.js","sourceRoot":"","sources":["../../../src/activities/extractDocumentText.ts"],"names":[],"mappings":";;AAkCA,kDAiBC;AAnDD,mDAA2C;AAQ3C,+DAAqE;AACrE,uDAA0D;AAC1D,uDAA6D;AAC7D,wEAAgE;AAChE,4CAAqD;AACrD,wDAAgF;AAChF,gDAA2D;AAC3D,0EAGwC;AACxC,kDAAiD;AAEjD,YAAY;AACZ,MAAM,IAAI,GAAoB;IAC1B,IAAI,EAAE,qBAAqB;CAC9B,CAAC;AAUK,KAAK,UAAU,mBAAmB,CACrC,OAA+D;IAE/D,MAAM,OAAO,GAAG,MAAM,IAAA,kCAAa,EAAC,OAAO,CAAC,CAAC;IAC7C,MAAM,EAAE,MAAM,EAAE,SAAS,EAAE,MAAM,EAAE,GAAG,OAAO,CAAC;IAC9C,MAAM,EAAE,mBAAmB,EAAE,GAAG,MAAM,CAAC;IAEvC,IAAI,SAAS,KAAK,OAAO,EAAE,CAAC;QACxB,sCAAsC;QACtC,IAAI,CAAC,mBAAmB,EAAE,CAAC;YACvB,MAAM,IAAI,KAAK,CAAC,wEAAwE,CAAC,CAAC;QAC9F,CAAC;QACD,OAAO,qBAAqB,CAAC,MAAM,EAAE,OAAO,CAAC,IAAI,EAAE,mBAAmB,CAAC,CAAC;IAC5E,CAAC;SAAM,CAAC;QACJ,uCAAuC;QACvC,OAAO,iBAAiB,CAAC,MAAM,EAAE,OAAO,CAAC,QAAQ,EAAE,OAAO,CAAC,SAAS,IAAI,EAAE,CAAC,CAAC;IAChF,CAAC;AACL,CAAC;AAED,KAAK,UAAU,iBAAiB,CAC5B,MAAW,EACX,QAAgB,EAChB,SAAmB;IAEnB,MAAM,CAAC,GAAG,MAAM,MAAM,CAAC,OAAO,CAAC,IAAI,CAAC;QAChC,KAAK,EAAE,EAAE,GAAG,EAAE,QAAQ,EAAE;QACxB,KAAK,EAAE,CAAC;QACR,MAAM,EAAE,OAAO;KAClB,CAAC,CAAC;IACH,MAAM,GAAG,GAAG,CAAC,CAAC,CAAC,CAAkB,CAAC;IAClC,IAAI,CAAC,GAAG,EAAE,CAAC;QACP,cAAG,CAAC,KAAK,CAAC,YAAY,QAAQ,YAAY,CAAC,CAAC;QAC5C,MAAM,IAAI,iCAAqB,CAAC,YAAY,QAAQ,YAAY,EAAE,SAAS,CAAC,CAAC;IACjF,CAAC;IAED,cAAG,CAAC,IAAI,CAAC,8BAA8B,GAAG,CAAC,EAAE,EAAE,CAAC,CAAC;IAEjD,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,IAAI,IAAI,CAAC,GAAG,CAAC,OAAO,EAAE,MAAM,EAAE,CAAC;QAC7C,IAAI,GAAG,CAAC,IAAI,EAAE,CAAC;YACX,OAAO,cAAc,CAAC,GAAG,EAAE,GAAG,CAAC,IAAI,EAAE,sCAAoB,CAAC,OAAO,EAAE,oCAAoC,CAAC,CAAC;QAC7G,CAAC;aAAM,CAAC;YACJ,OAAO,cAAc,CAAC,GAAG,EAAE,EAAE,EAAE,sCAAoB,CAAC,KAAK,EAAE,yBAAyB,CAAC,CAAC;QAC1F,CAAC;IACL,CAAC;IAED,gDAAgD;IAChD,IAAI,GAAG,CAAC,IAAI,IAAI,GAAG,CAAC,IAAI,CAAC,MAAM,GAAG,CAAC,IAAI,GAAG,CAAC,SAAS,KAAK,GAAG,CAAC,OAAO,CAAC,IAAI,EAAE,CAAC;QACxE,OAAO,cAAc,CAAC,GAAG,EAAE,GAAG,CAAC,IAAI,EAAE,sCAAoB,CAAC,OAAO,EAAE,wBAAwB,CAAC,CAAC;IACjG,CAAC;IAED,IAAI,UAAkB,CAAC;IACvB,IAAI,CAAC;QACD,UAAU,GAAG,MAAM,IAAA,4BAAiB,EAAC,MAAM,EAAE,GAAG,CAAC,OAAO,CAAC,MAAM,CAAC,CAAC;IACrE,CAAC;IAAC,OAAO,CAAM,EAAE,CAAC;QACd,cAAG,CAAC,KAAK,CAAC,uBAAuB,CAAC,EAAE,CAAC,CAAC;QACtC,OAAO,cAAc,CAAC,GAAG,EAAE,EAAE,EAAE,sCAAoB,CAAC,KAAK,EAAE,CAAC,CAAC,OAAO,CAAC,CAAC;IAC1E,CAAC;IAED,MAAM,GAAG,GAAG,MAAM,qBAAqB,CAAC,UAAU,EAAE,GAAG,CAAC,OAAO,CAAC,IAAI,CAAC,CAAC;IACtE,IAAI,CAAC,GAAG,EAAE,CAAC;QACP,OAAO,cAAc,CACjB,GAAG,EACH,GAAG,CAAC,IAAI,IAAI,EAAE,EACd,sCAAoB,CAAC,OAAO,EAC5B,0BAA0B,GAAG,CAAC,OAAO,CAAC,IAAI,EAAE,CAC/C,CAAC;IACN,CAAC;IAED,MAAM,UAAU,GAAG,IAAA,uBAAW,EAAC,GAAG,CAAC,CAAC;IACpC,MAAM,IAAI,GAAG,GAAG,CAAC,OAAO,CAAC,IAAI,IAAI,IAAA,cAAG,EAAC,GAAG,CAAC,CAAC;IAE1C,MAAM,UAAU,GAA+B;QAC3C,IAAI,EAAE,GAAG;QACT,SAAS,EAAE,IAAI;QACf,MAAM,EAAE;YACJ,GAAG,UAAU;YACb,IAAI,EAAE,IAAI;SACb;KACJ,CAAC;IAEF,MAAM,MAAM,CAAC,OAAO,CAAC,MAAM,CAAC,GAAG,CAAC,EAAE,EAAE,UAAU,CAAC,CAAC;IAEhD,OAAO,cAAc,CAAC,GAAG,EAAE,GAAG,EAAE,sCAAoB,CAAC,OAAO,CAAC,CAAC;AAClE,CAAC;AAED,KAAK,UAAU,qBAAqB,CAChC,MAAW,EACX,UAA6B,EAC7B,mBAA2B;IAE3B,cAAG,CAAC,IAAI,CAAC,wBAAwB,UAAU,EAAE,CAAC,CAAC;IAE/C,IAAI,UAAkB,CAAC;IACvB,IAAI,CAAC;QACD,UAAU,GAAG,MAAM,IAAA,4BAAiB,EAAC,MAAM,EAAE,UAAU,CAAC,GAAG,CAAC,CAAC;IACjE,CAAC;IAAC,OAAO,CAAM,EAAE,CAAC;QACd,cAAG,CAAC,KAAK,CAAC,uBAAuB,CAAC,EAAE,CAAC,CAAC;QACtC,OAAO,IAAA,8CAAsB,EAAC,UAAU,CAAC,GAAG,EAAE,mBAAmB,EAAE,IAAI,CAAC,CAAC;IAC7E,CAAC;IAED,MAAM,GAAG,GAAG,MAAM,qBAAqB,CAAC,UAAU,EAAE,UAAU,CAAC,QAAQ,CAAC,CAAC;IAEzE,mCAAmC;IACnC,IAAI,GAAG,IAAI,mBAAmB,EAAE,CAAC;QAC7B,MAAM,IAAA,kDAA0B,EAAC,MAAM,EAAE,GAAG,EAAE,mBAAmB,EAAE,UAAU,CAAC,CAAC;IACnF,CAAC;IAED,OAAO,IAAA,8CAAsB,EAAC,UAAU,CAAC,GAAG,EAAE,mBAAmB,EAAE,GAAG,CAAC,CAAC;AAC5E,CAAC;AAED,KAAK,UAAU,qBAAqB,CAAC,UAAkB,EAAE,QAAgB;IACrE,IAAI,GAAW,CAAC;IAEhB,QAAQ,QAAQ,EAAE,CAAC;QACf,KAAK,iBAAiB;YAClB,GAAG,GAAG,MAAM,IAAA,2BAAe,EAAC,UAAU,CAAC,CAAC;YACxC,MAAM;QAEV,KAAK,YAAY;YACb,GAAG,GAAG,UAAU,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC;YAClC,MAAM;QAEV,MAAM;QACN,KAAK,yEAAyE;YAC1E,GAAG,GAAG,MAAM,IAAA,sCAAsB,EAAC,UAAU,EAAE,MAAM,CAAC,CAAC;YACvD,MAAM;QAEV,MAAM;QACN,KAAK,2EAA2E;YAC5E,GAAG,GAAG,MAAM,IAAA,sCAAsB,EAAC,UAAU,EAAE,MAAM,CAAC,CAAC;YACvD,MAAM;QAEV,MAAM;QACN,KAAK,WAAW;YACZ,GAAG,GAAG,MAAM,IAAA,8BAAkB,EAAC,UAAU,EAAE,MAAM,CAAC,CAAC;YACnD,MAAM;QAEV,cAAc;QACd,KAAK,yCAAyC;YAC1C,GAAG,GAAG,MAAM,IAAA,8BAAkB,EAAC,UAAU,EAAE,KAAK,CAAC,CAAC;YAClD,MAAM;QAEV,KAAK;QACL,KAAK,iBAAiB;YAClB,GAAG,GAAG,MAAM,IAAA,8BAAkB,EAAC,UAAU,EAAE,KAAK,CAAC,CAAC;YAClD,MAAM;QAEV,UAAU;QACV,KAAK,eAAe;YAChB,GAAG,GAAG,UAAU,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC;YAClC,MAAM;QAEV,KAAK;QACL,KAAK,UAAU;YACX,GAAG,GAAG,UAAU,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC;YAClC,MAAM;QAEV,YAAY;QACZ,KAAK,wBAAwB;YACzB,GAAG,GAAG,UAAU,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC;YAClC,MAAM;QAEV,YAAY;QACZ,KAAK,wBAAwB;YACzB,GAAG,GAAG,UAAU,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC;YAClC,MAAM;QAEV,MAAM;QACN,KAAK,kBAAkB;YACnB,GAAG,GAAG,UAAU,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC;YAClC,MAAM;QAEV;YACI,IAAI,WAAW,CAAC,UAAU,CAAC,EAAE,CAAC;gBAC1B,GAAG,GAAG,UAAU,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC,CAAC,6BAA6B;gBAChE,MAAM;YACV,CAAC;YACD,OAAO,IAAI,CAAC;IACpB,CAAC;IAED,OAAO,GAAG,CAAC;AACf,CAAC;AAED,SAAS,cAAc,CACnB,GAAkB,EAClB,IAAY,EACZ,MAA4B,EAC5B,OAAgB;IAEhB,OAAO;QACH,MAAM;QACN,OAAO;QACP,MAAM,EAAE,GAAG,CAAC,MAAM;QAClB,GAAG,EAAE,IAAI,CAAC,MAAM;QAChB,QAAQ,EAAE,GAAG,CAAC,EAAE;QAChB,OAAO,EAAE,CAAC,CAAC,IAAI;KAClB,CAAC;AACN,CAAC;AAED,SAAS,WAAW,CAAC,GAAW;IAC5B,uCAAuC;IACvC,IAAI,GAAG,CAAC,MAAM,GAAG,GAAG,GAAG,IAAI,EAAE,CAAC;QAC1B,OAAO,KAAK,CAAC;IACjB,CAAC;IAED,kCAAkC;IAClC,IAAI,WAAW,GAAG,CAAC,CAAC;IACpB,MAAM,UAAU,GAAG,IAAI,CAAC,GAAG,CAAC,GAAG,CAAC,MAAM,EAAE,IAAI,CAAC,CAAC,CAAC,yBAAyB;IAExE,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,UAAU,EAAE,CAAC,EAAE,EAAE,CAAC;QAClC,sDAAsD;QACtD,MAAM,IAAI,GAAG,GAAG,CAAC,CAAC,CAAC,CAAC;QACpB,IAAI,CAAC,IAAI,GAAG,EAAE,IAAI,CAAC,CAAC,CAAC,EAAE,EAAE,EAAE,EAAE,CAAC,CAAC,QAAQ,CAAC,IAAI,CAAC,CAAC,IAAI,IAAI,KAAK,CAAC,EAAE,CAAC;YAC3D,WAAW,EAAE,CAAC;QAClB,CAAC;IACL,CAAC;IAED,2DAA2D;IAC3D,IAAI,WAAW,GAAG,UAAU,GAAG,GAAG,EAAE,CAAC;QACjC,OAAO,KAAK,CAAC;IACjB,CAAC;IAED,4CAA4C;IAC5C,IAAI,CAAC;QACD,MAAM,CAAC,GAAG,GAAG,CAAC,QAAQ,CAAC,MAAM,CAAC,CAAC;QAC/B,OAAO,CAAC,CAAC,MAAM,GAAG,CAAC,IAAI,CAAC,CAAC,CAAC,QAAQ,CAAC,QAAQ,CAAC,CAAC,CAAC,wBAAwB;IAC1E,CAAC;IAAC,OAAO,CAAC,EAAE,CAAC;QACT,OAAO,KAAK,CAAC;IACjB,CAAC;AACL,CAAC"}
@@ -0,0 +1,109 @@
1
+ "use strict";
2
+ Object.defineProperty(exports, "__esModule", { value: true });
3
+ exports.generateDocumentProperties = generateDocumentProperties;
4
+ const activity_1 = require("@temporalio/activity");
5
+ const ActivityContext_js_1 = require("../dsl/setup/ActivityContext.js");
6
+ const tokens_js_1 = require("../utils/tokens.js");
7
+ const executeInteraction_js_1 = require("./executeInteraction.js");
8
+ const INT_EXTRACT_INFORMATION = "sys:ExtractInformation";
9
+ async function generateDocumentProperties(payload) {
10
+ const context = await (0, ActivityContext_js_1.setupActivity)(payload);
11
+ const { params, client, objectId } = context;
12
+ const interactionName = params.interactionName ?? INT_EXTRACT_INFORMATION;
13
+ const project = await context.fetchProject();
14
+ const doc = await client.objects.retrieve(objectId, "+text");
15
+ const type = doc.type
16
+ ? await client.types.catalog.resolve(doc.type)
17
+ : undefined;
18
+ if (!doc?.text && !params.use_vision && !doc?.content?.type?.startsWith("image/")) {
19
+ activity_1.log.warn(`Object ${objectId} not found or text is empty`);
20
+ return { status: "failed", error: "no-text" };
21
+ }
22
+ if (!type || !type.object_schema) {
23
+ activity_1.log.info(`Object ${objectId} has no schema`);
24
+ return { document: objectId, status: "skipped", message: "no schema defined on type" };
25
+ }
26
+ const getImageRef = () => {
27
+ if (doc.content?.type?.startsWith("image/")) {
28
+ return "store:" + doc.id;
29
+ }
30
+ if (params.use_vision && doc.content?.type?.startsWith("application/pdf")) {
31
+ return "store:" + doc.id;
32
+ }
33
+ activity_1.log.info(`Object ${objectId} is not an image or pdf`);
34
+ return undefined;
35
+ };
36
+ const content = doc.text
37
+ ? (0, tokens_js_1.truncByMaxTokens)(doc.text, params.truncate || 30000)
38
+ : undefined;
39
+ const promptData = {
40
+ content: content,
41
+ image: getImageRef() ?? undefined,
42
+ human_context: project?.configuration?.human_context ?? undefined,
43
+ };
44
+ activity_1.log.info(` Extracting information from object ${objectId} with type ${type.name}`, payload.debug_mode ? { params } : undefined);
45
+ let infoRes;
46
+ try {
47
+ infoRes = await (0, executeInteraction_js_1.executeInteractionFromActivity)(client, interactionName, {
48
+ ...params,
49
+ include_previous_error: true,
50
+ result_schema: type.object_schema,
51
+ validate_result: type.strict_mode,
52
+ }, promptData, payload.debug_mode ?? false);
53
+ }
54
+ catch (error) {
55
+ activity_1.log.error(`Failed to extract document properties for ${objectId}`, { error, retryable: error.retryable });
56
+ const isRetryable = error.retryable !== undefined
57
+ ? error.retryable !== false
58
+ : undefined;
59
+ if (isRetryable !== undefined) {
60
+ if (isRetryable) {
61
+ throw activity_1.ApplicationFailure.create({
62
+ message: `Document property extraction failed for ${objectId}: ${error.message}`,
63
+ nonRetryable: false,
64
+ });
65
+ }
66
+ else {
67
+ throw activity_1.ApplicationFailure.create({
68
+ message: `Non-retryable document property extraction failed for ${objectId}: ${error.message}`,
69
+ nonRetryable: true,
70
+ });
71
+ }
72
+ }
73
+ throw error;
74
+ }
75
+ const getText = () => {
76
+ if (doc.text) {
77
+ return undefined;
78
+ }
79
+ let text = "";
80
+ const jsonResult = infoRes.result.object();
81
+ if (jsonResult.title) {
82
+ text += jsonResult.title + "\n";
83
+ }
84
+ if (jsonResult.description) {
85
+ text += jsonResult.description;
86
+ }
87
+ if (text) {
88
+ return text;
89
+ }
90
+ else {
91
+ return undefined;
92
+ }
93
+ };
94
+ activity_1.log.info(`Extracted information from object ${objectId} with type ${type.name}`, { runId: infoRes.id });
95
+ await client.objects.update(doc.id, {
96
+ properties: {
97
+ ...infoRes.result.object(),
98
+ etag: doc.text_etag,
99
+ },
100
+ text: getText(),
101
+ generation_run_info: {
102
+ id: infoRes.id,
103
+ date: new Date().toISOString(),
104
+ model: infoRes.modelId ?? "",
105
+ },
106
+ }, { suppressWorkflows: true });
107
+ return { status: "completed" };
108
+ }
109
+ //# sourceMappingURL=generateDocumentProperties.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"generateDocumentProperties.js","sourceRoot":"","sources":["../../../src/activities/generateDocumentProperties.ts"],"names":[],"mappings":";;AAsBA,gEA4HC;AAlJD,mDAA+D;AAE/D,wEAAgE;AAChE,kDAAoE;AACpE,mEAAqG;AAErG,MAAM,uBAAuB,GAAG,wBAAwB,CAAC;AAgBlD,KAAK,UAAU,0BAA0B,CAC5C,OAAsE;IAEtE,MAAM,OAAO,GAAG,MAAM,IAAA,kCAAa,EAAmC,OAAO,CAAC,CAAC;IAC/E,MAAM,EAAE,MAAM,EAAE,MAAM,EAAE,QAAQ,EAAE,GAAG,OAAO,CAAC;IAC7C,MAAM,eAAe,GAAG,MAAM,CAAC,eAAe,IAAI,uBAAuB,CAAC;IAE1E,MAAM,OAAO,GAAG,MAAM,OAAO,CAAC,YAAY,EAAE,CAAC;IAE7C,MAAM,GAAG,GAAG,MAAM,MAAM,CAAC,OAAO,CAAC,QAAQ,CAAC,QAAQ,EAAE,OAAO,CAAC,CAAC;IAC7D,MAAM,IAAI,GAAG,GAAG,CAAC,IAAI;QACjB,CAAC,CAAC,MAAM,MAAM,CAAC,KAAK,CAAC,OAAO,CAAC,OAAO,CAAC,GAAG,CAAC,IAAI,CAAC;QAC9C,CAAC,CAAC,SAAS,CAAC;IAEhB,IAAI,CAAC,GAAG,EAAE,IAAI,IAAI,CAAC,MAAM,CAAC,UAAU,IAAI,CAAC,GAAG,EAAE,OAAO,EAAE,IAAI,EAAE,UAAU,CAAC,QAAQ,CAAC,EAAE,CAAC;QAChF,cAAG,CAAC,IAAI,CAAC,UAAU,QAAQ,6BAA6B,CAAC,CAAC;QAC1D,OAAO,EAAE,MAAM,EAAE,QAAQ,EAAE,KAAK,EAAE,SAAS,EAAE,CAAC;IAClD,CAAC;IAED,IAAI,CAAC,IAAI,IAAI,CAAC,IAAI,CAAC,aAAa,EAAE,CAAC;QAC/B,cAAG,CAAC,IAAI,CAAC,UAAU,QAAQ,gBAAgB,CAAC,CAAC;QAC7C,OAAO,EAAE,QAAQ,EAAE,QAAQ,EAAE,MAAM,EAAE,SAAS,EAAE,OAAO,EAAE,2BAA2B,EAAE,CAAC;IAC3F,CAAC;IAED,MAAM,WAAW,GAAG,GAAG,EAAE;QACrB,IAAI,GAAG,CAAC,OAAO,EAAE,IAAI,EAAE,UAAU,CAAC,QAAQ,CAAC,EAAE,CAAC;YAC1C,OAAO,QAAQ,GAAG,GAAG,CAAC,EAAE,CAAC;QAC7B,CAAC;QAED,IAAI,MAAM,CAAC,UAAU,IAAI,GAAG,CAAC,OAAO,EAAE,IAAI,EAAE,UAAU,CAAC,iBAAiB,CAAC,EAAE,CAAC;YACxE,OAAO,QAAQ,GAAG,GAAG,CAAC,EAAE,CAAC;QAC7B,CAAC;QAED,cAAG,CAAC,IAAI,CAAC,UAAU,QAAQ,yBAAyB,CAAC,CAAC;QACtD,OAAO,SAAS,CAAC;IACrB,CAAC,CAAC;IAEF,MAAM,OAAO,GAAG,GAAG,CAAC,IAAI;QACpB,CAAC,CAAC,IAAA,4BAAgB,EAAC,GAAG,CAAC,IAAI,EAAE,MAAM,CAAC,QAAQ,IAAI,KAAK,CAAC;QACtD,CAAC,CAAC,SAAS,CAAC;IAEhB,MAAM,UAAU,GAAG;QACf,OAAO,EAAE,OAAO;QAChB,KAAK,EAAE,WAAW,EAAE,IAAI,SAAS;QACjC,aAAa,EAAE,OAAO,EAAE,aAAa,EAAE,aAAa,IAAI,SAAS;KACpE,CAAC;IAEF,cAAG,CAAC,IAAI,CACJ,uCAAuC,QAAQ,cAAc,IAAI,CAAC,IAAI,EAAE,EACxE,OAAO,CAAC,UAAU,CAAC,CAAC,CAAC,EAAE,MAAM,EAAE,CAAC,CAAC,CAAC,SAAS,CAC9C,CAAC;IAEF,IAAI,OAAO,CAAC;IACZ,IAAI,CAAC;QACD,OAAO,GAAG,MAAM,IAAA,sDAA8B,EAC1C,MAAM,EACN,eAAe,EACf;YACI,GAAG,MAAM;YACT,sBAAsB,EAAE,IAAI;YAC5B,aAAa,EAAE,IAAI,CAAC,aAAa;YACjC,eAAe,EAAE,IAAI,CAAC,WAAW;SACpC,EACD,UAAU,EACV,OAAO,CAAC,UAAU,IAAI,KAAK,CAC9B,CAAC;IACN,CAAC;IAAC,OAAO,KAAU,EAAE,CAAC;QAClB,cAAG,CAAC,KAAK,CAAC,6CAA6C,QAAQ,EAAE,EAAE,EAAE,KAAK,EAAE,SAAS,EAAE,KAAK,CAAC,SAAS,EAAE,CAAC,CAAC;QAE1G,MAAM,WAAW,GAAG,KAAK,CAAC,SAAS,KAAK,SAAS;YAC7C,CAAC,CAAC,KAAK,CAAC,SAAS,KAAK,KAAK;YAC3B,CAAC,CAAC,SAAS,CAAC;QAEhB,IAAI,WAAW,KAAK,SAAS,EAAE,CAAC;YAC5B,IAAI,WAAW,EAAE,CAAC;gBACd,MAAM,6BAAkB,CAAC,MAAM,CAAC;oBAC5B,OAAO,EAAE,2CAA2C,QAAQ,KAAK,KAAK,CAAC,OAAO,EAAE;oBAChF,YAAY,EAAE,KAAK;iBACtB,CAAC,CAAC;YACP,CAAC;iBAAM,CAAC;gBACJ,MAAM,6BAAkB,CAAC,MAAM,CAAC;oBAC5B,OAAO,EAAE,yDAAyD,QAAQ,KAAK,KAAK,CAAC,OAAO,EAAE;oBAC9F,YAAY,EAAE,IAAI;iBACrB,CAAC,CAAC;YACP,CAAC;QACL,CAAC;QAED,MAAM,KAAK,CAAC;IAChB,CAAC;IAED,MAAM,OAAO,GAAG,GAAG,EAAE;QACjB,IAAI,GAAG,CAAC,IAAI,EAAE,CAAC;YACX,OAAO,SAAS,CAAC;QACrB,CAAC;QACD,IAAI,IAAI,GAAG,EAAE,CAAC;QACd,MAAM,UAAU,GAAG,OAAO,CAAC,MAAM,CAAC,MAAM,EAAE,CAAC;QAC3C,IAAI,UAAU,CAAC,KAAK,EAAE,CAAC;YACnB,IAAI,IAAI,UAAU,CAAC,KAAK,GAAG,IAAI,CAAC;QACpC,CAAC;QACD,IAAI,UAAU,CAAC,WAAW,EAAE,CAAC;YACzB,IAAI,IAAI,UAAU,CAAC,WAAW,CAAC;QACnC,CAAC;QACD,IAAI,IAAI,EAAE,CAAC;YACP,OAAO,IAAI,CAAC;QAChB,CAAC;aAAM,CAAC;YACJ,OAAO,SAAS,CAAC;QACrB,CAAC;IACL,CAAC,CAAC;IAEF,cAAG,CAAC,IAAI,CAAC,qCAAqC,QAAQ,cAAc,IAAI,CAAC,IAAI,EAAE,EAAE,EAAE,KAAK,EAAE,OAAO,CAAC,EAAE,EAAE,CAAC,CAAC;IACxG,MAAM,MAAM,CAAC,OAAO,CAAC,MAAM,CAAC,GAAG,CAAC,EAAE,EAAE;QAChC,UAAU,EAAE;YACR,GAAG,OAAO,CAAC,MAAM,CAAC,MAAM,EAAE;YAC1B,IAAI,EAAE,GAAG,CAAC,SAAS;SACtB;QACD,IAAI,EAAE,OAAO,EAAE;QACf,mBAAmB,EAAE;YACjB,EAAE,EAAE,OAAO,CAAC,EAAE;YACd,IAAI,EAAE,IAAI,IAAI,EAAE,CAAC,WAAW,EAAE;YAC9B,KAAK,EAAE,OAAO,CAAC,OAAO,IAAI,EAAE;SAC/B;KACJ,EAAE,EAAE,iBAAiB,EAAE,IAAI,EAAE,CAAC,CAAC;IAEhC,OAAO,EAAE,MAAM,EAAE,WAAW,EAAE,CAAC;AACnC,CAAC"}