@vertesia/workflow 0.24.0-dev.202601221707

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (490)
  1. package/LICENSE +13 -0
  2. package/README.md +65 -0
  3. package/bin/bundle-workflows.mjs +39 -0
  4. package/lib/cjs/activities/advanced/createDocumentTypeFromInteractionRun.js +33 -0
  5. package/lib/cjs/activities/advanced/createDocumentTypeFromInteractionRun.js.map +1 -0
  6. package/lib/cjs/activities/advanced/createOrUpdateDocumentFromInteractionRun.js +73 -0
  7. package/lib/cjs/activities/advanced/createOrUpdateDocumentFromInteractionRun.js.map +1 -0
  8. package/lib/cjs/activities/advanced/updateDocumentFromInteractionRun.js +19 -0
  9. package/lib/cjs/activities/advanced/updateDocumentFromInteractionRun.js.map +1 -0
  10. package/lib/cjs/activities/chunkDocument.js +85 -0
  11. package/lib/cjs/activities/chunkDocument.js.map +1 -0
  12. package/lib/cjs/activities/copyParentArtifacts.js +127 -0
  13. package/lib/cjs/activities/copyParentArtifacts.js.map +1 -0
  14. package/lib/cjs/activities/createDocumentFromOther.js +64 -0
  15. package/lib/cjs/activities/createDocumentFromOther.js.map +1 -0
  16. package/lib/cjs/activities/executeInteraction.js +194 -0
  17. package/lib/cjs/activities/executeInteraction.js.map +1 -0
  18. package/lib/cjs/activities/extractDocumentText.js +156 -0
  19. package/lib/cjs/activities/extractDocumentText.js.map +1 -0
  20. package/lib/cjs/activities/generateDocumentProperties.js +83 -0
  21. package/lib/cjs/activities/generateDocumentProperties.js.map +1 -0
  22. package/lib/cjs/activities/generateEmbeddings.js +257 -0
  23. package/lib/cjs/activities/generateEmbeddings.js.map +1 -0
  24. package/lib/cjs/activities/generateOrAssignContentType.js +125 -0
  25. package/lib/cjs/activities/generateOrAssignContentType.js.map +1 -0
  26. package/lib/cjs/activities/getObjectFromStore.js +20 -0
  27. package/lib/cjs/activities/getObjectFromStore.js.map +1 -0
  28. package/lib/cjs/activities/handleError.js +22 -0
  29. package/lib/cjs/activities/handleError.js.map +1 -0
  30. package/lib/cjs/activities/index-dsl.js +51 -0
  31. package/lib/cjs/activities/index-dsl.js.map +1 -0
  32. package/lib/cjs/activities/index.js +21 -0
  33. package/lib/cjs/activities/index.js.map +1 -0
  34. package/lib/cjs/activities/media/prepareAudio.js +239 -0
  35. package/lib/cjs/activities/media/prepareAudio.js.map +1 -0
  36. package/lib/cjs/activities/media/prepareVideo.js +429 -0
  37. package/lib/cjs/activities/media/prepareVideo.js.map +1 -0
  38. package/lib/cjs/activities/media/processPdfWithTextract.js +103 -0
  39. package/lib/cjs/activities/media/processPdfWithTextract.js.map +1 -0
  40. package/lib/cjs/activities/media/saveGladiaTranscription.js +81 -0
  41. package/lib/cjs/activities/media/saveGladiaTranscription.js.map +1 -0
  42. package/lib/cjs/activities/media/transcribeMediaWithGladia.js +82 -0
  43. package/lib/cjs/activities/media/transcribeMediaWithGladia.js.map +1 -0
  44. package/lib/cjs/activities/notifyWebhook.js +158 -0
  45. package/lib/cjs/activities/notifyWebhook.js.map +1 -0
  46. package/lib/cjs/activities/rateLimiter.js +30 -0
  47. package/lib/cjs/activities/rateLimiter.js.map +1 -0
  48. package/lib/cjs/activities/renditions/generateImageRendition.js +66 -0
  49. package/lib/cjs/activities/renditions/generateImageRendition.js.map +1 -0
  50. package/lib/cjs/activities/renditions/generateVideoRendition.js +200 -0
  51. package/lib/cjs/activities/renditions/generateVideoRendition.js.map +1 -0
  52. package/lib/cjs/activities/setDocumentStatus.js +15 -0
  53. package/lib/cjs/activities/setDocumentStatus.js.map +1 -0
  54. package/lib/cjs/conversion/TextractProcessor.js +417 -0
  55. package/lib/cjs/conversion/TextractProcessor.js.map +1 -0
  56. package/lib/cjs/conversion/image.js +149 -0
  57. package/lib/cjs/conversion/image.js.map +1 -0
  58. package/lib/cjs/conversion/markitdown.js +42 -0
  59. package/lib/cjs/conversion/markitdown.js.map +1 -0
  60. package/lib/cjs/conversion/mutool.js +147 -0
  61. package/lib/cjs/conversion/mutool.js.map +1 -0
  62. package/lib/cjs/conversion/pandoc.js +39 -0
  63. package/lib/cjs/conversion/pandoc.js.map +1 -0
  64. package/lib/cjs/dsl/conditions.js +81 -0
  65. package/lib/cjs/dsl/conditions.js.map +1 -0
  66. package/lib/cjs/dsl/dsl-workflow.js +343 -0
  67. package/lib/cjs/dsl/dsl-workflow.js.map +1 -0
  68. package/lib/cjs/dsl/dslProxyActivities.js +23 -0
  69. package/lib/cjs/dsl/dslProxyActivities.js.map +1 -0
  70. package/lib/cjs/dsl/projections.js +59 -0
  71. package/lib/cjs/dsl/projections.js.map +1 -0
  72. package/lib/cjs/dsl/setup/ActivityContext.js +122 -0
  73. package/lib/cjs/dsl/setup/ActivityContext.js.map +1 -0
  74. package/lib/cjs/dsl/setup/fetch/DataProvider.js +51 -0
  75. package/lib/cjs/dsl/setup/fetch/DataProvider.js.map +1 -0
  76. package/lib/cjs/dsl/setup/fetch/index.js +16 -0
  77. package/lib/cjs/dsl/setup/fetch/index.js.map +1 -0
  78. package/lib/cjs/dsl/setup/fetch/providers.js +67 -0
  79. package/lib/cjs/dsl/setup/fetch/providers.js.map +1 -0
  80. package/lib/cjs/dsl/test/test-child-workflow.js +10 -0
  81. package/lib/cjs/dsl/test/test-child-workflow.js.map +1 -0
  82. package/lib/cjs/dsl/validation.js +122 -0
  83. package/lib/cjs/dsl/validation.js.map +1 -0
  84. package/lib/cjs/dsl/vars.js +341 -0
  85. package/lib/cjs/dsl/vars.js.map +1 -0
  86. package/lib/cjs/dsl/walk.js +100 -0
  87. package/lib/cjs/dsl/walk.js.map +1 -0
  88. package/lib/cjs/dsl.js +20 -0
  89. package/lib/cjs/dsl.js.map +1 -0
  90. package/lib/cjs/errors.js +79 -0
  91. package/lib/cjs/errors.js.map +1 -0
  92. package/lib/cjs/index.js +56 -0
  93. package/lib/cjs/index.js.map +1 -0
  94. package/lib/cjs/iterative-generation/activities/extractToc.js +47 -0
  95. package/lib/cjs/iterative-generation/activities/extractToc.js.map +1 -0
  96. package/lib/cjs/iterative-generation/activities/finalizeOutput.js +72 -0
  97. package/lib/cjs/iterative-generation/activities/finalizeOutput.js.map +1 -0
  98. package/lib/cjs/iterative-generation/activities/generatePart.js +78 -0
  99. package/lib/cjs/iterative-generation/activities/generatePart.js.map +1 -0
  100. package/lib/cjs/iterative-generation/activities/generateToc.js +86 -0
  101. package/lib/cjs/iterative-generation/activities/generateToc.js.map +1 -0
  102. package/lib/cjs/iterative-generation/activities/index.js +12 -0
  103. package/lib/cjs/iterative-generation/activities/index.js.map +1 -0
  104. package/lib/cjs/iterative-generation/iterativeGenerationWorkflow.js +56 -0
  105. package/lib/cjs/iterative-generation/iterativeGenerationWorkflow.js.map +1 -0
  106. package/lib/cjs/iterative-generation/types.js +5 -0
  107. package/lib/cjs/iterative-generation/types.js.map +1 -0
  108. package/lib/cjs/iterative-generation/utils.js +121 -0
  109. package/lib/cjs/iterative-generation/utils.js.map +1 -0
  110. package/lib/cjs/package.json +3 -0
  111. package/lib/cjs/result-types.js +10 -0
  112. package/lib/cjs/result-types.js.map +1 -0
  113. package/lib/cjs/system/notifyWebhookWorkflow.js +53 -0
  114. package/lib/cjs/system/notifyWebhookWorkflow.js.map +1 -0
  115. package/lib/cjs/system/recalculateEmbeddingsWorkflow.js +33 -0
  116. package/lib/cjs/system/recalculateEmbeddingsWorkflow.js.map +1 -0
  117. package/lib/cjs/utils/auth.js +15 -0
  118. package/lib/cjs/utils/auth.js.map +1 -0
  119. package/lib/cjs/utils/blobs.js +64 -0
  120. package/lib/cjs/utils/blobs.js.map +1 -0
  121. package/lib/cjs/utils/chunks.js +14 -0
  122. package/lib/cjs/utils/chunks.js.map +1 -0
  123. package/lib/cjs/utils/client.js +31 -0
  124. package/lib/cjs/utils/client.js.map +1 -0
  125. package/lib/cjs/utils/expand-vars.js +33 -0
  126. package/lib/cjs/utils/expand-vars.js.map +1 -0
  127. package/lib/cjs/utils/memory.js +65 -0
  128. package/lib/cjs/utils/memory.js.map +1 -0
  129. package/lib/cjs/utils/renditions.js +88 -0
  130. package/lib/cjs/utils/renditions.js.map +1 -0
  131. package/lib/cjs/utils/storage.js +54 -0
  132. package/lib/cjs/utils/storage.js.map +1 -0
  133. package/lib/cjs/utils/tokens.js +38 -0
  134. package/lib/cjs/utils/tokens.js.map +1 -0
  135. package/lib/cjs/vars.js +20 -0
  136. package/lib/cjs/vars.js.map +1 -0
  137. package/lib/cjs/workflows.js +15 -0
  138. package/lib/cjs/workflows.js.map +1 -0
  139. package/lib/esm/activities/advanced/createDocumentTypeFromInteractionRun.js +30 -0
  140. package/lib/esm/activities/advanced/createDocumentTypeFromInteractionRun.js.map +1 -0
  141. package/lib/esm/activities/advanced/createOrUpdateDocumentFromInteractionRun.js +70 -0
  142. package/lib/esm/activities/advanced/createOrUpdateDocumentFromInteractionRun.js.map +1 -0
  143. package/lib/esm/activities/advanced/updateDocumentFromInteractionRun.js +16 -0
  144. package/lib/esm/activities/advanced/updateDocumentFromInteractionRun.js.map +1 -0
  145. package/lib/esm/activities/chunkDocument.js +82 -0
  146. package/lib/esm/activities/chunkDocument.js.map +1 -0
  147. package/lib/esm/activities/copyParentArtifacts.js +124 -0
  148. package/lib/esm/activities/copyParentArtifacts.js.map +1 -0
  149. package/lib/esm/activities/createDocumentFromOther.js +58 -0
  150. package/lib/esm/activities/createDocumentFromOther.js.map +1 -0
  151. package/lib/esm/activities/executeInteraction.js +190 -0
  152. package/lib/esm/activities/executeInteraction.js.map +1 -0
  153. package/lib/esm/activities/extractDocumentText.js +153 -0
  154. package/lib/esm/activities/extractDocumentText.js.map +1 -0
  155. package/lib/esm/activities/generateDocumentProperties.js +80 -0
  156. package/lib/esm/activities/generateDocumentProperties.js.map +1 -0
  157. package/lib/esm/activities/generateEmbeddings.js +254 -0
  158. package/lib/esm/activities/generateEmbeddings.js.map +1 -0
  159. package/lib/esm/activities/generateOrAssignContentType.js +122 -0
  160. package/lib/esm/activities/generateOrAssignContentType.js.map +1 -0
  161. package/lib/esm/activities/getObjectFromStore.js +17 -0
  162. package/lib/esm/activities/getObjectFromStore.js.map +1 -0
  163. package/lib/esm/activities/handleError.js +19 -0
  164. package/lib/esm/activities/handleError.js.map +1 -0
  165. package/lib/esm/activities/index-dsl.js +25 -0
  166. package/lib/esm/activities/index-dsl.js.map +1 -0
  167. package/lib/esm/activities/index.js +5 -0
  168. package/lib/esm/activities/index.js.map +1 -0
  169. package/lib/esm/activities/media/prepareAudio.js +200 -0
  170. package/lib/esm/activities/media/prepareAudio.js.map +1 -0
  171. package/lib/esm/activities/media/prepareVideo.js +390 -0
  172. package/lib/esm/activities/media/prepareVideo.js.map +1 -0
  173. package/lib/esm/activities/media/processPdfWithTextract.js +99 -0
  174. package/lib/esm/activities/media/processPdfWithTextract.js.map +1 -0
  175. package/lib/esm/activities/media/saveGladiaTranscription.js +78 -0
  176. package/lib/esm/activities/media/saveGladiaTranscription.js.map +1 -0
  177. package/lib/esm/activities/media/transcribeMediaWithGladia.js +79 -0
  178. package/lib/esm/activities/media/transcribeMediaWithGladia.js.map +1 -0
  179. package/lib/esm/activities/notifyWebhook.js +155 -0
  180. package/lib/esm/activities/notifyWebhook.js.map +1 -0
  181. package/lib/esm/activities/rateLimiter.js +27 -0
  182. package/lib/esm/activities/rateLimiter.js.map +1 -0
  183. package/lib/esm/activities/renditions/generateImageRendition.js +63 -0
  184. package/lib/esm/activities/renditions/generateImageRendition.js.map +1 -0
  185. package/lib/esm/activities/renditions/generateVideoRendition.js +194 -0
  186. package/lib/esm/activities/renditions/generateVideoRendition.js.map +1 -0
  187. package/lib/esm/activities/setDocumentStatus.js +12 -0
  188. package/lib/esm/activities/setDocumentStatus.js.map +1 -0
  189. package/lib/esm/conversion/TextractProcessor.js +410 -0
  190. package/lib/esm/conversion/TextractProcessor.js.map +1 -0
  191. package/lib/esm/conversion/image.js +143 -0
  192. package/lib/esm/conversion/image.js.map +1 -0
  193. package/lib/esm/conversion/markitdown.js +36 -0
  194. package/lib/esm/conversion/markitdown.js.map +1 -0
  195. package/lib/esm/conversion/mutool.js +139 -0
  196. package/lib/esm/conversion/mutool.js.map +1 -0
  197. package/lib/esm/conversion/pandoc.js +36 -0
  198. package/lib/esm/conversion/pandoc.js.map +1 -0
  199. package/lib/esm/dsl/conditions.js +75 -0
  200. package/lib/esm/dsl/conditions.js.map +1 -0
  201. package/lib/esm/dsl/dsl-workflow.js +336 -0
  202. package/lib/esm/dsl/dsl-workflow.js.map +1 -0
  203. package/lib/esm/dsl/dslProxyActivities.js +20 -0
  204. package/lib/esm/dsl/dslProxyActivities.js.map +1 -0
  205. package/lib/esm/dsl/projections.js +55 -0
  206. package/lib/esm/dsl/projections.js.map +1 -0
  207. package/lib/esm/dsl/setup/ActivityContext.js +117 -0
  208. package/lib/esm/dsl/setup/ActivityContext.js.map +1 -0
  209. package/lib/esm/dsl/setup/fetch/DataProvider.js +47 -0
  210. package/lib/esm/dsl/setup/fetch/DataProvider.js.map +1 -0
  211. package/lib/esm/dsl/setup/fetch/index.js +12 -0
  212. package/lib/esm/dsl/setup/fetch/index.js.map +1 -0
  213. package/lib/esm/dsl/setup/fetch/providers.js +61 -0
  214. package/lib/esm/dsl/setup/fetch/providers.js.map +1 -0
  215. package/lib/esm/dsl/test/test-child-workflow.js +5 -0
  216. package/lib/esm/dsl/test/test-child-workflow.js.map +1 -0
  217. package/lib/esm/dsl/validation.js +118 -0
  218. package/lib/esm/dsl/validation.js.map +1 -0
  219. package/lib/esm/dsl/vars.js +335 -0
  220. package/lib/esm/dsl/vars.js.map +1 -0
  221. package/lib/esm/dsl/walk.js +96 -0
  222. package/lib/esm/dsl/walk.js.map +1 -0
  223. package/lib/esm/dsl.js +4 -0
  224. package/lib/esm/dsl.js.map +1 -0
  225. package/lib/esm/errors.js +69 -0
  226. package/lib/esm/errors.js.map +1 -0
  227. package/lib/esm/index.js +38 -0
  228. package/lib/esm/index.js.map +1 -0
  229. package/lib/esm/iterative-generation/activities/extractToc.js +44 -0
  230. package/lib/esm/iterative-generation/activities/extractToc.js.map +1 -0
  231. package/lib/esm/iterative-generation/activities/finalizeOutput.js +69 -0
  232. package/lib/esm/iterative-generation/activities/finalizeOutput.js.map +1 -0
  233. package/lib/esm/iterative-generation/activities/generatePart.js +75 -0
  234. package/lib/esm/iterative-generation/activities/generatePart.js.map +1 -0
  235. package/lib/esm/iterative-generation/activities/generateToc.js +83 -0
  236. package/lib/esm/iterative-generation/activities/generateToc.js.map +1 -0
  237. package/lib/esm/iterative-generation/activities/index.js +5 -0
  238. package/lib/esm/iterative-generation/activities/index.js.map +1 -0
  239. package/lib/esm/iterative-generation/iterativeGenerationWorkflow.js +53 -0
  240. package/lib/esm/iterative-generation/iterativeGenerationWorkflow.js.map +1 -0
  241. package/lib/esm/iterative-generation/types.js +2 -0
  242. package/lib/esm/iterative-generation/types.js.map +1 -0
  243. package/lib/esm/iterative-generation/utils.js +112 -0
  244. package/lib/esm/iterative-generation/utils.js.map +1 -0
  245. package/lib/esm/result-types.js +7 -0
  246. package/lib/esm/result-types.js.map +1 -0
  247. package/lib/esm/system/notifyWebhookWorkflow.js +50 -0
  248. package/lib/esm/system/notifyWebhookWorkflow.js.map +1 -0
  249. package/lib/esm/system/recalculateEmbeddingsWorkflow.js +30 -0
  250. package/lib/esm/system/recalculateEmbeddingsWorkflow.js.map +1 -0
  251. package/lib/esm/utils/auth.js +8 -0
  252. package/lib/esm/utils/auth.js.map +1 -0
  253. package/lib/esm/utils/blobs.js +54 -0
  254. package/lib/esm/utils/blobs.js.map +1 -0
  255. package/lib/esm/utils/chunks.js +9 -0
  256. package/lib/esm/utils/chunks.js.map +1 -0
  257. package/lib/esm/utils/client.js +27 -0
  258. package/lib/esm/utils/client.js.map +1 -0
  259. package/lib/esm/utils/expand-vars.js +30 -0
  260. package/lib/esm/utils/expand-vars.js.map +1 -0
  261. package/lib/esm/utils/memory.js +55 -0
  262. package/lib/esm/utils/memory.js.map +1 -0
  263. package/lib/esm/utils/renditions.js +80 -0
  264. package/lib/esm/utils/renditions.js.map +1 -0
  265. package/lib/esm/utils/storage.js +45 -0
  266. package/lib/esm/utils/storage.js.map +1 -0
  267. package/lib/esm/utils/tokens.js +34 -0
  268. package/lib/esm/utils/tokens.js.map +1 -0
  269. package/lib/esm/vars.js +4 -0
  270. package/lib/esm/vars.js.map +1 -0
  271. package/lib/esm/workflows.js +8 -0
  272. package/lib/esm/workflows.js.map +1 -0
  273. package/lib/tsconfig.tsbuildinfo +1 -0
  274. package/lib/types/activities/advanced/createDocumentTypeFromInteractionRun.d.ts +17 -0
  275. package/lib/types/activities/advanced/createDocumentTypeFromInteractionRun.d.ts.map +1 -0
  276. package/lib/types/activities/advanced/createOrUpdateDocumentFromInteractionRun.d.ts +39 -0
  277. package/lib/types/activities/advanced/createOrUpdateDocumentFromInteractionRun.d.ts.map +1 -0
  278. package/lib/types/activities/advanced/updateDocumentFromInteractionRun.d.ts +19 -0
  279. package/lib/types/activities/advanced/updateDocumentFromInteractionRun.d.ts.map +1 -0
  280. package/lib/types/activities/chunkDocument.d.ts +33 -0
  281. package/lib/types/activities/chunkDocument.d.ts.map +1 -0
  282. package/lib/types/activities/copyParentArtifacts.d.ts +19 -0
  283. package/lib/types/activities/copyParentArtifacts.d.ts.map +1 -0
  284. package/lib/types/activities/createDocumentFromOther.d.ts +21 -0
  285. package/lib/types/activities/createDocumentFromOther.d.ts.map +1 -0
  286. package/lib/types/activities/executeInteraction.d.ts +61 -0
  287. package/lib/types/activities/executeInteraction.d.ts.map +1 -0
  288. package/lib/types/activities/extractDocumentText.d.ts +10 -0
  289. package/lib/types/activities/extractDocumentText.d.ts.map +1 -0
  290. package/lib/types/activities/generateDocumentProperties.d.ts +32 -0
  291. package/lib/types/activities/generateDocumentProperties.d.ts.map +1 -0
  292. package/lib/types/activities/generateEmbeddings.d.ts +53 -0
  293. package/lib/types/activities/generateEmbeddings.d.ts.map +1 -0
  294. package/lib/types/activities/generateOrAssignContentType.d.ts +44 -0
  295. package/lib/types/activities/generateOrAssignContentType.d.ts.map +1 -0
  296. package/lib/types/activities/getObjectFromStore.d.ts +14 -0
  297. package/lib/types/activities/getObjectFromStore.d.ts.map +1 -0
  298. package/lib/types/activities/handleError.d.ts +6 -0
  299. package/lib/types/activities/handleError.d.ts.map +1 -0
  300. package/lib/types/activities/index-dsl.d.ts +25 -0
  301. package/lib/types/activities/index-dsl.d.ts.map +1 -0
  302. package/lib/types/activities/index.d.ts +5 -0
  303. package/lib/types/activities/index.d.ts.map +1 -0
  304. package/lib/types/activities/media/prepareAudio.d.ts +25 -0
  305. package/lib/types/activities/media/prepareAudio.d.ts.map +1 -0
  306. package/lib/types/activities/media/prepareVideo.d.ts +30 -0
  307. package/lib/types/activities/media/prepareVideo.d.ts.map +1 -0
  308. package/lib/types/activities/media/processPdfWithTextract.d.ts +26 -0
  309. package/lib/types/activities/media/processPdfWithTextract.d.ts.map +1 -0
  310. package/lib/types/activities/media/saveGladiaTranscription.d.ts +14 -0
  311. package/lib/types/activities/media/saveGladiaTranscription.d.ts.map +1 -0
  312. package/lib/types/activities/media/transcribeMediaWithGladia.d.ts +19 -0
  313. package/lib/types/activities/media/transcribeMediaWithGladia.d.ts.map +1 -0
  314. package/lib/types/activities/notifyWebhook.d.ts +27 -0
  315. package/lib/types/activities/notifyWebhook.d.ts.map +1 -0
  316. package/lib/types/activities/rateLimiter.d.ts +11 -0
  317. package/lib/types/activities/rateLimiter.d.ts.map +1 -0
  318. package/lib/types/activities/renditions/generateImageRendition.d.ts +14 -0
  319. package/lib/types/activities/renditions/generateImageRendition.d.ts.map +1 -0
  320. package/lib/types/activities/renditions/generateVideoRendition.d.ts +15 -0
  321. package/lib/types/activities/renditions/generateVideoRendition.d.ts.map +1 -0
  322. package/lib/types/activities/setDocumentStatus.d.ts +15 -0
  323. package/lib/types/activities/setDocumentStatus.d.ts.map +1 -0
  324. package/lib/types/conversion/TextractProcessor.d.ts +45 -0
  325. package/lib/types/conversion/TextractProcessor.d.ts.map +1 -0
  326. package/lib/types/conversion/image.d.ts +13 -0
  327. package/lib/types/conversion/image.d.ts.map +1 -0
  328. package/lib/types/conversion/markitdown.d.ts +2 -0
  329. package/lib/types/conversion/markitdown.d.ts.map +1 -0
  330. package/lib/types/conversion/mutool.d.ts +19 -0
  331. package/lib/types/conversion/mutool.d.ts.map +1 -0
  332. package/lib/types/conversion/pandoc.d.ts +2 -0
  333. package/lib/types/conversion/pandoc.d.ts.map +1 -0
  334. package/lib/types/dsl/conditions.d.ts +2 -0
  335. package/lib/types/dsl/conditions.d.ts.map +1 -0
  336. package/lib/types/dsl/dsl-workflow.d.ts +5 -0
  337. package/lib/types/dsl/dsl-workflow.d.ts.map +1 -0
  338. package/lib/types/dsl/dslProxyActivities.d.ts +10 -0
  339. package/lib/types/dsl/dslProxyActivities.d.ts.map +1 -0
  340. package/lib/types/dsl/projections.d.ts +4 -0
  341. package/lib/types/dsl/projections.d.ts.map +1 -0
  342. package/lib/types/dsl/setup/ActivityContext.d.ts +17 -0
  343. package/lib/types/dsl/setup/ActivityContext.d.ts.map +1 -0
  344. package/lib/types/dsl/setup/fetch/DataProvider.d.ts +9 -0
  345. package/lib/types/dsl/setup/fetch/DataProvider.d.ts.map +1 -0
  346. package/lib/types/dsl/setup/fetch/index.d.ts +6 -0
  347. package/lib/types/dsl/setup/fetch/index.d.ts.map +1 -0
  348. package/lib/types/dsl/setup/fetch/providers.d.ts +25 -0
  349. package/lib/types/dsl/setup/fetch/providers.d.ts.map +1 -0
  350. package/lib/types/dsl/test/test-child-workflow.d.ts +4 -0
  351. package/lib/types/dsl/test/test-child-workflow.d.ts.map +1 -0
  352. package/lib/types/dsl/validation.d.ts +4 -0
  353. package/lib/types/dsl/validation.d.ts.map +1 -0
  354. package/lib/types/dsl/vars.d.ts +48 -0
  355. package/lib/types/dsl/vars.d.ts.map +1 -0
  356. package/lib/types/dsl/walk.d.ts +18 -0
  357. package/lib/types/dsl/walk.d.ts.map +1 -0
  358. package/lib/types/dsl.d.ts +4 -0
  359. package/lib/types/dsl.d.ts.map +1 -0
  360. package/lib/types/errors.d.ts +37 -0
  361. package/lib/types/errors.d.ts.map +1 -0
  362. package/lib/types/index.d.ts +37 -0
  363. package/lib/types/index.d.ts.map +1 -0
  364. package/lib/types/iterative-generation/activities/extractToc.d.ts +10 -0
  365. package/lib/types/iterative-generation/activities/extractToc.d.ts.map +1 -0
  366. package/lib/types/iterative-generation/activities/finalizeOutput.d.ts +3 -0
  367. package/lib/types/iterative-generation/activities/finalizeOutput.d.ts.map +1 -0
  368. package/lib/types/iterative-generation/activities/generatePart.d.ts +3 -0
  369. package/lib/types/iterative-generation/activities/generatePart.d.ts.map +1 -0
  370. package/lib/types/iterative-generation/activities/generateToc.d.ts +4 -0
  371. package/lib/types/iterative-generation/activities/generateToc.d.ts.map +1 -0
  372. package/lib/types/iterative-generation/activities/index.d.ts +5 -0
  373. package/lib/types/iterative-generation/activities/index.d.ts.map +1 -0
  374. package/lib/types/iterative-generation/iterativeGenerationWorkflow.d.ts +3 -0
  375. package/lib/types/iterative-generation/iterativeGenerationWorkflow.d.ts.map +1 -0
  376. package/lib/types/iterative-generation/types.d.ts +79 -0
  377. package/lib/types/iterative-generation/types.d.ts.map +1 -0
  378. package/lib/types/iterative-generation/utils.d.ts +26 -0
  379. package/lib/types/iterative-generation/utils.d.ts.map +1 -0
  380. package/lib/types/result-types.d.ts +22 -0
  381. package/lib/types/result-types.d.ts.map +1 -0
  382. package/lib/types/system/notifyWebhookWorkflow.d.ts +8 -0
  383. package/lib/types/system/notifyWebhookWorkflow.d.ts.map +1 -0
  384. package/lib/types/system/recalculateEmbeddingsWorkflow.d.ts +25 -0
  385. package/lib/types/system/recalculateEmbeddingsWorkflow.d.ts.map +1 -0
  386. package/lib/types/utils/auth.d.ts +4 -0
  387. package/lib/types/utils/auth.d.ts.map +1 -0
  388. package/lib/types/utils/blobs.d.ts +7 -0
  389. package/lib/types/utils/blobs.d.ts.map +1 -0
  390. package/lib/types/utils/chunks.d.ts +9 -0
  391. package/lib/types/utils/chunks.d.ts.map +1 -0
  392. package/lib/types/utils/client.d.ts +8 -0
  393. package/lib/types/utils/client.d.ts.map +1 -0
  394. package/lib/types/utils/expand-vars.d.ts +8 -0
  395. package/lib/types/utils/expand-vars.d.ts.map +1 -0
  396. package/lib/types/utils/memory.d.ts +8 -0
  397. package/lib/types/utils/memory.d.ts.map +1 -0
  398. package/lib/types/utils/renditions.d.ts +23 -0
  399. package/lib/types/utils/renditions.d.ts.map +1 -0
  400. package/lib/types/utils/storage.d.ts +16 -0
  401. package/lib/types/utils/storage.d.ts.map +1 -0
  402. package/lib/types/utils/tokens.d.ts +11 -0
  403. package/lib/types/utils/tokens.d.ts.map +1 -0
  404. package/lib/types/vars.d.ts +3 -0
  405. package/lib/types/vars.d.ts.map +1 -0
  406. package/lib/types/workflows.d.ts +8 -0
  407. package/lib/types/workflows.d.ts.map +1 -0
  408. package/lib/workflows-bundle.js +17213 -0
  409. package/package.json +146 -0
  410. package/src/activities/advanced/createDocumentTypeFromInteractionRun.ts +55 -0
  411. package/src/activities/advanced/createOrUpdateDocumentFromInteractionRun.ts +119 -0
  412. package/src/activities/advanced/updateDocumentFromInteractionRun.ts +35 -0
  413. package/src/activities/chunkDocument.ts +146 -0
  414. package/src/activities/copyParentArtifacts.ts +162 -0
  415. package/src/activities/createDocumentFromOther.ts +92 -0
  416. package/src/activities/executeInteraction.ts +300 -0
  417. package/src/activities/extractDocumentText.ts +205 -0
  418. package/src/activities/generateDocumentProperties.ts +120 -0
  419. package/src/activities/generateEmbeddings.ts +387 -0
  420. package/src/activities/generateOrAssignContentType.ts +218 -0
  421. package/src/activities/getObjectFromStore.ts +31 -0
  422. package/src/activities/handleError.ts +25 -0
  423. package/src/activities/index-dsl.ts +25 -0
  424. package/src/activities/index.ts +4 -0
  425. package/src/activities/media/prepareAudio.ts +334 -0
  426. package/src/activities/media/prepareVideo.ts +622 -0
  427. package/src/activities/media/processPdfWithTextract.ts +141 -0
  428. package/src/activities/media/saveGladiaTranscription.ts +128 -0
  429. package/src/activities/media/transcribeMediaWithGladia.ts +117 -0
  430. package/src/activities/notifyWebhook.test.ts +134 -0
  431. package/src/activities/notifyWebhook.ts +199 -0
  432. package/src/activities/rateLimiter.ts +41 -0
  433. package/src/activities/renditions/generateImageRendition.ts +111 -0
  434. package/src/activities/renditions/generateVideoRendition.ts +293 -0
  435. package/src/activities/setDocumentStatus.ts +25 -0
  436. package/src/conversion/TextractProcessor.ts +506 -0
  437. package/src/conversion/image.test.ts +118 -0
  438. package/src/conversion/image.ts +168 -0
  439. package/src/conversion/markitdown.ts +41 -0
  440. package/src/conversion/mutool.test.ts +74 -0
  441. package/src/conversion/mutool.ts +180 -0
  442. package/src/conversion/pandoc.test.ts +24 -0
  443. package/src/conversion/pandoc.ts +40 -0
  444. package/src/dsl/conditions.ts +76 -0
  445. package/src/dsl/dsl-workflow.test.ts +58 -0
  446. package/src/dsl/dsl-workflow.ts +397 -0
  447. package/src/dsl/dslProxyActivities.ts +38 -0
  448. package/src/dsl/ms.d.ts +11 -0
  449. package/src/dsl/projections.test.ts +159 -0
  450. package/src/dsl/projections.ts +72 -0
  451. package/src/dsl/setup/ActivityContext.ts +178 -0
  452. package/src/dsl/setup/fetch/DataProvider.ts +45 -0
  453. package/src/dsl/setup/fetch/index.ts +19 -0
  454. package/src/dsl/setup/fetch/providers.ts +67 -0
  455. package/src/dsl/test/test-child-workflow.ts +6 -0
  456. package/src/dsl/validation.test.ts +257 -0
  457. package/src/dsl/validation.ts +125 -0
  458. package/src/dsl/vars.test.ts +245 -0
  459. package/src/dsl/vars.ts +340 -0
  460. package/src/dsl/walk.test.ts +81 -0
  461. package/src/dsl/walk.ts +103 -0
  462. package/src/dsl/workflow-exec-child.test.ts +273 -0
  463. package/src/dsl/workflow-fetch.test.ts +138 -0
  464. package/src/dsl/workflow-import.test.ts +89 -0
  465. package/src/dsl/workflow.test.ts +122 -0
  466. package/src/dsl.ts +3 -0
  467. package/src/errors.ts +101 -0
  468. package/src/index.ts +41 -0
  469. package/src/iterative-generation/activities/extractToc.ts +63 -0
  470. package/src/iterative-generation/activities/finalizeOutput.ts +100 -0
  471. package/src/iterative-generation/activities/generatePart.ts +123 -0
  472. package/src/iterative-generation/activities/generateToc.ts +116 -0
  473. package/src/iterative-generation/activities/index.ts +4 -0
  474. package/src/iterative-generation/iterativeGenerationWorkflow.ts +68 -0
  475. package/src/iterative-generation/types.ts +99 -0
  476. package/src/iterative-generation/utils.ts +126 -0
  477. package/src/result-types.ts +25 -0
  478. package/src/system/notifyWebhookWorkflow.ts +70 -0
  479. package/src/system/recalculateEmbeddingsWorkflow.ts +41 -0
  480. package/src/utils/auth.ts +10 -0
  481. package/src/utils/blobs.ts +59 -0
  482. package/src/utils/chunks.ts +17 -0
  483. package/src/utils/client.ts +46 -0
  484. package/src/utils/expand-vars.ts +31 -0
  485. package/src/utils/memory.ts +61 -0
  486. package/src/utils/renditions.ts +127 -0
  487. package/src/utils/storage.ts +60 -0
  488. package/src/utils/tokens.ts +44 -0
  489. package/src/vars.ts +3 -0
  490. package/src/workflows.ts +7 -0
@@ -0,0 +1,120 @@
1
+ import { log } from "@temporalio/activity";
2
+ import { DSLActivityExecutionPayload, DSLActivitySpec } from "@vertesia/common";
3
+ import { setupActivity } from "../dsl/setup/ActivityContext.js";
4
+ import { TruncateSpec, truncByMaxTokens } from "../utils/tokens.js";
5
+ import { InteractionExecutionParams, executeInteractionFromActivity } from "./executeInteraction.js";
6
+
7
/** Interaction executed when the caller does not provide `interactionName`. */
const INT_EXTRACT_INFORMATION = "sys:ExtractInformation";

/**
 * Parameters of the `generateDocumentProperties` activity, on top of the
 * generic interaction execution parameters it extends.
 */
export interface GenerateDocumentPropertiesParams extends InteractionExecutionParams {
    /**
     * Not read directly by the activity; it is forwarded with the rest of the
     * params to the interaction execution.
     */
    typesHint?: string[];

    /**
     * Truncation spec applied to the document text before it is placed in the
     * prompt. The activity falls back to 30000 when this is not set.
     */
    truncate?: TruncateSpec;

    /** Interaction to execute; defaults to "sys:ExtractInformation". */
    interactionName?: string;

    /**
     * When true, a document without text is still processed, and PDF content
     * is referenced as an image input in addition to image content.
     */
    use_vision?: boolean;
}
19
/**
 * DSL activity spec for the `generateDocumentProperties` activity: the spec
 * name is fixed and the params are `GenerateDocumentPropertiesParams`.
 */
export interface GenerateDocumentProperties
    extends DSLActivitySpec<GenerateDocumentPropertiesParams> {
    name: "generateDocumentProperties";
}
22
+
23
/**
 * Runs an extraction interaction against a document and stores the result as
 * the document properties.
 *
 * Flow:
 *  1. Load the project, the document (with its text) and, when set, its type.
 *  2. Bail out with `failed` / `no-text` when there is no text, vision is not
 *     requested and the content is not an image.
 *  3. Bail out with `skipped` when the type is missing or has no object schema.
 *  4. Execute the interaction with the type schema as result schema.
 *  5. Update the document properties (plus `etag` and generation run info)
 *     with workflows suppressed. When the document had no text, a text is
 *     assembled from the extracted `title` and `description`.
 *
 * @param payload - DSL activity execution payload carrying the params.
 * @returns A status object: `failed`, `skipped` or `completed`.
 */
export async function generateDocumentProperties(
    payload: DSLActivityExecutionPayload<GenerateDocumentPropertiesParams>,
) {
    const context = await setupActivity<GenerateDocumentPropertiesParams>(payload);
    const { params, client, objectId } = context;
    const interactionName = params.interactionName ?? INT_EXTRACT_INFORMATION;

    const project = await context.fetchProject();

    const doc = await client.objects.retrieve(objectId, "+text");
    const type = doc.type ? await client.types.retrieve(doc.type.id) : undefined;

    // Nothing to work with: no text, no vision requested, and not an image.
    const hasImageContent = doc?.content?.type?.startsWith("image/");
    if (!doc?.text && !params.use_vision && !hasImageContent) {
        log.warn(`Object ${objectId} not found or text is empty`);
        return { status: "failed", error: "no-text" };
    }

    // Without a schema there is no target shape for the extraction.
    if (!type || !type.object_schema) {
        log.info(`Object ${objectId} has no schema`);
        return { document: objectId, status: "skipped", message: "no schema defined on type" };
    }

    // Text input, truncated with the caller's spec or the 30000 fallback.
    const content = doc.text
        ? truncByMaxTokens(doc.text, params.truncate || 30000)
        : undefined;

    // Image input: images always, PDFs only when vision is requested.
    const mimeType = doc.content?.type;
    let image: string | undefined;
    if (mimeType?.startsWith("image/")) {
        image = "store:" + doc.id;
    } else if (params.use_vision && mimeType?.startsWith("application/pdf")) {
        image = "store:" + doc.id;
    } else {
        log.info(`Object ${objectId} is not an image or pdf`);
    }

    const promptData = {
        content,
        image,
        human_context: project?.configuration?.human_context ?? undefined,
    };

    log.info(
        ` Extracting information from object ${objectId} with type ${type.name}`,
        payload.debug_mode ? { params } : undefined,
    );

    const executionParams = {
        ...params,
        include_previous_error: true,
        result_schema: type.object_schema,
        validate_result: type.strict_mode,
    };
    const infoRes = await executeInteractionFromActivity(
        client,
        interactionName,
        executionParams,
        promptData,
        payload.debug_mode ?? false,
    );

    log.info(`Extracted information from object ${objectId} with type ${type.name}`, { runId: infoRes.id });

    const extracted = infoRes.result.object();

    // Only synthesize a text when the document has none of its own.
    let generatedText: string | undefined;
    if (!doc.text) {
        let assembled = "";
        if (extracted.title) {
            assembled += extracted.title + "\n";
        }
        if (extracted.description) {
            assembled += extracted.description;
        }
        generatedText = assembled ? assembled : undefined;
    }

    await client.objects.update(
        doc.id,
        {
            properties: {
                ...extracted,
                etag: doc.text_etag,
            },
            text: generatedText,
            generation_run_info: {
                id: infoRes.id,
                date: new Date().toISOString(),
                model: infoRes.modelId,
            },
        },
        { suppressWorkflows: true },
    );

    return { status: "completed" };
}
@@ -0,0 +1,387 @@
1
+ import { EmbeddingsResult } from "@llumiverse/common";
2
+ import { log } from "@temporalio/activity";
3
+ import { VertesiaClient } from "@vertesia/client";
4
+ import {
5
+ ContentObject,
6
+ DSLActivityExecutionPayload,
7
+ DSLActivitySpec,
8
+ ImageRenditionFormat,
9
+ ProjectConfigurationEmbeddings,
10
+ SupportedEmbeddingTypes,
11
+ } from "@vertesia/common";
12
+ import { setupActivity } from "../dsl/setup/ActivityContext.js";
13
+ import { DocumentNotFoundError } from "../errors.js";
14
+ import { fetchBlobAsBase64, md5 } from "../utils/blobs.js";
15
+ import { DocPart } from "../utils/chunks.js";
16
+ import { countTokens } from "../utils/tokens.js";
17
+
18
/**
 * Parameters of the `generateEmbeddings` activity.
 *
 * NOTE(review): the activity in this file only destructures `force` and
 * `type`; `model`, `environment` and `parts` are declared here but are not
 * read by it — confirm whether they are consumed elsewhere.
 */
export interface GenerateEmbeddingsParams {
    /**
     * Model to use for embedding generation.
     * Documented fallback: the project's default model.
     */
    model?: string;

    /**
     * Environment to use for embedding generation.
     * Documented fallback: the project's default environment.
     */
    environment?: string;

    /**
     * When true, embeddings are regenerated even if the document already has
     * embeddings whose etag matches.
     */
    force?: boolean;

    /** Which kind of embedding to generate. */
    type: SupportedEmbeddingTypes;

    /** The DocParts to use for long documents. */
    parts?: DocPart[];
}
46
+
47
/**
 * DSL activity spec for the `generateEmbeddings` activity: the spec name is
 * fixed and the params are `GenerateEmbeddingsParams`.
 */
export interface GenerateEmbeddings extends DSLActivitySpec<GenerateEmbeddingsParams> {
    name: "generateEmbeddings";
}
51
+
52
/**
 * Activity entry point: generates embeddings of the requested type for the
 * target object and dispatches to the text/properties or image generator.
 *
 * @param payload - DSL activity execution payload; `params.type` selects the
 *   embedding type and `params.force` bypasses the etag-based skip.
 * @returns A status object (`skipped`, `failed` or `completed`) produced
 *   either here or by the type-specific generator.
 * @throws DocumentNotFoundError when the project, the embeddings configuration
 *   for the type, the document, or the document content is missing.
 * @throws Error when the embeddings configuration has no environment.
 */
export async function generateEmbeddings(
    payload: DSLActivityExecutionPayload<GenerateEmbeddingsParams>,
) {
    const { params, client, objectId, fetchProject } =
        await setupActivity<GenerateEmbeddingsParams>(payload);
    const { force, type } = params;

    // Validate the project first, then read its configuration exactly once.
    const projectData = await fetchProject();
    if (!projectData) {
        throw new DocumentNotFoundError("Project not found", [payload.project_id]);
    }

    const config = projectData.configuration.embeddings[type];
    if (!config) {
        throw new DocumentNotFoundError("Embeddings configuration not found", [
            objectId,
        ]);
    }

    if (!config.enabled) {
        log.info(
            `Embeddings generation disabled for type ${type} on project: ${projectData.name} (${projectData.namespace})`,
            { config },
        );
        return {
            id: objectId,
            status: "skipped",
            message: `Embeddings generation disabled for type ${type}`,
        };
    }

    log.info(`${type} embedding generation starting for object ${objectId}`, {
        force,
        config,
    });

    if (!config.environment) {
        throw new Error(
            "No environment found in project configuration. Set environment in project configuration to generate embeddings.",
        );
    }

    const document = await client.objects.retrieve(
        objectId,
        "+text +parts +embeddings +tokens +properties",
    );

    if (!document) {
        throw new DocumentNotFoundError("Document not found", [objectId]);
    }

    if (!document.content) {
        throw new DocumentNotFoundError("Document content not found", [objectId]);
    }

    const generatorArgs = { client, config, document, type, force };

    switch (type) {
        // Text and properties share the same text-based generator.
        case SupportedEmbeddingTypes.text:
        case SupportedEmbeddingTypes.properties:
            return await generateTextEmbeddings(generatorArgs);
        case SupportedEmbeddingTypes.image:
            return await generateImageEmbeddings(generatorArgs);
        default:
            return {
                id: objectId,
                status: "failed",
                message: `unsupported embedding type: ${type}`,
            };
    }
}
150
+
151
/** Arguments shared by the type-specific embedding generators in this file. */
interface ExecuteGenerateEmbeddingsParams {
    /** Document whose embeddings are generated. */
    document: ContentObject;
    /** Client used to call the embeddings endpoint and to store the result. */
    client: VertesiaClient;
    /** Embedding type being generated. */
    type: SupportedEmbeddingTypes;
    /** Project embeddings configuration for `type`. */
    config: ProjectConfigurationEmbeddings;
    /** NOTE(review): not destructured by either generator in this file — confirm whether still needed. */
    property?: string;
    /** When true, skip the etag comparison and always regenerate. */
    force?: boolean;
}
159
+
160
/**
 * Generates and stores `text` or `properties` embeddings for a document.
 *
 * The embedding input is `JSON.stringify(document[type])`. Generation is
 * skipped when an embedding with the same etag already exists (unless
 * `force` is set) and, for `text`, when the token count exceeds
 * `config.max_tokens` (8000 when unset).
 *
 * @returns A status object: `error`/`failed` on invalid input or empty
 *   result, `skipped`, or `completed` with the vector length in `len`.
 */
async function generateTextEmbeddings(
    { document, client, type, config, force }: ExecuteGenerateEmbeddingsParams
) {
    if (!document) {
        return { status: "error", message: "document is null or undefined" };
    }

    if (
        type !== SupportedEmbeddingTypes.text &&
        type !== SupportedEmbeddingTypes.properties
    ) {
        return {
            id: document.id,
            status: "failed",
            message: `unsupported embedding type: ${type}`,
        };
    }

    if (type === SupportedEmbeddingTypes.text && !document.text) {
        return { id: document.id, status: "failed", message: "no text found" };
    }
    if (type === SupportedEmbeddingTypes.properties && !document?.properties) {
        return {
            id: document.id,
            status: "failed",
            message: "no properties found",
        };
    }

    // The configured model is forwarded so text/properties embeddings honour
    // it the same way image embeddings do.
    const { environment, model } = config;

    // Compute text etag for comparison.
    // NOTE(review): the text etag is also used for `properties` embeddings, so
    // a properties-only change is not detected here — confirm this is intended.
    const textEtag = document.text_etag ?? (document.text ? md5(document.text) : undefined);

    // Skip if embeddings already exist with matching etag (unless force=true)
    const existingEmbedding = document.embeddings?.[type];
    if (!force && existingEmbedding?.etag && textEtag && existingEmbedding.etag === textEtag) {
        log.info(`Skipping ${type} embeddings for document ${document.id} - etag unchanged`);
        return {
            id: document.id,
            type,
            status: "skipped",
            message: "embeddings already exist with matching etag",
        };
    }

    // Count tokens if needed, do not rely on existing token count
    let tokenCount: number | undefined = undefined;
    if (type === SupportedEmbeddingTypes.text && document.text) {
        tokenCount = countTokens(document.text).count;
    }

    const maxTokens = config.max_tokens ?? 8000;

    // Only the text type is size-checked; oversized documents are skipped.
    if (
        type === SupportedEmbeddingTypes.text &&
        tokenCount !== undefined &&
        tokenCount > maxTokens
    ) {
        //TODO: Review strategy for large documents
        log.warn(
            `Document too large for ${type} embeddings generation, skipping (${tokenCount} tokens)`,
        );
        return {
            id: document.id,
            status: "skipped",
            message: `${type} embeddings generation, skipped for large document (${tokenCount} tokens)`,
        };
    }

    log.info(`Generating ${type} embeddings for document ${document.id}`);

    // NOTE(review): for `text` this JSON-encodes the string (quotes and
    // escapes included); kept as-is so new vectors stay comparable with
    // previously stored ones.
    const res = await generateEmbeddingsFromStudio(
        JSON.stringify(document[type]),
        environment,
        client,
        model,
    );
    if (!res || !res.values) {
        return {
            id: document.id,
            status: "failed",
            message: "no embeddings generated",
        };
    }

    log.info(`${type} embeddings generated for document ${document.id}`, {
        len: res.values.length,
    });
    await client.objects.setEmbedding(document.id, type, {
        values: res.values,
        model: res.model,
        etag: textEtag,
    });

    return {
        id: document.id,
        type,
        status: "completed",
        len: res.values.length,
    };
}
264
+
265
/**
 * Generates and stores image embeddings for a document whose content is an
 * image or a PDF, using a JPEG rendition of the document as input.
 *
 * Generation is skipped when an embedding with the same content etag already
 * exists, unless `force` is set.
 *
 * @returns A status object: `failed`, `skipped`, or `completed` with the
 *   vector length in `len`.
 * @throws Error when the rendition is still being generated.
 * @throws DocumentNotFoundError when the rendition failed or none is returned.
 */
async function generateImageEmbeddings({
    document,
    client,
    type,
    config,
    force,
}: ExecuteGenerateEmbeddingsParams) {
    log.info("Generating image embeddings for document " + document.id, {
        content: document.content,
    });

    const mimeType = document.content?.type;
    if (!mimeType?.startsWith("image/") && !mimeType?.includes("pdf")) {
        return {
            id: document.id,
            type,
            status: "failed",
            message: "content is not an image",
        };
    }

    // Use content etag for image change detection
    const contentEtag = document.content?.etag;

    // Skip if embeddings already exist with matching etag (unless force=true)
    const existingEmbedding = document.embeddings?.[type];
    if (!force && existingEmbedding?.etag && contentEtag && existingEmbedding.etag === contentEtag) {
        log.info(`Skipping ${type} embeddings for document ${document.id} - content etag unchanged`);
        return {
            id: document.id,
            type,
            status: "skipped",
            message: "embeddings already exist with matching etag",
        };
    }

    const { environment, model } = config;

    const resRnd = await client.store.objects.getRendition(document.id, {
        format: ImageRenditionFormat.jpeg,
        generate_if_missing: true,
        sign_url: true,
    });

    if (resRnd.status === "generating") {
        // The message says a retry is expected once the rendition is ready.
        throw new Error("Rendition is generating, will retry later");
    }
    if (
        resRnd.status === "failed" ||
        !resRnd.renditions ||
        !resRnd.renditions.length
    ) {
        throw new DocumentNotFoundError("Rendition retrieval failed", [document.id]);
    }

    // The guard above guarantees at least one rendition.
    const rendition = resRnd.renditions[0];
    const image = await fetchBlobAsBase64(client, rendition);

    let res;
    try {
        res = await client.environments.embeddings(environment, {
            image,
            model,
        });
    } catch (e) {
        log.error("Error generating embeddings for image", { error: e });
        throw e;
    }

    if (!res || !res.values) {
        return {
            id: document.id,
            status: "failed",
            message: "no embeddings generated",
        };
    }

    await client.objects.setEmbedding(
        document.id,
        SupportedEmbeddingTypes.image,
        {
            values: res.values,
            model: res.model,
            etag: contentEtag,
        },
    );

    return {
        id: document.id,
        type,
        status: "completed",
        len: res.values.length,
    };
}
366
+
367
/**
 * Requests embeddings for a text from the given environment.
 *
 * @param text - Text to embed.
 * @param env - Environment the embeddings request is sent to.
 * @param client - Client used to perform the request.
 * @param model - Optional model passed along with the request.
 * @returns The embeddings result returned by the client.
 * @throws Rethrows any request failure after logging it.
 */
async function generateEmbeddingsFromStudio(
    text: string,
    env: string,
    client: VertesiaClient,
    model?: string,
): Promise<EmbeddingsResult> {
    log.info(
        `Generating embeddings for text of ${text.length} chars with environment ${env}`,
    );

    // Start the request outside the try block so only its rejection is logged.
    const pending = client.environments.embeddings(env, { text, model });
    try {
        return await pending;
    } catch (e) {
        log.error("Error generating embeddings for text", { error: e });
        throw e;
    }
}