npm - @botpress/zai - Versions diffs - 2.5.17 → 2.6.0 - Mend

@botpress/zai 2.5.17 → 2.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (32)

package/dist/context.js +14 -0
package/dist/index.d.ts +44 -1
package/dist/operations/answer.js +2 -1
package/dist/operations/check.js +2 -1
package/dist/operations/extract.js +2 -1
package/dist/operations/filter.js +2 -1
package/dist/operations/group.js +190 -2
package/dist/operations/label.js +2 -1
package/dist/operations/patch.js +2 -1
package/dist/operations/rate.js +2 -1
package/dist/operations/rewrite.js +2 -1
package/dist/operations/sort.js +2 -1
package/dist/operations/summarize.js +2 -1
package/dist/operations/text.js +2 -1
package/dist/zai.js +9 -0
package/e2e/data/cache.jsonl +70 -0
package/package.json +1 -1
package/src/context.ts +21 -0
package/src/index.ts +2 -1
package/src/operations/answer.ts +1 -0
package/src/operations/check.ts +1 -0
package/src/operations/extract.ts +1 -0
package/src/operations/filter.ts +1 -0
package/src/operations/group.ts +278 -0
package/src/operations/label.ts +1 -0
package/src/operations/patch.ts +1 -0
package/src/operations/rate.ts +1 -0
package/src/operations/rewrite.ts +1 -0
package/src/operations/sort.ts +1 -0
package/src/operations/summarize.ts +1 -0
package/src/operations/text.ts +1 -0
package/src/zai.ts +32 -0

package/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "@botpress/zai",
   "description": "Zui AI (zai) – An LLM utility library written on top of Zui and the Botpress API",
-  "version": "2.5.17",
+  "version": "2.6.0",
   "main": "./dist/index.js",
   "types": "./dist/index.d.ts",
   "exports": {

package/src/context.ts CHANGED Viewed

@@ -1,6 +1,8 @@
 import { Cognitive, Model, GenerateContentInput, GenerateContentOutput } from '@botpress/cognitive'
 import { Adapter } from './adapters/adapter'
 import { EventEmitter } from './emitter'
+import { fastHash } from './utils'
+import type { Memoizer } from './zai'
 type Meta = Awaited<ReturnType<Cognitive['generateContent']>>['meta']
@@ -16,6 +18,7 @@ export type ZaiContextProps = {
   modelId: string
   adapter?: Adapter
   source?: GenerateContentInput['meta']
+  memoizer?: Memoizer
 }
 /**
@@ -94,10 +97,13 @@ export class ZaiContext {
   public source?: GenerateContentInput['meta']
   private _eventEmitter: EventEmitter<ContextEvents>
+  private _memoizer: Memoizer
   public controller: AbortController = new AbortController()
   private _client: Cognitive
+  private static _noopMemoizer: Memoizer = { run: (_id, fn) => fn() }
   public constructor(props: ZaiContextProps) {
     this._client = props.client.clone()
     this.taskId = props.taskId
@@ -105,6 +111,7 @@ export class ZaiContext {
     this.adapter = props.adapter
     this.source = props.source
     this.taskType = props.taskType
+    this._memoizer = props.memoizer ?? ZaiContext._noopMemoizer
     this._eventEmitter = new EventEmitter<ContextEvents>()
     this._client.on('request', () => {
@@ -148,6 +155,20 @@ export class ZaiContext {
   public async generateContent<Out = string>(
     props: GenerateContentProps<Out>
+  ): Promise<{ meta: Meta; output: GenerateContentOutput; text: string | undefined; extracted: Out }> {
+    const memoKey = `zai:memo:${this.taskType}:${this.taskId || 'default'}:${fastHash(
+      JSON.stringify({
+        s: props.systemPrompt,
+        m: props.messages?.map((m) => ('content' in m ? m.content : '')),
+        st: props.stopSequences,
+      })
+    )}`
+    return this._memoizer.run(memoKey, () => this._generateContentInner(props))
+  }
+  private async _generateContentInner<Out = string>(
+    props: GenerateContentProps<Out>
   ): Promise<{ meta: Meta; output: GenerateContentOutput; text: string | undefined; extracted: Out }> {
     const maxRetries = Math.max(props.maxRetries ?? 3, 0)
     const transform = props.transform

package/src/index.ts CHANGED Viewed

@@ -1,4 +1,4 @@
-import { Zai } from './zai'
+import { Zai, type Memoizer } from './zai'
 import './operations/text'
 import './operations/rewrite'
@@ -14,3 +14,4 @@ import './operations/answer'
 import './operations/patch'
 export { Zai }
+export type { Memoizer }

package/src/operations/answer.ts CHANGED Viewed

@@ -816,6 +816,7 @@ Zai.prototype.answer = function <T>(
     taskId: this.taskId,
     taskType: 'zai.answer',
     adapter: this.adapter,
+    memoizer: this._resolveMemoizer(),
   })
   return new Response<AnswerResult<T>, AnswerResult<T>>(

package/src/operations/check.ts CHANGED Viewed

@@ -354,6 +354,7 @@ Zai.prototype.check = function (
     taskId: this.taskId,
     taskType: 'zai.check',
     adapter: this.adapter,
+    memoizer: this._resolveMemoizer(),
   })
   return new Response<

package/src/operations/extract.ts CHANGED Viewed

@@ -484,6 +484,7 @@ Zai.prototype.extract = function <S extends OfType<AnyObjectOrArray>>(
     taskId: this.taskId,
     taskType: 'zai.extract',
     adapter: this.adapter,
+    memoizer: this._resolveMemoizer(),
   })
   return new Response<S['_output']>(context, extract(input, schema, _options, context), (result) => result)

package/src/operations/filter.ts CHANGED Viewed

@@ -363,6 +363,7 @@ Zai.prototype.filter = function <T>(
     taskId: this.taskId,
     taskType: 'zai.filter',
     adapter: this.adapter,
+    memoizer: this._resolveMemoizer(),
   })
   return new Response<Array<T>>(context, filter(input, condition, _options, context), (result) => result)

package/src/operations/group.ts CHANGED Viewed

@@ -32,6 +32,8 @@ export type Options = {
   tokensPerElement?: number
   chunkLength?: number
   initialGroups?: Array<InitialGroup>
+  maxGroups?: number
+  minElements?: number
 }
 const _Options = z.object({
@@ -39,6 +41,8 @@ const _Options = z.object({
   tokensPerElement: z.number().min(1).max(100_000).optional().default(250),
   chunkLength: z.number().min(100).max(100_000).optional().default(16_000),
   initialGroups: z.array(_InitialGroup).optional().default([]),
+  maxGroups: z.number().min(2).optional(),
+  minElements: z.number().min(1).optional(),
 })
 declare module '@botpress/zai' {
@@ -52,6 +56,8 @@ declare module '@botpress/zai' {
      *
      * @param input - Array of items to group
      * @param options - Configuration for grouping behavior, instructions, and initial categories
+     * @param options.maxGroups - Maximum number of groups allowed (minimum 2). When set, groups are merged at the end until within limit.
+     * @param options.minElements - Minimum elements per group (minimum 1). Groups below this threshold have their elements redistributed via AI.
      * @returns Response with groups array (simplified to Record<groupLabel, items[]>)
      *
      * @example Automatic grouping
@@ -193,6 +199,18 @@ declare module '@botpress/zai' {
      * })
      * ```
      */
+    /**
+     * @example Limiting number of groups
+     * ```typescript
+     * const items = ['apple', 'banana', 'carrot', 'chicken', 'rice', 'bread', 'salmon', 'milk']
+     *
+     * const groups = await zai.group(items, {
+     *   instructions: 'Group by food type',
+     *   maxGroups: 3 // At most 3 groups — the AI merges related groups if exceeded (smallest groups are merged as a fallback)
+     * })
+     * // Guarantees no more than 3 groups in the result
+     * ```
+     */
     group<T>(input: Array<T>, options?: Options): Response<Array<Group<T>>, Record<string, T[]>>
   }
 }
@@ -609,6 +627,265 @@ ${END}`.trim()
     }
   }
+  // Phase 4: Merge groups if maxGroups is set (AI-driven)
+  if (options.maxGroups !== undefined) {
+    const nonEmptyGroupIds = () =>
+      Array.from(groupElements.entries())
+        .filter(([, s]) => s.size > 0)
+        .map(([id]) => id)
+    let currentIds = nonEmptyGroupIds()
+    if (currentIds.length > options.maxGroups) {
+      // Build a summary of each group: label + element count + sample elements
+      const groupSummaries = currentIds.map((gid, idx) => {
+        const info = groups.get(gid)!
+        const elemIndices = Array.from(groupElements.get(gid)!)
+        const sampleElements = elemIndices
+          .slice(0, 3)
+          .map((i) => tokenizer.truncate(elements[i].stringified, 60))
+          .join(', ')
+        return `■${idx}:${info.label} (${elemIndices.length} elements, e.g. ${sampleElements})■`
+      })
+      const mergeSystemPrompt = `You are consolidating groups into fewer, broader categories.
+${options.instructions ? `**Original instructions:** ${options.instructions}\n` : ''}
+**Task:** Merge ${currentIds.length} groups down to at most ${options.maxGroups} groups.
+Combine the most semantically related groups together. Give each merged group a new descriptive label.
+**Output Format:**
+For each input group (■0 to ■${currentIds.length - 1}), output which target label it maps to:
+■0:Merged Label■
+■1:Merged Label■
+${END}
+Use the EXACT SAME label for groups that should be merged together.`.trim()
+      const mergeUserPrompt = `**Current groups:**
+${groupSummaries.join('\n')}
+Merge into at most ${options.maxGroups} groups.
+${END}`.trim()
+      const { extracted: mergeAssignments } = await ctx.generateContent({
+        systemPrompt: mergeSystemPrompt,
+        stopSequences: [END],
+        messages: [{ type: 'text', role: 'user', content: mergeUserPrompt }],
+        transform: (text) => {
+          const assignments: Array<{ sourceIdx: number; label: string }> = []
+          const regex = /■(\d+):([^■]+)■/g
+          let match: RegExpExecArray | null
+          while ((match = regex.exec(text)) !== null) {
+            const idx = parseInt(match[1] ?? '', 10)
+            if (isNaN(idx) || idx < 0 || idx >= currentIds.length) continue
+            const label = (match[2] ?? '').trim()
+            if (!label) continue
+            assignments.push({ sourceIdx: idx, label: label.slice(0, 250) })
+          }
+          return assignments
+        },
+      })
+      // Build merge map: normalized merge label → list of source group IDs
+      const mergeMap = new Map<string, { label: string; sourceGroupIds: string[] }>()
+      for (const { sourceIdx, label } of mergeAssignments) {
+        const sourceGid = currentIds[sourceIdx]
+        if (!sourceGid) continue
+        const normalized = normalizeLabel(label)
+        if (!mergeMap.has(normalized)) {
+          mergeMap.set(normalized, { label, sourceGroupIds: [] })
+        }
+        mergeMap.get(normalized)!.sourceGroupIds.push(sourceGid)
+      }
+      // Apply merges: for each merge target, pick the first source group as the target
+      // and move all elements from other source groups into it
+      for (const [, { label, sourceGroupIds }] of mergeMap) {
+        if (sourceGroupIds.length <= 1) continue
+        const targetGid = sourceGroupIds[0]
+        const targetSet = groupElements.get(targetGid)!
+        // Update label on the target group
+        const targetInfo = groups.get(targetGid)!
+        targetInfo.label = label
+        targetInfo.normalizedLabel = normalizeLabel(label)
+        for (let i = 1; i < sourceGroupIds.length; i++) {
+          const sourceGid = sourceGroupIds[i]
+          const sourceSet = groupElements.get(sourceGid)!
+          sourceSet.forEach((elemIdx) => targetSet.add(elemIdx))
+          sourceSet.clear()
+        }
+      }
+      // Safety: if LLM still produced too many groups, fall back to merging smallest pairs
+      currentIds = nonEmptyGroupIds()
+      while (currentIds.length > options.maxGroups) {
+        currentIds.sort((a, b) => groupElements.get(a)!.size - groupElements.get(b)!.size)
+        const sourceSet = groupElements.get(currentIds[0])!
+        const targetSet = groupElements.get(currentIds[1])!
+        for (const elemIdx of sourceSet) {
+          targetSet.add(elemIdx)
+        }
+        sourceSet.clear()
+        currentIds = nonEmptyGroupIds()
+      }
+    }
+  }
+  // Phase 5: Redistribute undersized groups if minElements is set
+  // Reuses processChunk so orphans see the valid groups as available buckets
+  if (options.minElements !== undefined && options.minElements > 1) {
+    const getNonEmptyGroupIds = () =>
+      Array.from(groupElements.entries())
+        .filter(([, s]) => s.size > 0)
+        .map(([id]) => id)
+    // Collect orphan elements from all undersized groups
+    const orphanIndices: number[] = []
+    for (const gid of getNonEmptyGroupIds()) {
+      const elemSet = groupElements.get(gid)!
+      if (elemSet.size > 0 && elemSet.size < options.minElements) {
+        for (const idx of elemSet) {
+          orphanIndices.push(idx)
+        }
+        elemSet.clear()
+      }
+    }
+    if (orphanIndices.length > 0) {
+      // Valid groups = everything that's still non-empty (i.e. at or above minElements)
+      const validGroupIds = getNonEmptyGroupIds()
+      // Chunk orphans and run them through processChunk with only valid groups visible
+      const orphanChunks: number[][] = []
+      let currentOrphanChunk: number[] = []
+      let currentOrphanTokens = 0
+      for (const elemIdx of orphanIndices) {
+        const elem = elements[elemIdx]
+        const truncated = tokenizer.truncate(elem.stringified, options.tokensPerElement)
+        const elemTokens = tokenizer.count(truncated)
+        if (
+          (currentOrphanTokens + elemTokens > TOKENS_FOR_ELEMENTS_MAX ||
+            currentOrphanChunk.length >= MAX_ELEMENTS_PER_CHUNK) &&
+          currentOrphanChunk.length > 0
+        ) {
+          orphanChunks.push(currentOrphanChunk)
+          currentOrphanChunk = []
+          currentOrphanTokens = 0
+        }
+        currentOrphanChunk.push(elemIdx)
+        currentOrphanTokens += elemTokens
+      }
+      if (currentOrphanChunk.length > 0) {
+        orphanChunks.push(currentOrphanChunk)
+      }
+      // Process orphan chunks against valid groups (reuses the same processChunk as Phase 1)
+      const orphanResults = await Promise.all(
+        orphanChunks.map((chunk) =>
+          elementLimit(async () => {
+            // If there are valid groups, chunk them; otherwise pass empty so LLM creates new groups
+            const groupChunksForOrphans = validGroupIds.length > 0 ? getGroupChunks() : [[]]
+            const allAssignments = await Promise.all(
+              groupChunksForOrphans
+                .filter((gc) => gc.length === 0 || gc.some((gid) => validGroupIds.includes(gid)))
+                .map((groupChunk) => {
+                  // Only show valid groups (exclude the orphaned/undersized ones)
+                  const filteredGroupChunk = groupChunk.filter((gid) => validGroupIds.includes(gid))
+                  return groupLimit(() => processChunk(chunk, filteredGroupChunk))
+                })
+            )
+            return allAssignments.flat()
+          })
+        )
+      )
+      // Apply assignments
+      const flatAssignments = orphanResults.flat()
+      for (const { elementIndex, label } of flatAssignments) {
+        const normalized = normalizeLabel(label)
+        let groupId = labelToGroupId.get(normalized)
+        if (!groupId) {
+          groupId = `group_${groupIdCounter++}`
+          groups.set(groupId, { id: groupId, label, normalizedLabel: normalized })
+          groupElements.set(groupId, new Set())
+          labelToGroupId.set(normalized, groupId)
+        }
+        groupElements.get(groupId)!.add(elementIndex)
+      }
+      // Safety: any orphans the LLM missed get placed into the largest group
+      const isAssigned = (idx: number) => {
+        for (const [, elemSet] of groupElements) {
+          if (elemSet.has(idx)) return true
+        }
+        return false
+      }
+      const unassigned = orphanIndices.filter((idx) => !isAssigned(idx))
+      const placeIntoLargest = (indices: number[]) => {
+        const allNonEmpty = getNonEmptyGroupIds()
+        if (allNonEmpty.length === 0) return
+        const largestGid = allNonEmpty.reduce((a, b) =>
+          groupElements.get(a)!.size >= groupElements.get(b)!.size ? a : b
+        )
+        for (const idx of indices) {
+          groupElements.get(largestGid)!.add(idx)
+        }
+      }
+      if (unassigned.length > 0) {
+        placeIntoLargest(unassigned)
+      }
+      // Second pass: if any groups are still undersized after redistribution,
+      // merge their elements into the largest group
+      const mergeUndersizedGroups = () => {
+        const allNonEmpty = getNonEmptyGroupIds()
+        if (allNonEmpty.length <= 1) return false
+        const largestGid = allNonEmpty.reduce((a, b) =>
+          groupElements.get(a)!.size >= groupElements.get(b)!.size ? a : b
+        )
+        const targetSet = groupElements.get(largestGid)!
+        let merged = false
+        for (const gid of allNonEmpty) {
+          if (gid === largestGid) continue
+          const elemSet = groupElements.get(gid)!
+          if (elemSet.size > 0 && elemSet.size < options.minElements) {
+            elemSet.forEach((idx) => targetSet.add(idx))
+            elemSet.clear()
+            merged = true
+          }
+        }
+        return merged
+      }
+      while (mergeUndersizedGroups()) {
+        // keep merging until no undersized groups remain
+      }
+    }
+  }
   // Build final result
   const result: Array<Group<T>> = []
@@ -678,6 +955,7 @@ Zai.prototype.group = function <T>(
     taskId: this.taskId,
     taskType: 'zai.group',
     adapter: this.adapter,
+    memoizer: this._resolveMemoizer(),
   })
   return new Response<Array<Group<T>>, Record<string, T[]>>(context, group(input, _options, context), (result) => {

package/src/operations/label.ts CHANGED Viewed

@@ -542,6 +542,7 @@ Zai.prototype.label = function <T extends string>(
     taskId: this.taskId,
     taskType: 'zai.label',
     adapter: this.adapter,
+    memoizer: this._resolveMemoizer(),
   })
   return new Response<

package/src/operations/patch.ts CHANGED Viewed

@@ -650,6 +650,7 @@ Zai.prototype.patch = function (
     taskId: this.taskId,
     taskType: 'zai.patch',
     adapter: this.adapter,
+    memoizer: this._resolveMemoizer(),
   })
   return new Response<Array<File>>(context, patch(files, instructions, _options, context), (result) => result)

package/src/operations/rate.ts CHANGED Viewed

@@ -611,6 +611,7 @@ Zai.prototype.rate = function <T, I extends RatingInstructions>(
     taskId: this.taskId,
     taskType: 'zai.rate',
     adapter: this.adapter,
+    memoizer: this._resolveMemoizer(),
   })
   return new Response<Array<RatingResult<I>>, Array<SimplifiedRatingResult<I>>>(

package/src/operations/rewrite.ts CHANGED Viewed

@@ -277,6 +277,7 @@ Zai.prototype.rewrite = function (this: Zai, original: string, prompt: string, _
     taskId: this.taskId,
     taskType: 'zai.rewrite',
     adapter: this.adapter,
+    memoizer: this._resolveMemoizer(),
   })
   return new Response<string>(context, rewrite(original, prompt, _options, context), (result) => result)

package/src/operations/sort.ts CHANGED Viewed

@@ -800,6 +800,7 @@ Zai.prototype.sort = function <T>(
     taskId: this.taskId,
     taskType: 'zai.sort',
     adapter: this.adapter,
+    memoizer: this._resolveMemoizer(),
   })
   return new Response<Array<T>, Array<T>>(

package/src/operations/summarize.ts CHANGED Viewed

@@ -306,6 +306,7 @@ Zai.prototype.summarize = function (this: Zai, original, _options): Response<str
     taskId: this.taskId,
     taskType: 'summarize',
     adapter: this.adapter,
+    memoizer: this._resolveMemoizer(),
   })
   return new Response<string, string>(context, summarize(original, options, context), (value) => value)

package/src/operations/text.ts CHANGED Viewed

@@ -135,6 +135,7 @@ Zai.prototype.text = function (this: Zai, prompt: string, _options?: Options): R
     taskId: this.taskId,
     taskType: 'zai.text',
     adapter: this.adapter,
+    memoizer: this._resolveMemoizer(),
   })
   return new Response<string>(context, text(prompt, _options, context), (result) => result)

package/src/zai.ts CHANGED Viewed

@@ -8,6 +8,17 @@ import { Adapter } from './adapters/adapter'
 import { TableAdapter } from './adapters/botpress-table'
 import { MemoryAdapter } from './adapters/memory'
+/**
+ * A memoizer that caches the result of async operations by a unique key.
+ *
+ * When used with the Botpress ADK workflow `step` function, this enables
+ * Zai operations to resume where they left off if a workflow is interrupted.
+ *
+ */
+export type Memoizer = {
+  run: <T>(id: string, fn: () => Promise<T>) => Promise<T>
+}
 /**
  * Active learning configuration for improving AI operations over time.
  *
@@ -86,6 +97,16 @@ type ZaiConfig = {
   activeLearning?: ActiveLearning
   /** Namespace for organizing tasks (default: 'zai') */
   namespace?: string
+  /**
+   * Memoizer (or factory returning one) for caching cognitive call results.
+   *
+   * When provided, all LLM calls are wrapped in the memoizer, allowing results
+   * to be cached and replayed. This is useful for resuming workflow runs where
+   * Zai operations have already completed their cognitive calls.
+   *
+   * If a factory function is provided, it is called once per Zai operation invocation.
+   */
+  memoize?: Memoizer | (() => Memoizer)
 }
 const _ZaiConfig = z.object({
@@ -195,6 +216,7 @@ export class Zai {
   protected namespace: string
   protected adapter: Adapter
   protected activeLearning: ActiveLearning
+  protected _memoize?: Memoizer | (() => Memoizer)
   /**
    * Creates a new Zai instance with the specified configuration.
@@ -236,6 +258,8 @@ export class Zai {
           tableName: parsed.activeLearning.tableName,
         })
       : new MemoryAdapter([])
+    this._memoize = config.memoize
   }
   /** @internal */
@@ -250,6 +274,14 @@ export class Zai {
     })
   }
+  /** @internal */
+  protected _resolveMemoizer(): Memoizer | undefined {
+    if (!this._memoize) {
+      return undefined
+    }
+    return typeof this._memoize === 'function' ? this._memoize() : this._memoize
+  }
   protected async getTokenizer() {
     Zai.tokenizer ??= await (async () => {
       while (!getWasmTokenizer) {