npm - @mastra/memory - Versions diffs - 1.7.0-alpha.1 → 1.8.0-alpha.0 - Mend

@mastra/memory 1.7.0-alpha.1 → 1.8.0-alpha.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (29)

package/CHANGELOG.md +40 -0
package/dist/{chunk-M7RAJAZ6.js → chunk-SUU4IAZJ.js} +307 -39
package/dist/chunk-SUU4IAZJ.js.map +1 -0
package/dist/{chunk-SHID74TI.cjs → chunk-YPFNHFT6.cjs} +307 -39
package/dist/chunk-YPFNHFT6.cjs.map +1 -0
package/dist/docs/SKILL.md +1 -1
package/dist/docs/assets/SOURCE_MAP.json +24 -24
package/dist/docs/references/docs-memory-observational-memory.md +23 -0
package/dist/docs/references/reference-memory-observational-memory.md +2 -0
package/dist/index.cjs +64 -368
package/dist/index.cjs.map +1 -1
package/dist/index.d.ts.map +1 -1
package/dist/index.js +64 -368
package/dist/index.js.map +1 -1
package/dist/{observational-memory-AU6MIH4Q.cjs → observational-memory-3HFM7PY2.cjs} +17 -17
package/dist/{observational-memory-AU6MIH4Q.cjs.map → observational-memory-3HFM7PY2.cjs.map} +1 -1
package/dist/{observational-memory-YRWU6CY3.js → observational-memory-XXD6E2SO.js} +3 -3
package/dist/{observational-memory-YRWU6CY3.js.map → observational-memory-XXD6E2SO.js.map} +1 -1
package/dist/processors/index.cjs +15 -15
package/dist/processors/index.js +1 -1
package/dist/processors/observational-memory/observational-memory.d.ts +21 -0
package/dist/processors/observational-memory/observational-memory.d.ts.map +1 -1
package/dist/processors/observational-memory/observer-agent.d.ts +14 -2
package/dist/processors/observational-memory/observer-agent.d.ts.map +1 -1
package/dist/processors/observational-memory/types.d.ts +7 -0
package/dist/processors/observational-memory/types.d.ts.map +1 -1
package/package.json +8 -8
package/dist/chunk-M7RAJAZ6.js.map +0 -1
package/dist/chunk-SHID74TI.cjs.map +0 -1

package/CHANGELOG.md CHANGED

@@ -1,5 +1,45 @@
 # @mastra/memory
+## 1.8.0-alpha.0
+### Minor Changes
+- Added observer context optimization for Observational Memory. The `observation.previousObserverTokens` field reduces Observer input token costs for long-running conversations: ([#13568](https://github.com/mastra-ai/mastra/pull/13568))
+  - **previousObserverTokens** (default: `2000`): Truncates the 'Previous Observations' section to a token budget, keeping the most recent observations and automatically replacing already-reflected lines with the buffered reflection summary. Set to `0` to omit previous observations entirely, or `false` to disable truncation and keep the full observation history.
+  ```typescript
+  const memory = new Memory({
+    options: {
+      observationalMemory: {
+        model: 'google/gemini-2.5-flash',
+        observation: {
+          previousObserverTokens: 10_000,
+        },
+      },
+    },
+  });
+  ```
+### Patch Changes
+- Updated dependencies [[`ea86967`](https://github.com/mastra-ai/mastra/commit/ea86967449426e0a3673253bd1c2c052a99d970d), [`db21c21`](https://github.com/mastra-ai/mastra/commit/db21c21a6ae5f33539262cc535342fa8757eb359), [`a1d6b9c`](https://github.com/mastra-ai/mastra/commit/a1d6b9c907c909f259632a7ea26e9e3c221fb691), [`11f5dbe`](https://github.com/mastra-ai/mastra/commit/11f5dbe9a1e7ad8ef3b1ea34fb4a9fa3631d1587), [`c562ec2`](https://github.com/mastra-ai/mastra/commit/c562ec228f1af63693e2984ffa9712aa6db8fea8), [`6751354`](https://github.com/mastra-ai/mastra/commit/67513544d1a64be891d9de7624d40aadc895d56e), [`c958cd3`](https://github.com/mastra-ai/mastra/commit/c958cd36627c1eea122ec241b2b15492977a263a), [`86f2426`](https://github.com/mastra-ai/mastra/commit/86f242631d252a172d2f9f9a2ea0feb8647a76b0), [`950eb07`](https://github.com/mastra-ai/mastra/commit/950eb07b7e7354629630e218d49550fdd299c452)]:
+  - @mastra/core@1.13.0-alpha.0
+  - @mastra/schema-compat@1.2.2-alpha.0
+## 1.7.0
+### Minor Changes
+- Observational Memory now performs local threshold checks with lower CPU and memory overhead. ([#14178](https://github.com/mastra-ai/mastra/pull/14178))
+  This update keeps the same multimodal thresholding behavior for image-aware inputs, so existing Observational Memory configurations continue to work without changes.
+### Patch Changes
+- Updated dependencies [[`709362d`](https://github.com/mastra-ai/mastra/commit/709362d67b80d8832729bbf9e449cad27640a5d2), [`cddf895`](https://github.com/mastra-ai/mastra/commit/cddf895532b8ee7f9fa814136ec672f53d37a9ba), [`9cede11`](https://github.com/mastra-ai/mastra/commit/9cede110abac9d93072e0521bb3c8bcafb9fdadf), [`a59f126`](https://github.com/mastra-ai/mastra/commit/a59f1269104f54726699c5cdb98c72c93606d2df), [`ed8fd75`](https://github.com/mastra-ai/mastra/commit/ed8fd75cbff03bb5e19971ddb30ab7040fc60447), [`c510833`](https://github.com/mastra-ai/mastra/commit/c5108333e8cbc19dafee5f8bfefbcb5ee935335c), [`c4c7dad`](https://github.com/mastra-ai/mastra/commit/c4c7dadfe2e4584f079f6c24bfabdb8c4981827f), [`787f3ac`](https://github.com/mastra-ai/mastra/commit/787f3ac08b3bb77413645a7ab5c447fa851708fd), [`45c3112`](https://github.com/mastra-ai/mastra/commit/45c31122666a0cc56b94727099fcb1871ed1b3f6), [`7296fcc`](https://github.com/mastra-ai/mastra/commit/7296fcc599c876a68699a71c7054a16d5aaf2337), [`00c27f9`](https://github.com/mastra-ai/mastra/commit/00c27f9080731433230a61be69c44e39a7a7b4c7), [`5e7c287`](https://github.com/mastra-ai/mastra/commit/5e7c28701f2bce795dd5c811e4c3060bf2ea2242), [`7e17d3f`](https://github.com/mastra-ai/mastra/commit/7e17d3f656fdda2aad47c4beb8c491636d70820c), [`ee19c9b`](https://github.com/mastra-ai/mastra/commit/ee19c9ba3ec3ed91feb214ad539bdc766c53bb01)]:
+  - @mastra/schema-compat@1.2.1
+  - @mastra/core@1.12.0
 ## 1.7.0-alpha.1
 ### Minor Changes

package/dist/{chunk-M7RAJAZ6.js → chunk-SUU4IAZJ.js} RENAMED

@@ -796,6 +796,11 @@ ${maybeTruncate(resultStr, maxLen)}`;
 ${maybeTruncate(argsStr, maxLen)}`;
       }
       const partType = part.type;
+      if (partType === "reasoning") {
+        const reasoning = part.reasoning;
+        if (reasoning) return maybeTruncate(reasoning, maxLen);
+        return "";
+      }
       if (partType === "image" || partType === "file") {
         const attachment = part;
         const inputAttachment = toObserverInputAttachmentPart(attachment);
@@ -810,6 +815,9 @@ ${maybeTruncate(argsStr, maxLen)}`;
   } else if (msg.content?.content) {
     content = maybeTruncate(msg.content.content, maxLen);
   }
+  if (!content && attachments.length === 0) {
+    return { text: "", attachments };
+  }
   return {
     text: `**${role}${timestampStr}:**
 ${content}`,
@@ -818,18 +826,21 @@ ${content}`,
 }
 function formatMessagesForObserver(messages, options) {
   const counter = { nextImageId: 1, nextFileId: 1 };
-  return messages.map((msg) => formatObserverMessage(msg, counter, options).text).join("\n\n---\n\n");
+  return messages.map((msg) => formatObserverMessage(msg, counter, options).text).filter(Boolean).join("\n\n---\n\n");
 }
 function buildObserverHistoryMessage(messages) {
   const counter = { nextImageId: 1, nextFileId: 1 };
   const content = [{ type: "text", text: "## New Message History to Observe\n\n" }];
-  messages.forEach((message, index) => {
+  let visibleCount = 0;
+  messages.forEach((message) => {
     const formatted = formatObserverMessage(message, counter);
-    content.push({ type: "text", text: formatted.text });
-    content.push(...formatted.attachments);
-    if (index < messages.length - 1) {
+    if (!formatted.text && formatted.attachments.length === 0) return;
+    if (visibleCount > 0) {
       content.push({ type: "text", text: "\n\n---\n\n" });
     }
+    content.push({ type: "text", text: formatted.text });
+    content.push(...formatted.attachments);
+    visibleCount++;
   });
   return {
     role: "user",
@@ -858,16 +869,22 @@ The following messages are from ${threadOrder.length} different conversation thr
   threadOrder.forEach((threadId, threadIndex) => {
     const messages = messagesByThread.get(threadId);
     if (!messages || messages.length === 0) return;
-    content.push({ type: "text", text: `<thread id="${threadId}">
-` });
-    messages.forEach((message, messageIndex) => {
+    const threadContent = [];
+    let visibleCount = 0;
+    messages.forEach((message) => {
       const formatted = formatObserverMessage(message, counter);
-      content.push({ type: "text", text: formatted.text });
-      content.push(...formatted.attachments);
-      if (messageIndex < messages.length - 1) {
-        content.push({ type: "text", text: "\n\n---\n\n" });
+      if (!formatted.text && formatted.attachments.length === 0) return;
+      if (visibleCount > 0) {
+        threadContent.push({ type: "text", text: "\n\n---\n\n" });
       }
+      threadContent.push({ type: "text", text: formatted.text });
+      threadContent.push(...formatted.attachments);
+      visibleCount++;
     });
+    if (visibleCount === 0) return;
+    content.push({ type: "text", text: `<thread id="${threadId}">
+` });
+    content.push(...threadContent);
     content.push({ type: "text", text: "\n</thread>" });
     if (threadIndex < threadOrder.length - 1) {
       content.push({ type: "text", text: "\n\n" });
@@ -878,7 +895,7 @@ The following messages are from ${threadOrder.length} different conversation thr
     content
   };
 }
-function buildMultiThreadObserverTaskPrompt(existingObservations) {
+function buildMultiThreadObserverTaskPrompt(existingObservations, threadOrder, priorMetadataByThread, wasTruncated) {
   let prompt = "";
   if (existingObservations) {
     prompt += `## Previous Observations
@@ -890,6 +907,39 @@ ${existingObservations}
 `;
     prompt += "Do not repeat these existing observations. Your new observations will be appended to the existing observations.\n\n";
   }
+  const hasTruncatedObservations = wasTruncated ?? false;
+  const threadMetadataLines = threadOrder?.map((threadId) => {
+    const metadata = priorMetadataByThread?.get(threadId);
+    if (!metadata?.currentTask && !metadata?.suggestedResponse) {
+      return "";
+    }
+    const lines = [`- thread ${threadId}`];
+    if (metadata.currentTask) {
+      lines.push(`  - prior current-task: ${metadata.currentTask}`);
+    }
+    if (metadata.suggestedResponse) {
+      lines.push(`  - prior suggested-response: ${metadata.suggestedResponse}`);
+    }
+    return lines.join("\n");
+  }).filter(Boolean).join("\n");
+  if (threadMetadataLines) {
+    prompt += `## Prior Thread Metadata
+${threadMetadataLines}
+`;
+    if (hasTruncatedObservations) {
+      prompt += `Previous observations were truncated for context budget reasons.
+`;
+      prompt += `The main agent still has full memory context outside this observer window.
+`;
+    }
+    prompt += `Use each thread's prior current-task and suggested-response as continuity hints, then update them based on that thread's new messages.
+---
+`;
+  }
   prompt += `## Your Task
 `;
@@ -978,6 +1028,32 @@ ${existingObservations}
 `;
     prompt += "Do not repeat these existing observations. Your new observations will be appended to the existing observations.\n\n";
   }
+  const hasTruncatedObservations = options?.wasTruncated ?? false;
+  const priorMetadataLines = [];
+  if (options?.priorCurrentTask) {
+    priorMetadataLines.push(`- prior current-task: ${options.priorCurrentTask}`);
+  }
+  if (options?.priorSuggestedResponse) {
+    priorMetadataLines.push(`- prior suggested-response: ${options.priorSuggestedResponse}`);
+  }
+  if (priorMetadataLines.length > 0) {
+    prompt += `## Prior Thread Metadata
+${priorMetadataLines.join("\n")}
+`;
+    if (hasTruncatedObservations) {
+      prompt += `Previous observations were truncated for context budget reasons.
+`;
+      prompt += `The main agent still has full memory context outside this observer window.
+`;
+    }
+    prompt += `Use the prior current-task and suggested-response as continuity hints, then update them based on the new messages.
+---
+`;
+  }
   prompt += `## Your Task
 `;
@@ -3271,6 +3347,7 @@ Async buffering is enabled by default \u2014 this opt-out is only needed when us
         config.observation?.blockAfter ?? (config.observation?.bufferTokens ?? OBSERVATIONAL_MEMORY_DEFAULTS.observation.bufferTokens ? 1.2 : void 0),
         config.observation?.messageTokens ?? OBSERVATIONAL_MEMORY_DEFAULTS.observation.messageTokens
       ),
+      previousObserverTokens: config.observation?.previousObserverTokens ?? 2e3,
       instruction: config.observation?.instruction
     };
     this.reflectionConfig = {
@@ -3307,7 +3384,8 @@ Async buffering is enabled by default \u2014 this opt-out is only needed when us
     return {
       scope: this.scope,
       observation: {
-        messageTokens: this.observationConfig.messageTokens
+        messageTokens: this.observationConfig.messageTokens,
+        previousObserverTokens: this.observationConfig.previousObserverTokens
       },
       reflection: {
         observationTokens: this.reflectionConfig.observationTokens
@@ -3387,7 +3465,8 @@ Async buffering is enabled by default \u2014 this opt-out is only needed when us
       scope: this.scope,
       observation: {
         messageTokens: this.observationConfig.messageTokens,
-        model: observationModelName
+        model: observationModelName,
+        previousObserverTokens: this.observationConfig.previousObserverTokens
       },
       reflection: {
         observationTokens: this.reflectionConfig.observationTokens,
@@ -3452,6 +3531,13 @@ Async buffering is enabled by default \u2014 this opt-out is only needed when us
         );
       }
     }
+    if (this.observationConfig.previousObserverTokens !== void 0 && this.observationConfig.previousObserverTokens !== false) {
+      if (!Number.isFinite(this.observationConfig.previousObserverTokens) || this.observationConfig.previousObserverTokens < 0) {
+        throw new Error(
+          `observation.previousObserverTokens must be false or a finite number >= 0, got ${this.observationConfig.previousObserverTokens}`
+        );
+      }
+    }
     if (this.reflectionConfig.bufferActivation !== void 0) {
       if (this.reflectionConfig.bufferActivation <= 0 || this.reflectionConfig.bufferActivation > 1) {
         throw new Error(
@@ -3849,6 +3935,141 @@ Async buffering is enabled by default \u2014 this opt-out is only needed when us
     }
     return result;
   }
+  /**
+   * Prepare optimized observer context by applying truncation and buffered-reflection inclusion.
+   *
+   * Returns the (possibly optimized) observations string to pass as "Previous Observations"
+   * to the observer prompt. When no optimization options are set, returns the input unchanged.
+   */
+  prepareObserverContext(existingObservations, record) {
+    const { previousObserverTokens } = this.observationConfig;
+    const tokenBudget = previousObserverTokens === void 0 || previousObserverTokens === false ? void 0 : previousObserverTokens;
+    if (tokenBudget === void 0) {
+      return { context: existingObservations, wasTruncated: false };
+    }
+    const bufferedReflection = record?.bufferedReflection && record?.reflectedObservationLineCount ? record.bufferedReflection : void 0;
+    if (!existingObservations) {
+      return { context: bufferedReflection, wasTruncated: false };
+    }
+    let observations = existingObservations;
+    if (bufferedReflection && record?.reflectedObservationLineCount) {
+      const allLines = observations.split("\n");
+      const unreflectedLines = allLines.slice(record.reflectedObservationLineCount);
+      const unreflectedContent = unreflectedLines.join("\n").trim();
+      observations = unreflectedContent ? `${bufferedReflection}
+${unreflectedContent}` : bufferedReflection;
+    }
+    let wasTruncated = false;
+    if (tokenBudget !== void 0) {
+      if (tokenBudget === 0) {
+        return { context: "", wasTruncated: true };
+      }
+      const currentTokens = this.tokenCounter.countObservations(observations);
+      if (currentTokens > tokenBudget) {
+        observations = this.truncateObservationsToTokenBudget(observations, tokenBudget);
+        wasTruncated = true;
+      }
+    }
+    return { context: observations, wasTruncated };
+  }
+  /**
+   * Truncate observations to fit within a token budget.
+   *
+   * Strategy:
+   * 1. Keep a raw tail of recent observations (end of block).
+   * 2. Add a truncation marker: [X observations truncated here], placed at the hidden gap.
+   * 3. Try to preserve important observations (🔴) from older context, newest-first.
+   * 4. Enforce that at least 50% of kept observations remain raw tail observations.
+   */
+  truncateObservationsToTokenBudget(observations, budget) {
+    if (budget === 0) {
+      return "";
+    }
+    const totalTokens = this.tokenCounter.countObservations(observations);
+    if (totalTokens <= budget) {
+      return observations;
+    }
+    const lines = observations.split("\n");
+    const totalCount = lines.length;
+    const lineTokens = new Array(totalCount);
+    const isImportant = new Array(totalCount);
+    for (let i = 0; i < totalCount; i++) {
+      lineTokens[i] = this.tokenCounter.countString(lines[i]);
+      isImportant[i] = lines[i].includes("\u{1F534}");
+    }
+    const suffixTokens = new Array(totalCount + 1);
+    suffixTokens[totalCount] = 0;
+    for (let i = totalCount - 1; i >= 0; i--) {
+      suffixTokens[i] = suffixTokens[i + 1] + lineTokens[i];
+    }
+    const headImportantIndexes = [];
+    const buildCandidateString = (tailStart, selectedImportantIndexes) => {
+      const keptIndexes = [
+        ...selectedImportantIndexes,
+        ...Array.from({ length: totalCount - tailStart }, (_, i) => tailStart + i)
+      ].sort((a, b) => a - b);
+      if (keptIndexes.length === 0) {
+        return `[${totalCount} observations truncated here]`;
+      }
+      const outputLines = [];
+      let previousKeptIndex = -1;
+      for (const keptIndex of keptIndexes) {
+        const hiddenCount = keptIndex - previousKeptIndex - 1;
+        if (hiddenCount === 1) {
+          outputLines.push(lines[previousKeptIndex + 1]);
+        } else if (hiddenCount > 1) {
+          outputLines.push(`[${hiddenCount} observations truncated here]`);
+        }
+        outputLines.push(lines[keptIndex]);
+        previousKeptIndex = keptIndex;
+      }
+      const trailingHiddenCount = totalCount - previousKeptIndex - 1;
+      if (trailingHiddenCount === 1) {
+        outputLines.push(lines[totalCount - 1]);
+      } else if (trailingHiddenCount > 1) {
+        outputLines.push(`[${trailingHiddenCount} observations truncated here]`);
+      }
+      return outputLines.join("\n");
+    };
+    const estimateKeptContentCost = (tailStart, selectedImportantIndexes) => {
+      let cost = suffixTokens[tailStart];
+      for (const idx of selectedImportantIndexes) {
+        cost += lineTokens[idx];
+      }
+      return cost;
+    };
+    let bestCandidate;
+    let bestImportantCount = -1;
+    let bestRawTailLength = -1;
+    for (let tailStart = 1; tailStart < totalCount; tailStart++) {
+      if (isImportant[tailStart - 1]) {
+        headImportantIndexes.push(tailStart - 1);
+      }
+      const rawTailLength = totalCount - tailStart;
+      const maxImportantByRatio = rawTailLength;
+      let importantToKeep = Math.min(headImportantIndexes.length, maxImportantByRatio);
+      const getSelectedImportant = (count) => count > 0 ? headImportantIndexes.slice(Math.max(0, headImportantIndexes.length - count)) : [];
+      while (importantToKeep > 0 && estimateKeptContentCost(tailStart, getSelectedImportant(importantToKeep)) > budget) {
+        importantToKeep -= 1;
+      }
+      if (estimateKeptContentCost(tailStart, getSelectedImportant(importantToKeep)) > budget) {
+        continue;
+      }
+      if (importantToKeep > bestImportantCount || importantToKeep === bestImportantCount && rawTailLength > bestRawTailLength) {
+        const candidate = buildCandidateString(tailStart, getSelectedImportant(importantToKeep));
+        if (this.tokenCounter.countObservations(candidate) <= budget) {
+          bestCandidate = candidate;
+          bestImportantCount = importantToKeep;
+          bestRawTailLength = rawTailLength;
+        }
+      }
+    }
+    if (!bestCandidate) {
+      return `[${totalCount} observations truncated here]`;
+    }
+    return bestCandidate;
+  }
   /**
    * Call the Observer agent to extract observations.
    */
@@ -3857,12 +4078,17 @@ Async buffering is enabled by default \u2014 this opt-out is only needed when us
     const observerMessages = [
       {
         role: "user",
-        content: buildObserverTaskPrompt(existingObservations, options)
+        content: buildObserverTaskPrompt(existingObservations, {
+          skipContinuationHints: options?.skipContinuationHints,
+          priorCurrentTask: options?.priorCurrentTask,
+          priorSuggestedResponse: options?.priorSuggestedResponse,
+          wasTruncated: options?.wasTruncated
+        })
       },
       buildObserverHistoryMessage(messagesToObserve)
     ];
     const doGenerate = async () => {
-      return this.withAbortCheck(async () => {
+      const result2 = await this.withAbortCheck(async () => {
         const streamResult = await agent.stream(observerMessages, {
           modelSettings: {
             ...this.observationConfig.modelSettings
@@ -3873,6 +4099,7 @@ Async buffering is enabled by default \u2014 this opt-out is only needed when us
         });
         return streamResult.getFullOutput();
       }, abortSignal);
+      return result2;
     };
     let result = await doGenerate();
     let parsed = parseObserverOutput(result.text);
@@ -3903,17 +4130,23 @@ Async buffering is enabled by default \u2014 this opt-out is only needed when us
    * Returns per-thread results with observations, currentTask, and suggestedContinuation,
    * plus the total usage for the batch.
    */
-  async callMultiThreadObserver(existingObservations, messagesByThread, threadOrder, abortSignal, requestContext) {
+  async callMultiThreadObserver(existingObservations, messagesByThread, threadOrder, priorMetadataByThread, abortSignal, requestContext, wasTruncated) {
+    const systemPrompt = buildObserverSystemPrompt(true, this.observationConfig.instruction);
     const agent = new Agent({
       id: "multi-thread-observer",
       name: "multi-thread-observer",
       model: this.observationConfig.model,
-      instructions: buildObserverSystemPrompt(true, this.observationConfig.instruction)
+      instructions: systemPrompt
     });
     const observerMessages = [
       {
         role: "user",
-        content: buildMultiThreadObserverTaskPrompt(existingObservations)
+        content: buildMultiThreadObserverTaskPrompt(
+          existingObservations,
+          threadOrder,
+          priorMetadataByThread,
+          wasTruncated
+        )
       },
       buildMultiThreadObserverHistoryMessage(messagesByThread, threadOrder)
     ];
@@ -3925,7 +4158,7 @@ Async buffering is enabled by default \u2014 this opt-out is only needed when us
       this.observedMessageIds.add(msg.id);
     }
     const doGenerate = async () => {
-      return this.withAbortCheck(async () => {
+      const result2 = await this.withAbortCheck(async () => {
         const streamResult = await agent.stream(observerMessages, {
           modelSettings: {
             ...this.observationConfig.modelSettings
@@ -3936,6 +4169,7 @@ Async buffering is enabled by default \u2014 this opt-out is only needed when us
         });
         return streamResult.getFullOutput();
       }, abortSignal);
+      return result2;
     };
     let result = await doGenerate();
     let parsed = parseMultiThreadObserverOutput(result.text);
@@ -5369,12 +5603,18 @@ ${newThreadSection}`;
           );
         }
       }
-      const result = await this.callObserver(
+      const { context: observerContext, wasTruncated } = this.prepareObserverContext(
         freshRecord?.activeObservations ?? record.activeObservations,
-        messagesToObserve,
-        abortSignal,
-        { requestContext }
+        freshRecord ?? record
       );
+      const thread = await this.storage.getThreadById({ threadId });
+      const threadOMMetadata = getThreadOMMetadata(thread?.metadata);
+      const result = await this.callObserver(observerContext, messagesToObserve, abortSignal, {
+        requestContext,
+        priorCurrentTask: threadOMMetadata?.currentTask,
+        priorSuggestedResponse: threadOMMetadata?.suggestedResponse,
+        wasTruncated
+      });
       const existingObservations = freshRecord?.activeObservations ?? record.activeObservations ?? "";
       let newObservations;
       if (this.scope === "resource") {
@@ -5391,16 +5631,16 @@ ${result.observations}` : result.observations;
       const newMessageIds = messagesToObserve.map((m) => m.id);
       const existingIds = freshRecord?.observedMessageIds ?? record.observedMessageIds ?? [];
       const allObservedIds = [.../* @__PURE__ */ new Set([...Array.isArray(existingIds) ? existingIds : [], ...newMessageIds])];
-      const thread = await this.storage.getThreadById({ threadId });
-      if (thread) {
-        const newMetadata = setThreadOMMetadata(thread.metadata, {
+      const threadForMetadata = await this.storage.getThreadById({ threadId });
+      if (threadForMetadata) {
+        const newMetadata = setThreadOMMetadata(threadForMetadata.metadata, {
           suggestedResponse: result.suggestedContinuation,
           currentTask: result.currentTask,
           lastObservedMessageCursor: this.getLastObservedMessageCursor(messagesToObserve)
         });
         await this.storage.updateThread({
           id: threadId,
-          title: thread.title ?? "",
+          title: threadForMetadata.title ?? "",
           metadata: newMetadata
         });
       }
@@ -5634,12 +5874,21 @@ ${result.observations}` : result.observations;
     const bufferedChunks = this.getBufferedChunks(record);
     const bufferedChunksText = bufferedChunks.map((c) => c.observations).join("\n\n");
     const combinedObservations = this.combineObservationsForBuffering(record.activeObservations, bufferedChunksText);
+    const { context: observerContext, wasTruncated } = this.prepareObserverContext(combinedObservations, record);
+    const thread = await this.storage.getThreadById({ threadId });
+    const threadOMMetadata = getThreadOMMetadata(thread?.metadata);
     const result = await this.callObserver(
-      combinedObservations,
+      observerContext,
       messagesToBuffer,
       void 0,
       // No abort signal for background ops
-      { skipContinuationHints: true, requestContext }
+      {
+        skipContinuationHints: true,
+        requestContext,
+        priorCurrentTask: threadOMMetadata?.currentTask,
+        priorSuggestedResponse: threadOMMetadata?.suggestedResponse,
+        wasTruncated
+      }
     );
     if (!result.observations) {
       omDebug(`[OM:doAsyncBufferedObservation] empty observations returned, skipping buffer storage`);
@@ -5706,8 +5955,6 @@ ${result.observations}` : result.observations;
     }
     return `${activeObservations}
---- BUFFERED (pending activation) ---
 ${bufferedObservations}`;
   }
   /**
@@ -6067,7 +6314,11 @@ ${unreflectedContent}` : freshRecord.bufferedReflection;
     const threadMetadataMap = /* @__PURE__ */ new Map();
     for (const thread of allThreads) {
       const omMetadata = getThreadOMMetadata(thread.metadata);
-      threadMetadataMap.set(thread.id, { lastObservedAt: omMetadata?.lastObservedAt });
+      threadMetadataMap.set(thread.id, {
+        lastObservedAt: omMetadata?.lastObservedAt,
+        currentTask: omMetadata?.currentTask,
+        suggestedResponse: omMetadata?.suggestedResponse
+      });
     }
     const messagesByThread = /* @__PURE__ */ new Map();
     for (const thread of allThreads) {
@@ -6147,7 +6398,12 @@ ${unreflectedContent}` : freshRecord.bufferedReflection;
           return;
         }
       }
-      const existingObservations = freshRecord?.activeObservations ?? record.activeObservations ?? "";
+      const rawExistingObservations = freshRecord?.activeObservations ?? record.activeObservations ?? "";
+      const { context: optimizedObservations, wasTruncated } = this.prepareObserverContext(
+        rawExistingObservations,
+        freshRecord ?? record
+      );
+      const existingObservations = optimizedObservations ?? rawExistingObservations;
       for (const threadId of threadOrder) {
         const msgs = messagesByThread.get(threadId);
         if (msgs && msgs.length > 0) {
@@ -6211,12 +6467,24 @@ ${unreflectedContent}` : freshRecord.bufferedReflection;
         batches.push(currentBatch);
       }
       const batchPromises = batches.map(async (batch) => {
+        const batchPriorMetadata = /* @__PURE__ */ new Map();
+        for (const threadId of batch.threadIds) {
+          const metadata = threadMetadataMap.get(threadId);
+          if (metadata?.currentTask || metadata?.suggestedResponse) {
+            batchPriorMetadata.set(threadId, {
+              currentTask: metadata.currentTask,
+              suggestedResponse: metadata.suggestedResponse
+            });
+          }
+        }
         const batchResult = await this.callMultiThreadObserver(
           existingObservations,
           batch.threadMap,
           batch.threadIds,
+          batchPriorMetadata,
           abortSignal,
-          requestContext
+          requestContext,
+          wasTruncated
         );
         return batchResult;
       });
@@ -6247,7 +6515,7 @@ ${unreflectedContent}` : freshRecord.bufferedReflection;
           result
         });
       }
-      let currentObservations = existingObservations;
+      let currentObservations = rawExistingObservations;
       let cycleObservationTokens = 0;
       for (const obsResult of observationResults) {
         if (!obsResult) continue;
@@ -6701,5 +6969,5 @@ ${unreflectedContent}` : freshRecord.bufferedReflection;
 };
 export { OBSERVATIONAL_MEMORY_DEFAULTS, OBSERVATION_CONTEXT_INSTRUCTIONS, OBSERVATION_CONTEXT_PROMPT, OBSERVATION_CONTINUATION_HINT, OBSERVER_SYSTEM_PROMPT, ObservationalMemory, TokenCounter, buildObserverPrompt, buildObserverSystemPrompt, extractCurrentTask, formatMessagesForObserver, hasCurrentTaskSection, optimizeObservationsForContext, parseObserverOutput };
-//# sourceMappingURL=chunk-M7RAJAZ6.js.map
-//# sourceMappingURL=chunk-M7RAJAZ6.js.map
+//# sourceMappingURL=chunk-SUU4IAZJ.js.map
+//# sourceMappingURL=chunk-SUU4IAZJ.js.map