@miriad-systems/nuum 0.1.5 → 0.1.6

This diff shows the changes between publicly released versions of the package as they appear in their respective public registries, and is provided for informational purposes only.
Files changed (2)
  1. package/dist/index.js +66 -24
  2. package/package.json +2 -2
package/dist/index.js CHANGED
@@ -31765,6 +31765,27 @@ Please check the tool's parameter schema and try again with correct arguments.`;
     };
   };
 }
+function prepareMessages(messages, system, cacheSystemPrompt) {
+  if (!system) {
+    return { messages, system: undefined };
+  }
+  if (!cacheSystemPrompt) {
+    return { messages, system };
+  }
+  const systemMessage = {
+    role: "system",
+    content: system,
+    providerOptions: {
+      anthropic: {
+        cacheControl: { type: "ephemeral" }
+      }
+    }
+  };
+  return {
+    messages: [systemMessage, ...messages],
+    system: undefined
+  };
+}
 function prepareTools2(tools) {
   if (!tools)
     return;
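
Note: prepareMessages is the system-prompt half of the new Anthropic prompt-caching support. The AI SDK's top-level system option is a plain string and cannot carry provider options, which appears to be why the helper rewrites it as an explicit system message with a cacheControl breakpoint. A minimal sketch of the resulting request, assuming the Vercel AI SDK with the @ai-sdk/anthropic provider (model id and prompt text are illustrative, not taken from this package):

import { generateText } from "ai";
import { anthropic } from "@ai-sdk/anthropic";

const result = await generateText({
  model: anthropic("claude-3-5-sonnet-latest"), // placeholder model id
  messages: [
    {
      role: "system",
      content: "You are a coding assistant with persistent memory.",
      // Anthropic caches the request prefix up to this breakpoint;
      // prefixes below the provider's minimum token length are not cached.
      providerOptions: {
        anthropic: { cacheControl: { type: "ephemeral" } }
      }
    },
    { role: "user", content: "Summarize the last session." }
  ]
});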
@@ -31796,37 +31817,41 @@ Please check the tool's parameter schema and try again with correct arguments.`;
   return prepared;
 }
 async function generate(options) {
+  const { messages, system } = prepareMessages(options.messages, options.system, options.cacheSystemPrompt ?? false);
   log3.debug("generate", {
     model: options.model.modelId,
-    messageCount: options.messages.length,
-    hasTools: !!options.tools
+    messageCount: messages.length,
+    hasTools: !!options.tools,
+    cacheSystemPrompt: options.cacheSystemPrompt ?? false
   });
   return generateText({
     model: options.model,
-    messages: options.messages,
+    messages,
     tools: prepareTools2(options.tools),
     maxTokens: options.maxTokens,
     temperature: options.temperature,
     abortSignal: options.abortSignal,
-    system: options.system,
+    system,
     experimental_repairToolCall: createToolCallRepairFunction()
   });
 }
 Provider.generate = generate;
 async function stream(options) {
+  const { messages, system } = prepareMessages(options.messages, options.system, options.cacheSystemPrompt ?? false);
   log3.debug("stream", {
     model: options.model.modelId,
-    messageCount: options.messages.length,
-    hasTools: !!options.tools
+    messageCount: messages.length,
+    hasTools: !!options.tools,
+    cacheSystemPrompt: options.cacheSystemPrompt ?? false
   });
   return streamText({
     model: options.model,
-    messages: options.messages,
+    messages,
     tools: prepareTools2(options.tools),
     maxTokens: options.maxTokens,
     temperature: options.temperature,
     abortSignal: options.abortSignal,
-    system: options.system,
+    system,
     experimental_repairToolCall: createToolCallRepairFunction()
   });
 }
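
Note: both generate and stream now run their inputs through prepareMessages. The flag defaults to false via the ?? false fallback, so callers that never pass cacheSystemPrompt get the old behavior unchanged. A hypothetical opt-in call (names match the diff; values are illustrative):

const response = await Provider.generate({
  model,
  system: systemPrompt,
  messages,
  cacheSystemPrompt: true // move the system prompt into a cache-marked message
});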
@@ -34330,7 +34355,6 @@ function estimateTokens(text3) {
 async function buildSystemPrompt(storage) {
   const identity = await storage.ltm.read("identity");
   const behavior = await storage.ltm.read("behavior");
-  const present = await storage.present.get();
   let prompt = `You are a coding assistant with persistent memory.
 
 Your memory spans across conversations, allowing you to remember past decisions, track ongoing projects, and learn user preferences.
@@ -34350,19 +34374,6 @@ ${behavior.body}
 
 `;
   }
-  prompt += `<present_state>
-<mission>${present.mission ?? "(none)"}</mission>
-<status>${present.status ?? "(none)"}</status>
-<tasks>
-`;
-  for (const task of present.tasks) {
-    prompt += `  <task status="${task.status}">${task.content}</task>
-`;
-  }
-  prompt += `</tasks>
-</present_state>
-
-`;
   prompt += `You have access to tools for file operations (read, write, edit, bash, glob, grep).
 Use tools to accomplish tasks. Always explain what you're doing.
 
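
Note: dropping the <present_state> block (mission, status, task list) from the system prompt is presumably what makes the caching above pay off: Anthropic's prompt cache matches an exact prefix, so a system prompt that mutates every turn would invalidate the cached segment on every request. Only the stable identity and behavior sections remain in the prompt.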
@@ -34664,6 +34675,21 @@ function estimateSummaryTokens(input) {
 }
 // src/agent/loop.ts
 var log5 = Log.create({ service: "agent-loop" });
+function addCacheMarkers(messages) {
+  if (messages.length === 0)
+    return messages;
+  const result = [...messages];
+  const startIdx = Math.max(0, messages.length - 3);
+  for (let i = startIdx; i < messages.length; i++) {
+    result[i] = {
+      ...result[i],
+      providerOptions: {
+        anthropic: { cacheControl: { type: "ephemeral" } }
+      }
+    };
+  }
+  return result;
+}
 
 class AgentLoopCancelledError extends Error {
   constructor() {
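
Note: addCacheMarkers attaches ephemeral cacheControl markers to the last three messages (or fewer, for shorter histories). Combined with the system-prompt breakpoint from prepareMessages, that uses four cache breakpoints, the maximum Anthropic allows per request. An illustrative trace of the effect (message contents are made up):

const history = [
  { role: "user", content: "turn 1" },
  { role: "assistant", content: "turn 1 reply" },
  { role: "user", content: "turn 2" },
  { role: "assistant", content: "turn 2 reply" },
  { role: "user", content: "turn 3" }
];
const marked = addCacheMarkers(history);
// marked[0] and marked[1] are untouched; marked[2..4] each carry
// providerOptions.anthropic.cacheControl = { type: "ephemeral" }.
// On the next turn the prefix up to the newest marker is read from
// cache, and only the new messages need to be written to it.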
@@ -34710,16 +34736,32 @@ async function runAgentLoop(options) {
       log5.info("injected mid-turn user message", { contentLength: injectedContent.length });
     }
     turnsUsed++;
+    const messagesWithCache = addCacheMarkers(messages);
     const response = await Provider.generate({
       model,
       system: systemPrompt,
-      messages,
+      messages: messagesWithCache,
       tools,
       maxTokens,
-      temperature
+      temperature,
+      cacheSystemPrompt: true
     });
     totalInputTokens += response.usage.promptTokens;
     totalOutputTokens += response.usage.completionTokens;
+    const anthropicMeta = response.providerMetadata?.anthropic;
+    if (anthropicMeta) {
+      const cacheCreation = anthropicMeta.cacheCreationInputTokens ?? 0;
+      const cacheRead = anthropicMeta.cacheReadInputTokens ?? 0;
+      const uncached = response.usage.promptTokens - cacheCreation - cacheRead;
+      log5.info("token usage", {
+        input: response.usage.promptTokens,
+        output: response.usage.completionTokens,
+        cacheWrite: cacheCreation,
+        cacheRead,
+        uncached,
+        cacheHitRate: response.usage.promptTokens > 0 ? `${Math.round(cacheRead / response.usage.promptTokens * 100)}%` : "0%"
+      });
+    }
     if (response.text) {
       finalText = response.text;
       await onText?.(response.text);
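
Note: the new usage log decomposes promptTokens using the cacheCreationInputTokens and cacheReadInputTokens fields that the Anthropic provider reports in providerMetadata. Worked example with made-up numbers: promptTokens = 20000, cacheCreationInputTokens = 3000 and cacheReadInputTokens = 15000 give uncached = 2000 and cacheHitRate = round(15000 / 20000 * 100) = "75%".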
package/package.json CHANGED
@@ -1,6 +1,6 @@
 {
   "name": "@miriad-systems/nuum",
-  "version": "0.1.5",
+  "version": "0.1.6",
   "description": "AI coding agent with continuous memory - infinite context across sessions",
   "type": "module",
   "bin": {
@@ -11,7 +11,7 @@
     "src/storage/migrations"
   ],
   "scripts": {
-    "build": "bun build ./src/cli/index.ts --outdir ./dist --target bun && sed -i '' '1s|#!/usr/bin/env node|#!/usr/bin/env bun|' ./dist/index.js",
+    "build": "bun build ./src/cli/index.ts --outdir ./dist --target bun && node -e \"const fs=require('fs');const f='./dist/index.js';fs.writeFileSync(f,fs.readFileSync(f,'utf8').replace('#!/usr/bin/env node','#!/usr/bin/env bun'))\"",
     "dev": "bun run ./src/cli/index.ts",
     "typecheck": "tsc --noEmit",
     "test": "bun test",