npm - @sanity-labs/nuum - Versions diffs - 0.5.3 → 0.5.5 - Mend

@sanity-labs/nuum 0.5.3 → 0.5.5

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (2) hide show

package/dist/index.js +66 -26
package/package.json +1 -1

package/dist/index.js CHANGED Viewed

@@ -23485,26 +23485,33 @@ function createLTMStorage(db) {
       }
       return matches.sort((a, b) => (b.score ?? 0) - (a.score ?? 0));
     },
-    async searchFTS(query, limit = 20) {
+    async searchFTS(query, options = {}) {
+      const { limit = 20, pathPrefix } = options;
       const words = query.split(/\s+/).filter((w) => w.length > 0).map((w) => `"${w.replace(/"/g, '""')}"`).join(" OR ");
       if (!words) {
         return [];
       }
+      const pathFilter = pathPrefix ? `AND e.path LIKE ? || '%'` : "";
+      const params = pathPrefix ? [words, pathPrefix, limit] : [words, limit];
       const results = await db._rawDb.prepare(`
         SELECT
-          slug,
-          title,
+          fts.slug,
+          fts.title,
+          e.path,
           snippet(ltm_entries_fts, 2, '>>>', '<<<', '...', 32) as snippet,
-          rank
-        FROM ltm_entries_fts
+          fts.rank
+        FROM ltm_entries_fts fts
+        JOIN ltm_entries e ON e.slug = fts.slug
         WHERE ltm_entries_fts MATCH ?
-          AND slug IN (SELECT slug FROM ltm_entries WHERE archived_at IS NULL)
-        ORDER BY rank
+          AND e.archived_at IS NULL
+          ${pathFilter}
+        ORDER BY fts.rank
         LIMIT ?
-      `).all(words, limit);
+      `).all(...params);
       return results.map((r) => ({
         slug: r.slug,
         title: r.title,
+        path: r.path,
         snippet: r.snippet,
         rank: r.rank
       }));
@@ -35674,6 +35681,20 @@ function estimateSummaryTokens(input) {
 }
 // src/agent/loop.ts
 var log5 = Log.create({ service: "agent-loop" });
+var MODEL_MAX_OUTPUT_TOKENS = {
+  "claude-opus-4-6": 128000,
+  "claude-opus-4-6-20250918": 128000,
+  "claude-sonnet-4-5-20250929": 64000,
+  "claude-sonnet-4-5": 64000,
+  "claude-haiku-4-5-20251001": 64000,
+  "claude-haiku-4-5": 64000,
+  "claude-3-5-sonnet-20241022": 8192,
+  "claude-3-5-haiku-20241022": 8192
+};
+var DEFAULT_MAX_OUTPUT_TOKENS = 16384;
+function getMaxOutputTokens(modelId) {
+  return MODEL_MAX_OUTPUT_TOKENS[modelId] ?? DEFAULT_MAX_OUTPUT_TOKENS;
+}
 function addCacheMarkers(messages) {
   if (messages.length === 0)
     return messages;
@@ -35702,7 +35723,7 @@ async function runAgentLoop(options) {
     systemPrompt,
     initialMessages,
     tools,
-    maxTokens = 4096,
+    maxTokens: maxTokensOverride,
     temperature,
     maxTurns,
     abortSignal,
@@ -35713,6 +35734,12 @@ async function runAgentLoop(options) {
     onBeforeTurn,
     onThinking
   } = options;
+  const maxTokens = maxTokensOverride ?? getMaxOutputTokens(model.modelId);
+  log5.info("agent loop starting", {
+    model: model.modelId,
+    maxTokens,
+    maxTurns
+  });
   if (abortSignal?.aborted) {
     throw new AgentLoopCancelledError;
   }
@@ -35768,6 +35795,13 @@ async function runAgentLoop(options) {
         cacheHitRate: total > 0 ? `${Math.round(cacheRead / total * 100)}%` : "0%"
       });
     }
+    if (response.finishReason === "length") {
+      log5.warn("output truncated - model hit maxTokens limit", {
+        maxTokens,
+        outputTokens: response.usage.completionTokens,
+        hasToolCalls: (response.toolCalls?.length ?? 0) > 0
+      });
+    }
     if (response.text) {
       finalText = response.text;
       await onText?.(response.text);
@@ -35812,6 +35846,15 @@ async function runAgentLoop(options) {
         content: toolResultParts
       };
       messages.push(toolMsg);
+      if (response.finishReason === "length") {
+        const hadInvalidCalls = toolCallInfos.some((tc) => tc.toolName === "__invalid_tool_call__");
+        if (hadInvalidCalls) {
+          messages.push({
+            role: "user",
+            content: "[SYSTEM: Your previous output was truncated because it exceeded the output token limit. " + "Your tool call was incomplete \u2014 parameters were cut off mid-generation. " + "To fix this: break large content into multiple smaller write calls, or use bash to write incrementally. " + "Do NOT retry the same large tool call \u2014 it will truncate again.]"
+          });
+        }
+      }
       if (isDone(toolCallInfos)) {
         stopReason = "done";
         break;
@@ -36138,7 +36181,6 @@ async function runCompaction(storage, config) {
         systemPrompt: ctx.systemPrompt,
         initialMessages,
         tools,
-        maxTokens: 4096,
         temperature: 0,
         maxTurns: 5,
         isDone: stopOnTool("finish_distillation"),
@@ -36244,7 +36286,7 @@ async function runSubAgent(storage, config) {
     extractResult,
     tier = "workhorse",
     maxTurns = 20,
-    maxTokens = 4096,
+    maxTokens,
     temperature = 0,
     onToolResult
   } = config;
@@ -36431,8 +36473,7 @@ async function runReflection(storage, question) {
     finishToolName: "finish_reflection",
     extractResult: getAnswer,
     tier: "workhorse",
-    maxTurns: 20,
-    maxTokens: 4096
+    maxTurns: 20
   });
   const answer = result.result ?? "Unable to find relevant information.";
   activity.reflection.complete(`${result.turnsUsed} turns, ${answer.length} chars`);
@@ -36836,7 +36877,6 @@ async function runResearch(storage, topic) {
     },
     tier: "workhorse",
     maxTurns: MAX_RESEARCH_TURNS,
-    maxTokens: 8192,
     onToolResult: (toolCallId) => {
       const toolResult = getLastResult(toolCallId);
       if (!toolResult)
@@ -45371,8 +45411,8 @@ var Mcp;
 })(Mcp ||= {});
 // src/version.ts
-var VERSION = "0.5.3";
-var GIT_HASH = "a2a5ddc";
+var VERSION = "0.5.5";
+var GIT_HASH = "9c9c471";
 var VERSION_STRING = `nuum v${VERSION} (${GIT_HASH})`;
 // src/tool/mcp-status.ts
@@ -45577,24 +45617,26 @@ Returns: [{ slug, title, path, snippet }, ...] ranked by relevance`,
   async execute(args, ctx) {
     const { ltm } = ctx.extra;
     const { query, path: path9, limit } = args;
-    const results = await ltm.search(query, path9);
-    const limited = results.slice(0, limit ?? 10);
+    const results = await ltm.searchFTS(query, {
+      limit: limit ?? 10,
+      pathPrefix: path9
+    });
     ctx.metadata({
       title: `ltm_search("${query}")`,
       metadata: { operation: "search" }
     });
-    if (limited.length === 0) {
+    if (results.length === 0) {
       return {
         title: `ltm_search("${query}")`,
         metadata: { operation: "search" },
         output: `No entries found matching "${query}"`
       };
     }
-    const formatted = limited.map((r) => ({
-      slug: r.entry.slug,
-      title: r.entry.title,
-      path: r.entry.path,
-      snippet: r.entry.body.slice(0, 150) + (r.entry.body.length > 150 ? "..." : "")
+    const formatted = results.map((r) => ({
+      slug: r.slug,
+      title: r.title,
+      path: r.path,
+      snippet: r.snippet
     }));
     return {
       title: `ltm_search("${query}")`,
@@ -46890,7 +46932,6 @@ async function runConsolidation(storage, messages) {
     },
     tier: "workhorse",
     maxTurns: MAX_CONSOLIDATION_TURNS,
-    maxTokens: 2048,
     onToolResult: (toolCallId) => {
       const toolResult = getLastResult(toolCallId);
       if (!toolResult)
@@ -47432,7 +47473,6 @@ async function runAgent(prompt, options) {
     systemPrompt: ctx.systemPrompt,
     initialMessages,
     tools,
-    maxTokens: 8192,
     maxTurns: MAX_TURNS,
     abortSignal,
     onText: async (text3) => {

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@sanity-labs/nuum",
-  "version": "0.5.3",
+  "version": "0.5.5",
   "description": "AI coding agent with continuous memory - infinite context across sessions",
   "type": "module",
   "bin": {