@link-assistant/hive-mind 1.46.8 → 1.46.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/CHANGELOG.md CHANGED
@@ -1,9 +1,16 @@
1
1
  # @link-assistant/hive-mind
2
2
 
3
+ ## 1.46.9
4
+
5
+ ### Patch Changes
6
+
7
+ - 8104fad: Fix wrong context window calculation showing impossible percentages like 250% (Issue #1539). When peakContextUsage is unknown (e.g. sub-agent models from result JSON only), skip the context window input tokens display entirely instead of falling back to cumulative totals across all requests, which are not valid per-request context window metrics.
8
+
3
9
  ## 1.46.8
4
10
 
5
11
  ### Patch Changes
6
12
 
13
+ - Fix wrong context window calculation showing impossible percentages like 250% (Issue #1539). When peakContextUsage is unknown (e.g. sub-agent models from result JSON only), skip the context window input tokens display entirely instead of falling back to cumulative totals across all requests, which are not valid per-request context window metrics.
7
14
  - bcf2b9b: Retry on network issues and minimize terminal/log output differences (#1536): add ghRetry/ghCmdRetry utilities with exponential backoff for transient network errors (TCP reset, TLS timeout, connection refused, unexpected EOF). Apply retry to critical gh CLI calls: accept-invite, repository setup, auto-fork permission check, visibility detection, write permission check. Log stderr to log file on command failure for terminal/log parity. Add 'unexpected eof' to transient error detection patterns.
8
15
 
9
16
  ## 1.46.7
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@link-assistant/hive-mind",
3
- "version": "1.46.8",
3
+ "version": "1.46.9",
4
4
  "description": "AI-powered issue solver and hive mind for collaborative problem solving",
5
5
  "main": "src/hive.mjs",
6
6
  "type": "module",
@@ -158,16 +158,19 @@ export const displayBudgetStats = async (usage, tokenUsage, log) => {
158
158
  const subSessions = tokenUsage?.subSessions || [];
159
159
  const hasMultipleSubSessions = subSessions.length > 1;
160
160
 
161
+ const peakContext = usage.peakContextUsage || 0;
162
+
161
163
  if (hasMultipleSubSessions) {
162
164
  for (let i = 0; i < subSessions.length; i++) {
163
165
  const sub = subSessions[i];
164
166
  const subPeak = sub.peakContextUsage || 0;
165
- const subCumulative = (sub.inputTokens || 0) + (sub.cacheCreationTokens || 0) + (sub.cacheReadTokens || 0);
166
- const contextValue = subPeak > 0 ? subPeak : subCumulative;
167
+ // Issue #1539: Only use peak per-request context for context window display.
168
+ // Cumulative totals across all requests can exceed the context limit and produce
169
+ // impossible percentages (e.g. 250%). When peak is unknown, skip context display.
167
170
  const parts = [];
168
- if (contextLimit && contextValue > 0) {
169
- const pct = ((contextValue / contextLimit) * 100).toFixed(0);
170
- parts.push(`${formatNumber(contextValue)} / ${formatNumber(contextLimit)} input tokens (${pct}%)`);
171
+ if (contextLimit && subPeak > 0) {
172
+ const pct = ((subPeak / contextLimit) * 100).toFixed(0);
173
+ parts.push(`${formatNumber(subPeak)} / ${formatNumber(contextLimit)} input tokens (${pct}%)`);
171
174
  }
172
175
  if (outputLimit) {
173
176
  const outPct = ((sub.outputTokens / outputLimit) * 100).toFixed(0);
@@ -177,15 +180,12 @@ export const displayBudgetStats = async (usage, tokenUsage, log) => {
177
180
  await log(` ${i + 1}. Context window: ${parts.join(', ')}`);
178
181
  }
179
182
  }
180
- } else {
181
- // Single sub-session: single-line format
182
- const peakContext = usage.peakContextUsage || 0;
183
- const cumulativeContext = usage.inputTokens + usage.cacheCreationTokens + usage.cacheReadTokens;
184
- const contextValue = peakContext > 0 ? peakContext : cumulativeContext;
183
+ } else if (peakContext > 0) {
184
+ // Single sub-session with known peak: single-line format
185
185
  const parts = [];
186
- if (contextLimit && contextValue > 0) {
187
- const pct = ((contextValue / contextLimit) * 100).toFixed(0);
188
- parts.push(`${formatNumber(contextValue)} / ${formatNumber(contextLimit)} input tokens (${pct}%)`);
186
+ if (contextLimit) {
187
+ const pct = ((peakContext / contextLimit) * 100).toFixed(0);
188
+ parts.push(`${formatNumber(peakContext)} / ${formatNumber(contextLimit)} input tokens (${pct}%)`);
189
189
  }
190
190
  if (outputLimit) {
191
191
  const outPct = ((usage.outputTokens / outputLimit) * 100).toFixed(0);
@@ -195,6 +195,8 @@ export const displayBudgetStats = async (usage, tokenUsage, log) => {
195
195
  await log(` Context window: ${parts.join(', ')}`);
196
196
  }
197
197
  }
198
 + // Issue #1539: When peakContextUsage is unknown, skip the context window line entirely.
199
+ // Cumulative totals are shown on the Total line below — no duplication needed.
198
200
 
199
201
  // Cumulative totals — single line
200
202
  const totalInputNonCached = usage.inputTokens + usage.cacheCreationTokens;
@@ -202,6 +204,11 @@ export const displayBudgetStats = async (usage, tokenUsage, log) => {
202
204
  let totalLine = `${formatNumber(totalInputNonCached)}`;
203
205
  if (cachedTokens > 0) totalLine += ` + ${formatNumber(cachedTokens)} cached`;
204
206
  totalLine += ` input tokens, ${formatNumber(usage.outputTokens)} output tokens`;
207
+ // Issue #1539: When peakContextUsage is unknown, embed output percentage in Total line
208
+ if (peakContext === 0 && outputLimit) {
209
+ const outPct = ((usage.outputTokens / outputLimit) * 100).toFixed(0);
210
+ totalLine += ` (${outPct}% of ${formatNumber(outputLimit)} output limit)`;
211
+ }
205
212
  await log(` Total: ${totalLine}`);
206
213
  };
207
214
 
@@ -230,6 +237,15 @@ export const mergeResultModelUsage = (modelUsage, resultModelUsage) => {
230
237
  if (resultUsage.costUSD != null) {
231
238
  modelUsage[modelId]._resultCostUSD = resultUsage.costUSD;
232
239
  }
240
+ // Issue #1539: Extract model limits from result JSON for sub-agent models
241
+ // Claude Code's result event includes contextWindow and maxOutputTokens per model,
242
+ // which we use as fallback when modelInfo API is unavailable.
243
+ if (resultUsage.contextWindow) {
244
+ modelUsage[modelId]._resultContextWindow = resultUsage.contextWindow;
245
+ }
246
+ if (resultUsage.maxOutputTokens) {
247
+ modelUsage[modelId]._resultMaxOutputTokens = resultUsage.maxOutputTokens;
248
+ }
233
249
  } else {
234
250
  const jsonlUsage = modelUsage[modelId];
235
251
  const jsonlTotal = jsonlUsage.inputTokens + jsonlUsage.cacheCreationTokens + jsonlUsage.cacheReadTokens + jsonlUsage.outputTokens;
@@ -244,6 +260,13 @@ export const mergeResultModelUsage = (modelUsage, resultModelUsage) => {
244
260
  if (resultUsage.costUSD != null) {
245
261
  jsonlUsage._resultCostUSD = resultUsage.costUSD;
246
262
  }
263
+ // Issue #1539: Also extract model limits from result JSON as fallback
264
+ if (resultUsage.contextWindow) {
265
+ jsonlUsage._resultContextWindow = resultUsage.contextWindow;
266
+ }
267
+ if (resultUsage.maxOutputTokens) {
268
+ jsonlUsage._resultMaxOutputTokens = resultUsage.maxOutputTokens;
269
+ }
247
270
  }
248
271
  }
249
272
  };
@@ -274,36 +297,35 @@ const formatSubSessionsList = (subSessions, contextLimit, outputLimit) => {
274
297
  let result = '';
275
298
  for (let i = 0; i < subSessions.length; i++) {
276
299
  const sub = subSessions[i];
300
+ // Issue #1539: Only use peak per-request context; skip context display when unknown
277
301
  const subPeakContext = sub.peakContextUsage || 0;
278
- // Cumulative fallback: inputTokens + cacheCreationTokens + cacheReadTokens for this sub-session
279
- const subCumulative = (sub.inputTokens || 0) + (sub.cacheCreationTokens || 0) + (sub.cacheReadTokens || 0);
280
- result += formatContextOutputLine(subPeakContext, contextLimit, sub.outputTokens, outputLimit, `${i + 1}. `, subCumulative);
302
+ result += formatContextOutputLine(subPeakContext, contextLimit, sub.outputTokens, outputLimit, `${i + 1}. `);
281
303
  }
282
304
  return result;
283
305
  };
284
306
 
285
307
  /**
286
308
  * Issue #1526: Build a single-line context window + output tokens string.
309
+ * Issue #1539: Only show context window when peakContext > 0 (per-request peak known).
310
 + * When peakContext is 0 (unknown), the context part is omitted to avoid misleading percentages.
287
311
  * Format: "- Context window: X / Y input tokens (Z%), A / B output tokens (W%)"
288
- * When only one of context or output limits is available, shows just that part.
289
- * @param {number} peakContext - Peak context usage (0 if unknown)
312
 + * @param {number} peakContext - Peak context usage (0 if unknown; context display skipped)
290
313
  * @param {number} contextLimit - Context window limit (null if unknown)
291
314
  * @param {number} outputTokens - Output tokens used
292
315
  * @param {number} outputLimit - Output token limit (null if unknown)
293
316
  * @param {string} [prefix='- '] - Line prefix
294
317
  * @returns {string} Formatted line or empty string
295
318
  */
296
- const formatContextOutputLine = (peakContext, contextLimit, outputTokens, outputLimit, prefix = '- ', cumulativeContext = 0) => {
319
+ const formatContextOutputLine = (peakContext, contextLimit, outputTokens, outputLimit, prefix = '- ') => {
297
320
  const parts = [];
298
321
  if (contextLimit) {
299
- // Use peakContextUsage when available (per-request peak from JSONL tracking).
300
- // Fall back to cumulative total (inputTokens + cacheCreationTokens + cacheReadTokens)
301
- // when peak is unknown (e.g., model only from result JSON, not in JSONL).
302
- // Issue #1526: Never skip context display always show what data we have.
303
- const contextValue = peakContext > 0 ? peakContext : cumulativeContext;
304
- if (contextValue > 0) {
305
- const pct = ((contextValue / contextLimit) * 100).toFixed(0);
306
- parts.push(`${formatTokensCompact(contextValue)} / ${formatTokensCompact(contextLimit)} input tokens (${pct}%)`);
322
+ // Issue #1539: Only use peak per-request context for context window display.
323
+ // When peak is unknown (e.g., model only from result JSON, not in JSONL),
324
+ // skip context display. Cumulative totals across all requests are not valid
325
+ // context window metrics and produce impossible percentages (e.g. 250%).
326
+ if (peakContext > 0) {
327
+ const pct = ((peakContext / contextLimit) * 100).toFixed(0);
328
+ parts.push(`${formatTokensCompact(peakContext)} / ${formatTokensCompact(contextLimit)} input tokens (${pct}%)`);
307
329
  }
308
330
  }
309
331
  if (outputLimit) {
@@ -322,7 +344,8 @@ const formatContextOutputLine = (peakContext, contextLimit, outputTokens, output
322
344
  * Sub-sessions are shown as a global section (not duplicated per model) since JSONL
323
345
  * sub-session tracking is global across all models.
324
346
  * Issue #1526: Shorter output format — context window + output tokens on single line.
325
- * Fix: exclude cacheReadTokens from context window fallback calculation (cumulative ≠ per-request).
347
+ * Issue #1539: Only display context window when peak per-request usage is known.
348
+ * Cumulative totals are never used as context window metrics (they can exceed model limits).
326
349
  * @param {Object} tokenUsage - Token usage data from calculateSessionTokens or buildAgentBudgetStats
327
350
  * @returns {string} Formatted markdown string for PR comment
328
351
  */
@@ -358,17 +381,17 @@ export const buildBudgetStatsString = tokenUsage => {
358
381
 
359
382
  if (isMultiModel) stats += `\n\n**${modelName}:**`;
360
383
 
384
+ const peakContext = usage.peakContextUsage || 0;
385
+
361
386
  if (!isMultiModel && hasMultipleSubSessions) {
362
387
  // Single-model + multiple sub-sessions: show numbered sub-sessions under that model
363
388
  stats += formatSubSessionsList(subSessions, contextLimit, outputLimit);
364
- } else {
389
+ } else if (peakContext > 0) {
365
390
  // Issue #1526: Single line format for context window + output tokens
366
- // Use peakContextUsage when available; fall back to cumulative total when peak is unknown
367
- // (e.g., for result-JSON-sourced sub-agent models where only cumulative totals are available)
368
- const peakContext = usage.peakContextUsage || 0;
369
- const cumulativeContext = usage.inputTokens + usage.cacheCreationTokens + usage.cacheReadTokens;
370
- stats += formatContextOutputLine(peakContext, contextLimit, usage.outputTokens, outputLimit, '- ', cumulativeContext);
391
+ stats += formatContextOutputLine(peakContext, contextLimit, usage.outputTokens, outputLimit, '- ');
371
392
  }
393
 + // Issue #1539: When peakContextUsage is unknown, skip the context window line entirely.
394
+ // Cumulative totals are shown on the Total line below — no duplication needed.
372
395
 
373
396
  // Cumulative totals per model: input tokens + cached shown separately
374
397
  // Issue #1526: Shorter format — single "Total:" line
@@ -378,6 +401,13 @@ export const buildBudgetStatsString = tokenUsage => {
378
401
  if (cachedTokens > 0) totalLine += ` + ${formatTokensCompact(cachedTokens)} cached`;
379
402
  totalLine += ` input tokens, ${formatTokensCompact(usage.outputTokens)} output tokens`;
380
403
 
404
+ // Issue #1539: When peakContextUsage is unknown (no per-request data), embed
405
+ // output token percentage in the Total line so no data is lost.
406
+ if (peakContext === 0 && outputLimit) {
407
+ const outPct = ((usage.outputTokens / outputLimit) * 100).toFixed(0);
408
+ totalLine += ` (${outPct}% of ${formatTokensCompact(outputLimit)} output limit)`;
409
+ }
410
+
381
411
  // Issue #1508: Show per-model cost when available
382
412
  if (usage.costUSD !== null && usage.costUSD !== undefined) {
383
413
  totalLine += `, $${usage.costUSD.toFixed(6)} cost`;
@@ -498,13 +498,10 @@ export const calculateSessionTokens = async (sessionId, tempDir, resultModelUsag
498
498
  }
499
499
  // Initialize per-model usage tracking
500
500
  const modelUsage = {};
501
- // Issue #1501: Deduplicate JSONL entries by message ID (upstream: anthropics/claude-code#6805)
502
- // Claude Code's stream-json mode splits single API responses with multiple content blocks
503
- // into separate JSONL entries, each with the same message ID and identical usage stats.
501
+ // Issue #1501: Deduplicate JSONL entries by message ID (stream-json splits responses)
504
502
  const seenMessageIds = new Set();
505
503
  let duplicateCount = 0;
506
504
  // Issue #1501: Track peak context usage per request (not cumulative)
507
- // The context window limit is per-request, so we track the max single-request fill.
508
505
  const peakContextByModel = {};
509
506
  let globalPeakContext = 0;
510
507
  // Issue #1491: Track sub-sessions between compactification events
@@ -610,7 +607,10 @@ export const calculateSessionTokens = async (sessionId, tempDir, resultModelUsag
610
607
  usage.costUSD = usage._resultCostUSD ?? null;
611
608
  usage.costBreakdown = null;
612
609
  usage.modelName = modelId;
613
- usage.modelInfo = null;
610
+ // Issue #1539: Use contextWindow/maxOutputTokens from result JSON as fallback model limits
611
+ const ctx = usage._resultContextWindow,
612
+ out = usage._resultMaxOutputTokens;
613
+ usage.modelInfo = ctx || out ? { limit: { context: ctx || null, output: out || null } } : null;
614
614
  }
615
615
  }
616
616
  // Calculate grand totals across all models