npm - @link-assistant/hive-mind - Versions diffs - 1.62.0 → 1.63.0 - Mend

@link-assistant/hive-mind 1.62.0 → 1.63.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (28)

package/CHANGELOG.md +12 -0
package/README.hi.md +4 -2
package/README.md +18 -15
package/README.ru.md +4 -2
package/README.zh.md +17 -15
package/package.json +1 -1
package/src/bidirectional-interactive.lib.mjs +1 -1
package/src/claude.budget-stats.lib.mjs +49 -30
package/src/claude.lib.mjs +11 -15
package/src/config.lib.mjs +1 -0
package/src/gemini.lib.mjs +611 -0
package/src/gemini.prompts.lib.mjs +236 -0
package/src/hive.config.lib.mjs +1 -1
package/src/interactive-mode.lib.mjs +1 -1
package/src/models/index.mjs +39 -8
package/src/solve.config.lib.mjs +4 -4
package/src/solve.mjs +33 -0
package/src/solve.restart-shared.lib.mjs +47 -1
package/src/solve.results.lib.mjs +1 -1
package/src/solve.validation.lib.mjs +8 -0
package/src/task.config.lib.mjs +1 -1
package/src/task.mjs +1 -1
package/src/telegram-bot.mjs +4 -4
package/src/telegram-solve-command.lib.mjs +1 -0
package/src/telegram-solve-queue-command.lib.mjs +1 -1
package/src/telegram-solve-queue.helpers.lib.mjs +12 -1
package/src/telegram-solve-queue.lib.mjs +37 -20
package/src/usage-limit.lib.mjs +1 -1

package/CHANGELOG.md CHANGED Viewed

@@ -1,5 +1,17 @@
 # @link-assistant/hive-mind
+## 1.63.0
+### Minor Changes
+- b7b0721: Add direct Google Gemini CLI support for solve, hive, queueing, model validation, structured stream JSON parsing, and Telegram `/gemini` aliases.
+## 1.62.1
+### Patch Changes
+- a683edf: Fix budget stats restored-context input accounting so sub-session lines include cache reads, use `sub-sessions` wording, and no longer render the obsolete `peak request:` label.
 ## 1.62.0
 ### Minor Changes

package/README.hi.md CHANGED Viewed

@@ -343,7 +343,7 @@ solve <issue-url> [options]
 | विकल्प                   | संक्षिप्त | विवरण                                                       | डिफ़ॉल्ट |
 | ------------------------ | --------- | ----------------------------------------------------------- | -------- |
-| `--tool`                 |           | AI टूल (claude, opencode, codex, agent, qwen)               | claude   |
+| `--tool`                 |           | AI टूल (claude, opencode, codex, agent, gemini, qwen)       | claude   |
 | `--verbose`              | `-v`      | विस्तृत लॉगिंग सक्षम करें                                   | false    |
 | `--attach-logs`          |           | PR में लॉग संलग्न करें (⚠️ संवेदनशील डेटा उजागर हो सकता है) | false    |
 | `--auto-init-repository` |           | खाली रेपो स्वतः-आरंभ करें (README.md बनाता है)              | false    |
@@ -370,7 +370,7 @@ hive <github-url> [options]
 | विकल्प                   | संक्षिप्त | विवरण                                                       | डिफ़ॉल्ट |
 | ------------------------ | --------- | ----------------------------------------------------------- | -------- |
-| `--tool`                 |           | AI टूल (claude, opencode, codex, agent, qwen)               | claude   |
+| `--tool`                 |           | AI टूल (claude, opencode, codex, agent, gemini, qwen)       | claude   |
 | `--concurrency`          | `-c`      | समानांतर वर्कर की संख्या                                    | 2        |
 | `--skip-issues-with-prs` | `-s`      | मौजूदा PR वाले इश्यू छोड़ें                                 | false    |
 | `--verbose`              | `-v`      | विस्तृत लॉगिंग सक्षम करें                                   | false    |
@@ -462,12 +462,14 @@ Aliases:
 /codex /solve --tool codex के बराबर है
 /opencode /solve --tool opencode के बराबर है
 /agent /solve --tool agent के बराबर है
+/gemini /solve --tool gemini के बराबर है
 /qwen /solve --tool qwen के बराबर है
 Tool alias examples:
 /codex https://github.com/owner/repo/issues/123 --model gpt-5.5
 /opencode https://github.com/owner/repo/issues/123 --model grok-code-fast-1
 /agent https://github.com/owner/repo/issues/123 --model nemotron-3-super-free
+/gemini https://github.com/owner/repo/issues/123 --model flash
 /qwen https://github.com/owner/repo/issues/123 --model qwen3-coder-plus
 Free Models (with --tool agent):

package/README.md CHANGED Viewed

@@ -350,13 +350,13 @@ solve <issue-url> [options]
 **Other useful options:**
-| Option                   | Alias | Description                                      | Default |
-| ------------------------ | ----- | ------------------------------------------------ | ------- |
-| `--tool`                 |       | AI tool (claude, opencode, codex, agent, qwen)   | claude  |
-| `--verbose`              | `-v`  | Enable verbose logging                           | false   |
-| `--attach-logs`          |       | Attach logs to PR (⚠️ may expose sensitive data) | false   |
-| `--auto-init-repository` |       | Auto-initialize empty repos (creates README.md)  | false   |
-| `--help`                 | `-h`  | Show all available options                       | -       |
+| Option                   | Alias | Description                                            | Default |
+| ------------------------ | ----- | ------------------------------------------------------ | ------- |
+| `--tool`                 |       | AI tool (claude, opencode, codex, agent, gemini, qwen) | claude  |
+| `--verbose`              | `-v`  | Enable verbose logging                                 | false   |
+| `--attach-logs`          |       | Attach logs to PR (⚠️ may expose sensitive data)       | false   |
+| `--auto-init-repository` |       | Auto-initialize empty repos (creates README.md)        | false   |
+| `--help`                 | `-h`  | Show all available options                             | -       |
 > **📖 Full options list**: See [docs/CONFIGURATION.md](./docs/CONFIGURATION.md#solve-options) for all available options including forking, auto-continue, watch mode, and experimental features.
@@ -377,14 +377,14 @@ hive <github-url> [options]
 **Other useful options:**
-| Option                   | Alias | Description                                       | Default |
-| ------------------------ | ----- | ------------------------------------------------- | ------- |
-| `--tool`                 |       | AI tool (claude, opencode, codex, agent, qwen)    | claude  |
-| `--concurrency`          | `-c`  | Number of parallel workers                        | 2       |
-| `--skip-issues-with-prs` | `-s`  | Skip issues with existing PRs                     | false   |
-| `--verbose`              | `-v`  | Enable verbose logging                            | false   |
-| `--attach-logs`          |       | Attach logs to PRs (⚠️ may expose sensitive data) | false   |
-| `--help`                 | `-h`  | Show all available options                        | -       |
+| Option                   | Alias | Description                                            | Default |
+| ------------------------ | ----- | ------------------------------------------------------ | ------- |
+| `--tool`                 |       | AI tool (claude, opencode, codex, agent, gemini, qwen) | claude  |
+| `--concurrency`          | `-c`  | Number of parallel workers                             | 2       |
+| `--skip-issues-with-prs` | `-s`  | Skip issues with existing PRs                          | false   |
+| `--verbose`              | `-v`  | Enable verbose logging                                 | false   |
+| `--attach-logs`          |       | Attach logs to PRs (⚠️ may expose sensitive data)      | false   |
+| `--help`                 | `-h`  | Show all available options                             | -       |
 > **📖 Full options list**: See [docs/CONFIGURATION.md](./docs/CONFIGURATION.md#hive-options) for all available options including project monitoring, YouTrack integration, and experimental features.
@@ -469,12 +469,14 @@ Aliases:
 /codex is equivalent to /solve --tool codex
 /opencode is equivalent to /solve --tool opencode
 /agent is equivalent to /solve --tool agent
+/gemini is equivalent to /solve --tool gemini
 /qwen is equivalent to /solve --tool qwen
 Tool alias examples:
 /codex https://github.com/owner/repo/issues/123 --model gpt-5.5
 /opencode https://github.com/owner/repo/issues/123 --model grok-code-fast-1
 /agent https://github.com/owner/repo/issues/123 --model nemotron-3-super-free
+/gemini https://github.com/owner/repo/issues/123 --model flash
 /qwen https://github.com/owner/repo/issues/123 --model qwen3-coder-plus
 Free Models (with --tool agent):
@@ -497,6 +499,7 @@ Current tool defaults in Hive Mind:
 | `codex`    | `gpt-5.5` preferred, with runtime fallback to local catalog | Codex runs with `reasoning_effort=none` unless you pass `--think` or `--thinking-budget` |
 | `opencode` | `grok-code-fast-1`                                          | No extra thinking prompt is added for the default model                                  |
 | `agent`    | `nemotron-3-super-free`                                     | No extra thinking prompt is added for the default model                                  |
+| `gemini`   | `flash`                                                     | No extra thinking prompt is added for the default model                                  |
 | `qwen`     | `qwen3-coder-plus`                                          | No extra thinking prompt is added for the default model                                  |
 See [docs/CONFIGURATION.md](./docs/CONFIGURATION.md) for the full per-tool defaults and reasoning mappings.

package/README.ru.md CHANGED Viewed

@@ -343,7 +343,7 @@ solve <issue-url> [options]
 | Параметр                 | Сокр. | Описание                                                              | По умолчанию |
 | ------------------------ | ----- | --------------------------------------------------------------------- | ------------ |
-| `--tool`                 |       | Инструмент ИИ (claude, opencode, codex, agent, qwen)                  | claude       |
+| `--tool`                 |       | Инструмент ИИ (claude, opencode, codex, agent, gemini, qwen)          | claude       |
 | `--verbose`              | `-v`  | Включить подробное логирование                                        | false        |
 | `--attach-logs`          |       | Прикрепить логи к PR (⚠️ может раскрыть конфиденциальные данные)      | false        |
 | `--auto-init-repository` |       | Автоматически инициализировать пустые репозитории (создаёт README.md) | false        |
@@ -370,7 +370,7 @@ hive <github-url> [options]
 | Параметр                 | Сокр. | Описание                                                          | По умолчанию |
 | ------------------------ | ----- | ----------------------------------------------------------------- | ------------ |
-| `--tool`                 |       | Инструмент ИИ (claude, opencode, codex, agent, qwen)              | claude       |
+| `--tool`                 |       | Инструмент ИИ (claude, opencode, codex, agent, gemini, qwen)      | claude       |
 | `--concurrency`          | `-c`  | Количество параллельных воркеров                                  | 2            |
 | `--skip-issues-with-prs` | `-s`  | Пропускать задачи с существующими PR                              | false        |
 | `--verbose`              | `-v`  | Включить подробное логирование                                    | false        |
@@ -463,12 +463,14 @@ Aliases:
 /codex эквивалентна /solve --tool codex
 /opencode эквивалентна /solve --tool opencode
 /agent эквивалентна /solve --tool agent
+/gemini эквивалентна /solve --tool gemini
 /qwen эквивалентна /solve --tool qwen
 Tool alias examples:
 /codex https://github.com/owner/repo/issues/123 --model gpt-5.5
 /opencode https://github.com/owner/repo/issues/123 --model grok-code-fast-1
 /agent https://github.com/owner/repo/issues/123 --model nemotron-3-super-free
+/gemini https://github.com/owner/repo/issues/123 --model flash
 /qwen https://github.com/owner/repo/issues/123 --model qwen3-coder-plus
 Free Models (with --tool agent):

package/README.zh.md CHANGED Viewed

@@ -341,13 +341,13 @@ solve <issue-url> [options]
 **其他常用选项：**
-| 选项                     | 简写 | 描述                                            | 默认值 |
-| ------------------------ | ---- | ----------------------------------------------- | ------ |
-| `--tool`                 |      | AI 工具（claude、opencode、codex、agent、qwen） | claude |
-| `--verbose`              | `-v` | 启用详细日志                                    | false  |
-| `--attach-logs`          |      | 将日志附加到 PR（⚠️ 可能暴露敏感数据）          | false  |
-| `--auto-init-repository` |      | 自动初始化空仓库（创建 README.md）              | false  |
-| `--help`                 | `-h` | 显示所有可用选项                                | -      |
+| 选项                     | 简写 | 描述                                                    | 默认值 |
+| ------------------------ | ---- | ------------------------------------------------------- | ------ |
+| `--tool`                 |      | AI 工具（claude、opencode、codex、agent、gemini、qwen） | claude |
+| `--verbose`              | `-v` | 启用详细日志                                            | false  |
+| `--attach-logs`          |      | 将日志附加到 PR（⚠️ 可能暴露敏感数据）                  | false  |
+| `--auto-init-repository` |      | 自动初始化空仓库（创建 README.md）                      | false  |
+| `--help`                 | `-h` | 显示所有可用选项                                        | -      |
 > **📖 完整选项列表**：包含 Fork、自动续行、监视模式及实验性功能在内的所有可用选项，请参见 [docs/CONFIGURATION.zh.md](./docs/CONFIGURATION.zh.md#solve-options)。
@@ -368,14 +368,14 @@ hive <github-url> [options]
 **其他常用选项：**
-| 选项                     | 简写 | 描述                                            | 默认值 |
-| ------------------------ | ---- | ----------------------------------------------- | ------ |
-| `--tool`                 |      | AI 工具（claude、opencode、codex、agent、qwen） | claude |
-| `--concurrency`          | `-c` | 并行工作进程数量                                | 2      |
-| `--skip-issues-with-prs` | `-s` | 跳过已有 PR 的 Issue                            | false  |
-| `--verbose`              | `-v` | 启用详细日志                                    | false  |
-| `--attach-logs`          |      | 将日志附加到 PR（⚠️ 可能暴露敏感数据）          | false  |
-| `--help`                 | `-h` | 显示所有可用选项                                | -      |
+| 选项                     | 简写 | 描述                                                    | 默认值 |
+| ------------------------ | ---- | ------------------------------------------------------- | ------ |
+| `--tool`                 |      | AI 工具（claude、opencode、codex、agent、gemini、qwen） | claude |
+| `--concurrency`          | `-c` | 并行工作进程数量                                        | 2      |
+| `--skip-issues-with-prs` | `-s` | 跳过已有 PR 的 Issue                                    | false  |
+| `--verbose`              | `-v` | 启用详细日志                                            | false  |
+| `--attach-logs`          |      | 将日志附加到 PR（⚠️ 可能暴露敏感数据）                  | false  |
+| `--help`                 | `-h` | 显示所有可用选项                                        | -      |
 > **📖 完整选项列表**：包含项目监控、YouTrack 集成及实验性功能在内的所有可用选项，请参见 [docs/CONFIGURATION.zh.md](./docs/CONFIGURATION.zh.md#hive-options)。
@@ -459,12 +459,14 @@ Aliases:
 /codex 等同于 /solve --tool codex
 /opencode 等同于 /solve --tool opencode
 /agent 等同于 /solve --tool agent
+/gemini 等同于 /solve --tool gemini
 /qwen 等同于 /solve --tool qwen
 Tool alias examples:
 /codex https://github.com/owner/repo/issues/123 --model gpt-5.5
 /opencode https://github.com/owner/repo/issues/123 --model grok-code-fast-1
 /agent https://github.com/owner/repo/issues/123 --model nemotron-3-super-free
+/gemini https://github.com/owner/repo/issues/123 --model flash
 /qwen https://github.com/owner/repo/issues/123 --model qwen3-coder-plus
 Free Models (with --tool agent):

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@link-assistant/hive-mind",
-  "version": "1.62.0",
+  "version": "1.63.0",
   "description": "AI-powered issue solver and hive mind for collaborative problem solving",
   "main": "src/hive.mjs",
   "type": "module",

package/src/bidirectional-interactive.lib.mjs CHANGED Viewed

@@ -851,7 +851,7 @@ export const createBidirectionalHandler = options => {
 /**
  * Check if bidirectional interactive mode is supported for the given tool
  *
- * @param {string} tool - Tool name (claude, opencode, codex)
+ * @param {string} tool - Tool name (claude, opencode, codex, agent, gemini)
  * @returns {boolean} Whether bidirectional interactive mode is supported
  */
 export const isBidirectionalModeSupported = tool => {

package/src/claude.budget-stats.lib.mjs CHANGED Viewed

@@ -19,6 +19,10 @@ export const createEmptySubSessionUsage = () => ({
   peakOutputUsage: 0,
 });
+export const getRawRequestInputTokens = usage => (usage?.input_tokens || 0) + (usage?.cache_creation_input_tokens || 0) + (usage?.cache_read_input_tokens || 0);
+export const getUsageInputTokens = usage => (usage?.inputTokens || 0) + (usage?.cacheCreationTokens || 0) + (usage?.cacheReadTokens || 0);
 /**
  * Helper: accumulates token usage from a JSONL entry into a model usage map
  * @param {Object} modelUsageMap - Map of model ID to usage data
@@ -185,9 +189,10 @@ export const dumpBudgetTrace = async (usage, tokenUsage, log) => {
   const source = usage._sourceResultJson ? 'jsonl + result-event' : 'jsonl';
   await log(`\n      📊 [budget-trace] ${modelName}`, { verbose: true });
-  // Issue #1710 R5: peak request is `input + cache_creation` (cache reads
-  // tracked separately on the cumulative line).
-  await log(`         peak request:    ${formatNumber(peak)}${limit.context ? ` / ${formatNumber(limit.context)} context` : ''} (largest single-request input + cache_creation, excludes cache_read)`, { verbose: true });
+  // Issue #1737: peak input is the largest request's total input footprint:
+  // input + cache_creation + cache_read. The cumulative line still keeps those
+  // buckets split for cost and accounting review.
+  await log(`         peak input:      ${formatNumber(peak)}${limit.context ? ` / ${formatNumber(limit.context)} context` : ''} (largest request input + cache_creation + cache_read)`, { verbose: true });
   await log(`         cumulative:      input ${formatNumber(inputs)}, cache_write ${formatNumber(writes)} (5m ${formatNumber(writes5m)} / 1h ${formatNumber(writes1h)}), cache_read ${formatNumber(reads)}, output ${formatNumber(outputs)}`, { verbose: true });
   // Issue #1710 R1: web_search is now billed in calculateModelCost. The trace
   // still surfaces the implied dollar cost so the residual remains debuggable
@@ -234,17 +239,15 @@ export const displayBudgetStats = async (usage, tokenUsage, log) => {
   if (hasMultipleSubSessions) {
     // Issue #1600: Unified format — numbered list without "Context window:" prefix.
-    // Issue #1710 R3/R5: Peak input is `input + cache_creation` (cache reads
-    // are tracked separately on the Total line), and the bullet is now
-    // labelled "peak request:" so a reader does not try to reconcile it with
-    // the cumulative Total figure.
+    // Issue #1737: Show peak input pressure per sub-session without the
+    // confusing "peak request:" label.
     for (let i = 0; i < subSessions.length; i++) {
       const sub = subSessions[i];
       const subPeak = sub.peakContextUsage || 0;
       const parts = [];
       if (contextLimit && subPeak > 0) {
         const pct = ((subPeak / contextLimit) * 100).toFixed(0);
-        parts.push(`peak request: ${formatNumber(subPeak)} / ${formatNumber(contextLimit)} (${pct}%) input tokens`);
+        parts.push(`${formatNumber(subPeak)} / ${formatNumber(contextLimit)} (${pct}%) input tokens`);
       }
       if (outputLimit) {
         const outPct = ((sub.outputTokens / outputLimit) * 100).toFixed(0);
@@ -258,7 +261,7 @@ export const displayBudgetStats = async (usage, tokenUsage, log) => {
     const parts = [];
     if (contextLimit) {
       const pct = ((peakContext / contextLimit) * 100).toFixed(0);
-      parts.push(`peak request: ${formatNumber(peakContext)} / ${formatNumber(contextLimit)} (${pct}%) input tokens`);
+      parts.push(`${formatNumber(peakContext)} / ${formatNumber(contextLimit)} (${pct}%) input tokens`);
     }
     if (outputLimit) {
       const outPct = ((usage.outputTokens / outputLimit) * 100).toFixed(0);
@@ -361,6 +364,17 @@ const formatTokensCompact = tokens => {
   return tokens.toLocaleString();
 };
+const formatInputContextPart = (inputTokens, contextLimit, format) => {
+  if (contextLimit && inputTokens > 0) {
+    const pct = ((inputTokens / contextLimit) * 100).toFixed(0);
+    return `${format(inputTokens)} / ${format(contextLimit)} (${pct}%) input tokens`;
+  }
+  if (inputTokens > 0) {
+    return `${format(inputTokens)} input tokens`;
+  }
+  return null;
+};
 /**
  * Issue #1710: Build the cumulative input-tokens phrase for the Total / fallback
  * lines, splitting cache writes and cache reads so neither category is ever
@@ -422,10 +436,10 @@ const formatSubSessionsList = (subSessions, contextLimit, outputLimit) => {
 /**
  * Issue #1600: Build a single-line context + output tokens string (unified format, no "Context window:" prefix).
- * Issue #1710 R3/R5: The input figure is the peak per-request `input + cache_creation`
- * (cache reads excluded). Labelling it "peak request:" lets readers tell it apart
- * from the cumulative Total line.
- * @param {number} peakContext - Peak context usage (0 if unknown — context display skipped)
+ * Issue #1737: The input figure is the peak restored-context input for the
+ * sub-session/request (`input + cache_creation + cache_read`), without the old
+ * "peak request:" label.
+ * @param {number} peakContext - Peak input usage (0 if unknown — context display skipped)
  * @param {number} contextLimit - Context window limit (null if unknown)
  * @param {number} outputTokens - Output tokens used
  * @param {number} outputLimit - Output token limit (null if unknown)
@@ -434,9 +448,9 @@ const formatSubSessionsList = (subSessions, contextLimit, outputLimit) => {
  */
 const formatContextOutputLine = (peakContext, contextLimit, outputTokens, outputLimit, prefix = '- ') => {
   const parts = [];
-  if (contextLimit && peakContext > 0) {
-    const pct = ((peakContext / contextLimit) * 100).toFixed(0);
-    parts.push(`peak request: ${formatTokensCompact(peakContext)} / ${formatTokensCompact(contextLimit)} (${pct}%) input tokens`);
+  const inputPart = formatInputContextPart(peakContext, contextLimit, formatTokensCompact);
+  if (inputPart) {
+    parts.push(inputPart);
   }
   if (outputLimit) {
     const outPct = ((outputTokens / outputLimit) * 100).toFixed(0);
@@ -547,16 +561,16 @@ export const buildBudgetStatsString = (tokenUsage, subAgentCalls = null) => {
       if (isMultiModel) {
         // Issue #1590: Show sub-agent call count alongside model name
-        // Issue #1600: Show session segment count for primary model
+        // Issue #1737: Use "sub-sessions" for compactification-bounded sections.
         if (callCount > 1) {
           stats += `\n\n**${modelName}:** (${callCount} sub-agent calls)`;
         } else if (showSubSessions) {
-          stats += `\n\n**${modelName}:** (${subSessions.length} session segments)`;
+          stats += `\n\n**${modelName}:** (${subSessions.length} sub-sessions)`;
         } else {
           stats += `\n\n**${modelName}:**`;
         }
       } else if (showSubSessions) {
-        stats += `\n\n**${modelName}:** (${subSessions.length} session segments)`;
+        stats += `\n\n**${modelName}:** (${subSessions.length} sub-sessions)`;
       }
       const peakContext = usage.peakContextUsage || 0;
@@ -568,20 +582,25 @@ export const buildBudgetStatsString = (tokenUsage, subAgentCalls = null) => {
         stats += formatContextOutputLine(peakContext, contextLimit, usage.outputTokens, outputLimit, '- ');
       } else if (outputLimit && callCount <= 1) {
         // Issue #1600: Sub-agent single sessions previously showed only an output line.
-        // Issue #1710 R2: Always surface the cumulative input information too — sub-agent
+        // Issue #1737: Always surface total input information too — sub-agent
         // models (e.g. Haiku) never appear as the responding model in the parent JSONL,
         // so peakContext stays at 0; without this fallback the rendered comment loses
-        // the sub-agent's input-token information entirely. Cache writes / reads are
-        // split via the same helper used for the Total line so the two lines stay
-        // arithmetically consistent.
-        const inputPhrase = buildCumulativeInputPhrase({
-          input: usage.inputTokens || 0,
-          cacheWrites: usage.cacheCreationTokens || 0,
-          cacheReads: usage.cacheReadTokens || 0,
-          format: formatTokensCompact,
-        });
+        // the sub-agent's input-token information entirely. The detail line is
+        // deliberately simple; the Total line below keeps the cache split.
+        const parts = [];
+        const isResultSingleCall = usage._sourceResultJson || callCount > 0;
+        const inputPart = isResultSingleCall
+          ? formatInputContextPart(getUsageInputTokens(usage), contextLimit, formatTokensCompact)
+          : buildCumulativeInputPhrase({
+              input: usage.inputTokens || 0,
+              cacheWrites: usage.cacheCreationTokens || 0,
+              cacheReads: usage.cacheReadTokens || 0,
+              format: formatTokensCompact,
+            });
+        if (inputPart) parts.push(inputPart);
         const outPct = ((usage.outputTokens / outputLimit) * 100).toFixed(0);
-        stats += `\n- ${inputPhrase}, ${formatTokensCompact(usage.outputTokens)} / ${formatTokensCompact(outputLimit)} (${outPct}%) output tokens`;
+        parts.push(`${formatTokensCompact(usage.outputTokens)} / ${formatTokensCompact(outputLimit)} (${outPct}%) output tokens`);
+        stats += `\n- ${parts.join(', ')}`;
       }
       // Cumulative totals per model: input tokens + cached shown separately.

package/src/claude.lib.mjs CHANGED Viewed

@@ -15,7 +15,7 @@ import { setupBidirectionalHandler, finalizeBidirectionalHandler, validateBidire
 import { initProgressMonitoring } from './solve.progress-monitoring.lib.mjs';
 import { sanitizeObjectStrings } from './unicode-sanitization.lib.mjs';
 import Decimal from 'decimal.js-light';
-import { displayBudgetStats, createEmptySubSessionUsage, accumulateModelUsage, displayModelUsage, displayCostComparison, mergeResultModelUsage, createSubAgentCallEntry, accumulateSubAgentUsage } from './claude.budget-stats.lib.mjs';
+import { displayBudgetStats, createEmptySubSessionUsage, accumulateModelUsage, displayModelUsage, displayCostComparison, mergeResultModelUsage, createSubAgentCallEntry, accumulateSubAgentUsage, getRawRequestInputTokens } from './claude.budget-stats.lib.mjs';
 import { buildClaudeResumeCommand } from './claude.command-builder.lib.mjs';
 import { SESSION_FORCE_KILLED_MARKER, postTrackedComment } from './tool-comments.lib.mjs'; // Issue #1625
 import { handleClaudeRuntimeSwitch } from './claude.runtime-switch.lib.mjs'; // see issue #1141
@@ -394,9 +394,10 @@ export const checkModelVisionCapability = async modelId => {
 // this file under the 1500-line repo cap (see check-file-line-limits CI job).
 import { calculateModelCost } from './claude.cost.lib.mjs';
 export { calculateModelCost };
-export const calculateSessionTokens = async (sessionId, tempDir, resultModelUsage = null) => {
+export const calculateSessionTokens = async (sessionId, tempDir, resultModelUsage = null, options = {}) => {
   const os = (await use('os')).default;
-  const homeDir = os.homedir();
+  const homeDir = options.homeDir || os.homedir();
+  const fetchModelInfoForUsage = options.fetchModelInfo || fetchModelInfo;
   // Construct the path to the session JSONL file
   // Format: ~/.claude/projects/<project-dir>/<session-id>.jsonl
   // The project directory name is the full path with slashes replaced by dashes
@@ -454,15 +455,12 @@ export const calculateSessionTokens = async (sessionId, tempDir, resultModelUsag
             seenMessageIds.add(msgId);
           }
           accumulateModelUsage(modelUsage, entry);
-          // Issue #1501: Track peak context usage per single API request
-          // Issue #1710: Exclude cache_read_input_tokens — sub-sessions and
-          // per-request peaks should reflect *new* input the model received,
-          // not cached prompt context. Cache reads remain visible in the
-          // cumulative Total line as `(X + Y cached)`. This makes the
-          // peak-request value reconcilable with the cumulative non-cached
-          // input figure (instead of mixing semantics across the two lines).
+          // Issue #1737: Track peak restored-context input per request.
+          // Anthropic splits a request's input into input_tokens,
+          // cache_creation_input_tokens, and cache_read_input_tokens; all three
+          // count toward "how much context will be restored if I resume here".
           const usage = entry.message.usage;
-          const requestContext = (usage.input_tokens || 0) + (usage.cache_creation_input_tokens || 0);
+          const requestContext = getRawRequestInputTokens(usage);
           const model = entry.message.model;
           if (requestContext > (peakContextByModel[model] || 0)) {
             peakContextByModel[model] = requestContext;
@@ -500,7 +498,7 @@ export const calculateSessionTokens = async (sessionId, tempDir, resultModelUsag
     }
     // Fetch model information for each model
     const modelInfoPromises = Object.keys(modelUsage).map(async modelId => {
-      const modelInfo = await fetchModelInfo(modelId);
+      const modelInfo = await fetchModelInfoForUsage(modelId);
       return { modelId, modelInfo };
     });
     const modelInfoResults = await Promise.all(modelInfoPromises);
@@ -1295,9 +1293,7 @@ export const executeClaudeCommand = async params => {
               await log(`\n⚠️  JSONL deduplication: skipped ${tokenUsage.duplicateEntriesSkipped} duplicate entries (upstream: anthropics/claude-code#6805)`, { verbose: true });
             }
             if (tokenUsage.peakContextUsage > 0) {
-              // Issue #1710: rename so the metric matches the new definition (input + cache_creation,
-              // excluding cache_read). Cache reads are still visible separately on the Total line.
-              await log(`📊 Peak single-request input (excl. cache reads): ${formatNumber(tokenUsage.peakContextUsage)} tokens`, { verbose: true });
+              await log(`📊 Peak restored-context input: ${formatNumber(tokenUsage.peakContextUsage)} tokens`, { verbose: true });
             }
             await log('\n💰 Token Usage Summary:');
             // Display per-model breakdown

package/src/config.lib.mjs CHANGED Viewed

@@ -51,6 +51,7 @@ const parseFloatWithDefault = (envVar, defaultValue) => {
 export const timeouts = {
   claudeCli: parseIntWithDefault('HIVE_MIND_CLAUDE_TIMEOUT_SECONDS', 60) * 1000,
   opencodeCli: parseIntWithDefault('HIVE_MIND_OPENCODE_TIMEOUT_SECONDS', 60) * 1000,
+  geminiCli: parseIntWithDefault('HIVE_MIND_GEMINI_TIMEOUT_SECONDS', 60) * 1000,
   codexCli: parseIntWithDefault('HIVE_MIND_CODEX_TIMEOUT_SECONDS', 60) * 1000,
   qwenCli: parseIntWithDefault('HIVE_MIND_QWEN_TIMEOUT_SECONDS', 60) * 1000,
   githubApiDelay: parseIntWithDefault('HIVE_MIND_GITHUB_API_DELAY_MS', 5000),