@build-astron-co/nimbus 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (313) hide show
  1. package/LICENSE +21 -0
  2. package/README.md +628 -0
  3. package/bin/nimbus +38 -0
  4. package/package.json +80 -0
  5. package/src/__tests__/app.test.ts +76 -0
  6. package/src/__tests__/audit.test.ts +877 -0
  7. package/src/__tests__/circuit-breaker.test.ts +116 -0
  8. package/src/__tests__/cli-run.test.ts +115 -0
  9. package/src/__tests__/context-manager.test.ts +502 -0
  10. package/src/__tests__/context.test.ts +242 -0
  11. package/src/__tests__/enterprise.test.ts +401 -0
  12. package/src/__tests__/generator.test.ts +433 -0
  13. package/src/__tests__/hooks.test.ts +582 -0
  14. package/src/__tests__/init.test.ts +436 -0
  15. package/src/__tests__/intent-parser.test.ts +229 -0
  16. package/src/__tests__/llm-router.test.ts +209 -0
  17. package/src/__tests__/lsp.test.ts +293 -0
  18. package/src/__tests__/modes.test.ts +336 -0
  19. package/src/__tests__/permissions.test.ts +338 -0
  20. package/src/__tests__/serve.test.ts +275 -0
  21. package/src/__tests__/sessions.test.ts +227 -0
  22. package/src/__tests__/sharing.test.ts +288 -0
  23. package/src/__tests__/snapshots.test.ts +581 -0
  24. package/src/__tests__/state-db.test.ts +334 -0
  25. package/src/__tests__/stream-with-tools.test.ts +732 -0
  26. package/src/__tests__/subagents.test.ts +176 -0
  27. package/src/__tests__/system-prompt.test.ts +169 -0
  28. package/src/__tests__/tool-converter.test.ts +256 -0
  29. package/src/__tests__/tool-schemas.test.ts +397 -0
  30. package/src/__tests__/tools.test.ts +143 -0
  31. package/src/__tests__/version.test.ts +49 -0
  32. package/src/agent/compaction-agent.ts +227 -0
  33. package/src/agent/context-manager.ts +435 -0
  34. package/src/agent/context.ts +427 -0
  35. package/src/agent/deploy-preview.ts +426 -0
  36. package/src/agent/index.ts +68 -0
  37. package/src/agent/loop.ts +717 -0
  38. package/src/agent/modes.ts +429 -0
  39. package/src/agent/permissions.ts +466 -0
  40. package/src/agent/subagents/base.ts +116 -0
  41. package/src/agent/subagents/cost.ts +51 -0
  42. package/src/agent/subagents/explore.ts +42 -0
  43. package/src/agent/subagents/general.ts +54 -0
  44. package/src/agent/subagents/index.ts +102 -0
  45. package/src/agent/subagents/infra.ts +59 -0
  46. package/src/agent/subagents/security.ts +69 -0
  47. package/src/agent/system-prompt.ts +436 -0
  48. package/src/app.ts +122 -0
  49. package/src/audit/activity-log.ts +290 -0
  50. package/src/audit/compliance-checker.ts +540 -0
  51. package/src/audit/cost-tracker.ts +318 -0
  52. package/src/audit/index.ts +23 -0
  53. package/src/audit/security-scanner.ts +596 -0
  54. package/src/auth/guard.ts +75 -0
  55. package/src/auth/index.ts +56 -0
  56. package/src/auth/oauth.ts +455 -0
  57. package/src/auth/providers.ts +470 -0
  58. package/src/auth/sso.ts +113 -0
  59. package/src/auth/store.ts +505 -0
  60. package/src/auth/types.ts +187 -0
  61. package/src/build.ts +141 -0
  62. package/src/cli/index.ts +16 -0
  63. package/src/cli/init.ts +854 -0
  64. package/src/cli/openapi-spec.ts +356 -0
  65. package/src/cli/run.ts +237 -0
  66. package/src/cli/serve-auth.ts +80 -0
  67. package/src/cli/serve.ts +462 -0
  68. package/src/cli/web.ts +67 -0
  69. package/src/cli.ts +1417 -0
  70. package/src/clients/core-engine-client.ts +227 -0
  71. package/src/clients/enterprise-client.ts +334 -0
  72. package/src/clients/generator-client.ts +351 -0
  73. package/src/clients/git-client.ts +627 -0
  74. package/src/clients/github-client.ts +410 -0
  75. package/src/clients/helm-client.ts +504 -0
  76. package/src/clients/index.ts +80 -0
  77. package/src/clients/k8s-client.ts +497 -0
  78. package/src/clients/llm-client.ts +161 -0
  79. package/src/clients/rest-client.ts +130 -0
  80. package/src/clients/service-discovery.ts +33 -0
  81. package/src/clients/terraform-client.ts +482 -0
  82. package/src/clients/tools-client.ts +1843 -0
  83. package/src/clients/ws-client.ts +115 -0
  84. package/src/commands/analyze/index.ts +352 -0
  85. package/src/commands/apply/helm.ts +473 -0
  86. package/src/commands/apply/index.ts +213 -0
  87. package/src/commands/apply/k8s.ts +454 -0
  88. package/src/commands/apply/terraform.ts +582 -0
  89. package/src/commands/ask.ts +167 -0
  90. package/src/commands/audit/index.ts +238 -0
  91. package/src/commands/auth-cloud.ts +294 -0
  92. package/src/commands/auth-list.ts +134 -0
  93. package/src/commands/auth-profile.ts +121 -0
  94. package/src/commands/auth-status.ts +141 -0
  95. package/src/commands/aws/ec2.ts +501 -0
  96. package/src/commands/aws/iam.ts +397 -0
  97. package/src/commands/aws/index.ts +133 -0
  98. package/src/commands/aws/lambda.ts +396 -0
  99. package/src/commands/aws/rds.ts +439 -0
  100. package/src/commands/aws/s3.ts +439 -0
  101. package/src/commands/aws/vpc.ts +393 -0
  102. package/src/commands/aws-discover.ts +649 -0
  103. package/src/commands/aws-terraform.ts +805 -0
  104. package/src/commands/azure/aks.ts +376 -0
  105. package/src/commands/azure/functions.ts +253 -0
  106. package/src/commands/azure/index.ts +116 -0
  107. package/src/commands/azure/storage.ts +478 -0
  108. package/src/commands/azure/vm.ts +355 -0
  109. package/src/commands/billing/index.ts +256 -0
  110. package/src/commands/chat.ts +314 -0
  111. package/src/commands/config.ts +346 -0
  112. package/src/commands/cost/cloud-cost-estimator.ts +266 -0
  113. package/src/commands/cost/estimator.ts +79 -0
  114. package/src/commands/cost/index.ts +594 -0
  115. package/src/commands/cost/parsers/terraform.ts +273 -0
  116. package/src/commands/cost/parsers/types.ts +25 -0
  117. package/src/commands/cost/pricing/aws.ts +544 -0
  118. package/src/commands/cost/pricing/azure.ts +499 -0
  119. package/src/commands/cost/pricing/gcp.ts +396 -0
  120. package/src/commands/cost/pricing/index.ts +40 -0
  121. package/src/commands/demo.ts +250 -0
  122. package/src/commands/doctor.ts +794 -0
  123. package/src/commands/drift/index.ts +439 -0
  124. package/src/commands/explain.ts +277 -0
  125. package/src/commands/feedback.ts +389 -0
  126. package/src/commands/fix.ts +324 -0
  127. package/src/commands/fs/index.ts +402 -0
  128. package/src/commands/gcp/compute.ts +325 -0
  129. package/src/commands/gcp/functions.ts +271 -0
  130. package/src/commands/gcp/gke.ts +438 -0
  131. package/src/commands/gcp/iam.ts +344 -0
  132. package/src/commands/gcp/index.ts +129 -0
  133. package/src/commands/gcp/storage.ts +284 -0
  134. package/src/commands/generate-helm.ts +1249 -0
  135. package/src/commands/generate-k8s.ts +1560 -0
  136. package/src/commands/generate-terraform.ts +1460 -0
  137. package/src/commands/gh/index.ts +863 -0
  138. package/src/commands/git/index.ts +1343 -0
  139. package/src/commands/helm/index.ts +1126 -0
  140. package/src/commands/help.ts +539 -0
  141. package/src/commands/history.ts +142 -0
  142. package/src/commands/import.ts +868 -0
  143. package/src/commands/index.ts +367 -0
  144. package/src/commands/init.ts +1046 -0
  145. package/src/commands/k8s/index.ts +1137 -0
  146. package/src/commands/login.ts +631 -0
  147. package/src/commands/logout.ts +83 -0
  148. package/src/commands/onboarding.ts +228 -0
  149. package/src/commands/plan/display.ts +279 -0
  150. package/src/commands/plan/index.ts +599 -0
  151. package/src/commands/preview.ts +452 -0
  152. package/src/commands/questionnaire.ts +1270 -0
  153. package/src/commands/resume.ts +55 -0
  154. package/src/commands/team/index.ts +346 -0
  155. package/src/commands/template.ts +232 -0
  156. package/src/commands/tf/index.ts +1034 -0
  157. package/src/commands/upgrade.ts +550 -0
  158. package/src/commands/usage/index.ts +134 -0
  159. package/src/commands/version.ts +170 -0
  160. package/src/compat/index.ts +2 -0
  161. package/src/compat/runtime.ts +12 -0
  162. package/src/compat/sqlite.ts +107 -0
  163. package/src/config/index.ts +17 -0
  164. package/src/config/manager.ts +530 -0
  165. package/src/config/safety-policy.ts +358 -0
  166. package/src/config/schema.ts +125 -0
  167. package/src/config/types.ts +527 -0
  168. package/src/context/context-db.ts +199 -0
  169. package/src/demo/index.ts +349 -0
  170. package/src/demo/scenarios/full-journey.ts +229 -0
  171. package/src/demo/scenarios/getting-started.ts +127 -0
  172. package/src/demo/scenarios/helm-release.ts +341 -0
  173. package/src/demo/scenarios/k8s-deployment.ts +194 -0
  174. package/src/demo/scenarios/terraform-vpc.ts +170 -0
  175. package/src/demo/types.ts +92 -0
  176. package/src/engine/cost-estimator.ts +438 -0
  177. package/src/engine/diagram-generator.ts +256 -0
  178. package/src/engine/drift-detector.ts +902 -0
  179. package/src/engine/executor.ts +1035 -0
  180. package/src/engine/index.ts +76 -0
  181. package/src/engine/orchestrator.ts +636 -0
  182. package/src/engine/planner.ts +720 -0
  183. package/src/engine/safety.ts +743 -0
  184. package/src/engine/verifier.ts +770 -0
  185. package/src/enterprise/audit.ts +348 -0
  186. package/src/enterprise/auth.ts +270 -0
  187. package/src/enterprise/billing.ts +822 -0
  188. package/src/enterprise/index.ts +17 -0
  189. package/src/enterprise/teams.ts +443 -0
  190. package/src/generator/best-practices.ts +1608 -0
  191. package/src/generator/helm.ts +630 -0
  192. package/src/generator/index.ts +37 -0
  193. package/src/generator/intent-parser.ts +514 -0
  194. package/src/generator/kubernetes.ts +976 -0
  195. package/src/generator/terraform.ts +1867 -0
  196. package/src/history/index.ts +8 -0
  197. package/src/history/manager.ts +322 -0
  198. package/src/history/types.ts +34 -0
  199. package/src/hooks/config.ts +432 -0
  200. package/src/hooks/engine.ts +391 -0
  201. package/src/hooks/index.ts +4 -0
  202. package/src/llm/auth-bridge.ts +198 -0
  203. package/src/llm/circuit-breaker.ts +140 -0
  204. package/src/llm/config-loader.ts +201 -0
  205. package/src/llm/cost-calculator.ts +171 -0
  206. package/src/llm/index.ts +8 -0
  207. package/src/llm/model-aliases.ts +115 -0
  208. package/src/llm/provider-registry.ts +63 -0
  209. package/src/llm/providers/anthropic.ts +433 -0
  210. package/src/llm/providers/bedrock.ts +477 -0
  211. package/src/llm/providers/google.ts +405 -0
  212. package/src/llm/providers/ollama.ts +767 -0
  213. package/src/llm/providers/openai-compatible.ts +340 -0
  214. package/src/llm/providers/openai.ts +328 -0
  215. package/src/llm/providers/openrouter.ts +338 -0
  216. package/src/llm/router.ts +1035 -0
  217. package/src/llm/types.ts +232 -0
  218. package/src/lsp/client.ts +298 -0
  219. package/src/lsp/languages.ts +116 -0
  220. package/src/lsp/manager.ts +278 -0
  221. package/src/mcp/client.ts +402 -0
  222. package/src/mcp/index.ts +5 -0
  223. package/src/mcp/manager.ts +133 -0
  224. package/src/nimbus.ts +214 -0
  225. package/src/plugins/index.ts +27 -0
  226. package/src/plugins/loader.ts +334 -0
  227. package/src/plugins/manager.ts +376 -0
  228. package/src/plugins/types.ts +284 -0
  229. package/src/scanners/cicd-scanner.ts +258 -0
  230. package/src/scanners/cloud-scanner.ts +466 -0
  231. package/src/scanners/framework-scanner.ts +469 -0
  232. package/src/scanners/iac-scanner.ts +388 -0
  233. package/src/scanners/index.ts +539 -0
  234. package/src/scanners/language-scanner.ts +276 -0
  235. package/src/scanners/package-manager-scanner.ts +277 -0
  236. package/src/scanners/types.ts +172 -0
  237. package/src/sessions/manager.ts +365 -0
  238. package/src/sessions/types.ts +44 -0
  239. package/src/sharing/sync.ts +296 -0
  240. package/src/sharing/viewer.ts +97 -0
  241. package/src/snapshots/index.ts +2 -0
  242. package/src/snapshots/manager.ts +530 -0
  243. package/src/state/artifacts.ts +147 -0
  244. package/src/state/audit.ts +137 -0
  245. package/src/state/billing.ts +240 -0
  246. package/src/state/checkpoints.ts +117 -0
  247. package/src/state/config.ts +67 -0
  248. package/src/state/conversations.ts +14 -0
  249. package/src/state/credentials.ts +154 -0
  250. package/src/state/db.ts +58 -0
  251. package/src/state/index.ts +26 -0
  252. package/src/state/messages.ts +115 -0
  253. package/src/state/projects.ts +123 -0
  254. package/src/state/schema.ts +236 -0
  255. package/src/state/sessions.ts +147 -0
  256. package/src/state/teams.ts +200 -0
  257. package/src/telemetry.ts +108 -0
  258. package/src/tools/aws-ops.ts +952 -0
  259. package/src/tools/azure-ops.ts +579 -0
  260. package/src/tools/file-ops.ts +593 -0
  261. package/src/tools/gcp-ops.ts +625 -0
  262. package/src/tools/git-ops.ts +773 -0
  263. package/src/tools/github-ops.ts +799 -0
  264. package/src/tools/helm-ops.ts +943 -0
  265. package/src/tools/index.ts +17 -0
  266. package/src/tools/k8s-ops.ts +819 -0
  267. package/src/tools/schemas/converter.ts +184 -0
  268. package/src/tools/schemas/devops.ts +612 -0
  269. package/src/tools/schemas/index.ts +73 -0
  270. package/src/tools/schemas/standard.ts +1144 -0
  271. package/src/tools/schemas/types.ts +705 -0
  272. package/src/tools/terraform-ops.ts +862 -0
  273. package/src/types/ambient.d.ts +193 -0
  274. package/src/types/config.ts +83 -0
  275. package/src/types/drift.ts +116 -0
  276. package/src/types/enterprise.ts +335 -0
  277. package/src/types/index.ts +20 -0
  278. package/src/types/plan.ts +44 -0
  279. package/src/types/request.ts +65 -0
  280. package/src/types/response.ts +54 -0
  281. package/src/types/service.ts +51 -0
  282. package/src/ui/App.tsx +997 -0
  283. package/src/ui/DeployPreview.tsx +169 -0
  284. package/src/ui/Header.tsx +68 -0
  285. package/src/ui/InputBox.tsx +350 -0
  286. package/src/ui/MessageList.tsx +585 -0
  287. package/src/ui/PermissionPrompt.tsx +151 -0
  288. package/src/ui/StatusBar.tsx +158 -0
  289. package/src/ui/ToolCallDisplay.tsx +409 -0
  290. package/src/ui/chat-ui.ts +853 -0
  291. package/src/ui/index.ts +33 -0
  292. package/src/ui/ink/index.ts +711 -0
  293. package/src/ui/streaming.ts +176 -0
  294. package/src/ui/types.ts +57 -0
  295. package/src/utils/analytics.ts +72 -0
  296. package/src/utils/cost-warning.ts +27 -0
  297. package/src/utils/env.ts +46 -0
  298. package/src/utils/errors.ts +69 -0
  299. package/src/utils/event-bus.ts +38 -0
  300. package/src/utils/index.ts +24 -0
  301. package/src/utils/logger.ts +171 -0
  302. package/src/utils/rate-limiter.ts +121 -0
  303. package/src/utils/service-auth.ts +49 -0
  304. package/src/utils/validation.ts +53 -0
  305. package/src/version.ts +4 -0
  306. package/src/watcher/index.ts +163 -0
  307. package/src/wizard/approval.ts +383 -0
  308. package/src/wizard/index.ts +25 -0
  309. package/src/wizard/prompts.ts +338 -0
  310. package/src/wizard/types.ts +171 -0
  311. package/src/wizard/ui.ts +556 -0
  312. package/src/wizard/wizard.ts +304 -0
  313. package/tsconfig.json +24 -0
@@ -0,0 +1,227 @@
1
+ /**
2
+ * Compaction Agent
3
+ *
4
+ * Uses a fast LLM model (haiku) to summarize earlier conversation context
5
+ * while preserving key information needed for continuity.
6
+ *
7
+ * The compaction agent is invoked automatically by the context manager
8
+ * when the conversation exceeds the configured threshold, or manually
9
+ * by the user via a `/compact` command in the TUI.
10
+ *
11
+ * Key design decisions:
12
+ * - Uses the cheapest available model (haiku alias) to minimize cost.
13
+ * - Truncates very long tool outputs before sending to the summarizer.
14
+ * - Falls back to a simple extractive summary if the LLM call fails.
15
+ * - Preserves all technical details, file paths, and decisions.
16
+ *
17
+ * @module agent/compaction-agent
18
+ */
19
+
20
+ import type { LLMRouter } from '../llm/router';
21
+ import { getTextContent, type LLMMessage } from '../llm/types';
22
+ import { ContextManager, estimateTokens, type CompactionResult } from './context-manager';
23
+
24
+ // ---------------------------------------------------------------------------
25
+ // Public Types
26
+ // ---------------------------------------------------------------------------
27
+
28
/**
 * Options for running compaction.
 *
 * Supplied by the caller (context manager or `/compact` command handler)
 * to control which router/model performs the summarization.
 */
export interface CompactionOptions {
  /** LLM Router instance for making summary calls. */
  router: LLMRouter;
  /** Optional focus area for the summary (e.g. "terraform changes"). */
  focusArea?: string;
  /** Model to use for compaction (default: haiku). */
  model?: string;
}
37
+
38
+ // ---------------------------------------------------------------------------
39
+ // Constants
40
+ // ---------------------------------------------------------------------------
41
+
42
/**
 * The system prompt given to the compaction model.
 *
 * Instructs the summarizer to retain technical detail (file paths, resource
 * names, errors, decisions) and to emit a fixed five-section structure.
 * The "under 2000 tokens" rule pairs with the `maxTokens: 2048` budget used
 * by the summarization call in `runCompaction`.
 */
const COMPACTION_SYSTEM_PROMPT = `You are a conversation summarizer for the Nimbus CLI agent. Your job is to create a concise summary of a conversation between a user and an AI assistant that helps with cloud infrastructure and DevOps tasks.

Rules:
1. Preserve ALL important technical details: file paths, resource names, configuration values, error messages, decisions made.
2. Preserve the user's original intent and any requirements they specified.
3. Preserve the current state of any ongoing work (what was done, what remains).
4. Remove conversational filler, repeated information, and verbose tool outputs.
5. Use bullet points for clarity.
6. Keep the summary under 2000 tokens.
7. Structure the summary as:
- **User's Goal**: What the user is trying to accomplish
- **Key Decisions**: Important choices that were made
- **Work Completed**: What actions were taken and their results
- **Current State**: Where things stand now
- **Pending Items**: What still needs to be done (if any)`;
58
+
59
+ // ---------------------------------------------------------------------------
60
+ // Public API
61
+ // ---------------------------------------------------------------------------
62
+
63
+ /**
64
+ * Run the compaction agent to summarize a set of messages.
65
+ *
66
+ * Splits the conversation into messages to preserve and messages to
67
+ * summarize (using the context manager's selection logic), sends the
68
+ * latter to a fast LLM for summarization, then reassembles a compacted
69
+ * message array.
70
+ *
71
+ * @param messages - The full conversation message array.
72
+ * @param contextManager - The context manager instance (provides selection logic).
73
+ * @param options - Compaction options (router, model, focus area).
74
+ * @returns The compacted messages and a result summary.
75
+ */
76
+ export async function runCompaction(
77
+ messages: LLMMessage[],
78
+ contextManager: ContextManager,
79
+ options: CompactionOptions
80
+ ): Promise<{ messages: LLMMessage[]; result: CompactionResult }> {
81
+ const { preserved, toSummarize } = contextManager.selectPreservedMessages(messages);
82
+
83
+ // Nothing to summarize -- return early
84
+ if (toSummarize.length === 0) {
85
+ const totalTokens = messages.reduce(
86
+ (sum, m) => sum + estimateTokens(getTextContent(m.content)),
87
+ 0
88
+ );
89
+ return {
90
+ messages,
91
+ result: {
92
+ originalTokens: totalTokens,
93
+ compactedTokens: totalTokens,
94
+ savedTokens: 0,
95
+ summaryPreserved: false,
96
+ },
97
+ };
98
+ }
99
+
100
+ // Format messages for the summarizer
101
+ const conversationText = formatMessagesForSummary(toSummarize);
102
+ const originalTokens = estimateTokens(conversationText);
103
+
104
+ // Build the user prompt for the summarizer
105
+ let userPrompt = `Please summarize the following conversation between a user and the Nimbus AI assistant:\n\n${conversationText}`;
106
+ if (options.focusArea) {
107
+ userPrompt += `\n\nPay special attention to: ${options.focusArea}`;
108
+ }
109
+
110
+ // Call the LLM for summarization using a fast, cheap model
111
+ const model = options.model ?? 'haiku';
112
+ let summary: string;
113
+
114
+ try {
115
+ const response = await options.router.route({
116
+ messages: [
117
+ { role: 'system', content: COMPACTION_SYSTEM_PROMPT },
118
+ { role: 'user', content: userPrompt },
119
+ ],
120
+ model,
121
+ maxTokens: 2048,
122
+ });
123
+ summary = response.content;
124
+ } catch {
125
+ // If LLM call fails, fall back to a simple extractive summary
126
+ summary = fallbackSummary(toSummarize);
127
+ }
128
+
129
+ // Reassemble the compacted message array
130
+ const compactedMessages = contextManager.buildCompactedMessages(preserved, summary);
131
+ const compactedTokens = compactedMessages.reduce(
132
+ (sum, m) => sum + estimateTokens(getTextContent(m.content)),
133
+ 0
134
+ );
135
+
136
+ return {
137
+ messages: compactedMessages,
138
+ result: {
139
+ originalTokens,
140
+ compactedTokens,
141
+ savedTokens: originalTokens - estimateTokens(summary),
142
+ summaryPreserved: true,
143
+ },
144
+ };
145
+ }
146
+
147
+ /**
148
+ * Run manual compaction from a `/compact` command.
149
+ *
150
+ * Creates a temporary context manager with default settings and
151
+ * delegates to {@link runCompaction}.
152
+ *
153
+ * @param messages - The full conversation message array.
154
+ * @param options - Compaction options plus an optional max token override.
155
+ * @returns The compacted messages and a result summary.
156
+ */
157
+ export async function runManualCompaction(
158
+ messages: LLMMessage[],
159
+ options: CompactionOptions & { maxContextTokens?: number }
160
+ ): Promise<{ messages: LLMMessage[]; result: CompactionResult }> {
161
+ const contextManager = new ContextManager({
162
+ maxContextTokens: options.maxContextTokens,
163
+ preserveRecentMessages: 5,
164
+ });
165
+ return runCompaction(messages, contextManager, options);
166
+ }
167
+
168
+ // ---------------------------------------------------------------------------
169
+ // Internal Helpers
170
+ // ---------------------------------------------------------------------------
171
+
172
+ /**
173
+ * Format messages into a readable conversation transcript.
174
+ *
175
+ * Each message is labelled with its role. Very long tool outputs are
176
+ * truncated to avoid overwhelming the summarizer model. Tool call
177
+ * metadata is included inline for context.
178
+ */
179
+ function formatMessagesForSummary(messages: LLMMessage[]): string {
180
+ const parts: string[] = [];
181
+
182
+ for (const msg of messages) {
183
+ const role = msg.role === 'user' ? 'User' : msg.role === 'assistant' ? 'Assistant' : 'Tool';
184
+ const content = getTextContent(msg.content);
185
+
186
+ // Truncate very long tool outputs to keep summarizer input manageable
187
+ const truncated = content.length > 2000 ? `${content.slice(0, 2000)}... [truncated]` : content;
188
+
189
+ parts.push(`[${role}]: ${truncated}`);
190
+
191
+ // Include tool call info if present
192
+ if (msg.toolCalls) {
193
+ for (const tc of msg.toolCalls) {
194
+ parts.push(` [Tool Call: ${tc.function.name}(${tc.function.arguments.slice(0, 200)})]`);
195
+ }
196
+ }
197
+ }
198
+
199
+ return parts.join('\n\n');
200
+ }
201
+
202
+ /**
203
+ * Fallback summary when the LLM is unavailable.
204
+ *
205
+ * Produces a simple extractive summary by listing message counts
206
+ * and the first few user messages. This is better than nothing when
207
+ * the compaction model cannot be reached.
208
+ */
209
+ function fallbackSummary(messages: LLMMessage[]): string {
210
+ const userMessages = messages.filter(m => m.role === 'user');
211
+ const assistantMessages = messages.filter(m => m.role === 'assistant');
212
+
213
+ const parts: string[] = ['**Conversation Summary (auto-generated)**\n'];
214
+ parts.push(
215
+ `- ${userMessages.length} user messages and ${assistantMessages.length} assistant responses`
216
+ );
217
+
218
+ // Extract key topics from user messages
219
+ for (const msg of userMessages.slice(0, 5)) {
220
+ const content = getTextContent(msg.content);
221
+ if (content.length > 0) {
222
+ parts.push(`- User asked: "${content.slice(0, 150)}${content.length > 150 ? '...' : ''}"`);
223
+ }
224
+ }
225
+
226
+ return parts.join('\n');
227
+ }
@@ -0,0 +1,435 @@
1
+ /**
2
+ * Context Manager — Token Tracking & Auto-Compact
3
+ *
4
+ * Tracks cumulative token usage across the agent loop and triggers
5
+ * automatic context compaction when usage exceeds a configurable
6
+ * threshold (default 85% of the model's context window).
7
+ *
8
+ * The manager provides:
9
+ * - Token estimation for messages, system prompts, and tool definitions.
10
+ * - A breakdown of how the context budget is being consumed.
11
+ * - Message selection logic for deciding what to preserve vs. summarize.
12
+ * - A builder for reassembling messages after compaction.
13
+ *
14
+ * Configuration can be supplied via constructor options or read from the
15
+ * Nimbus config database (keys: `context.auto_compact_threshold`,
16
+ * `context.max_file_injection`).
17
+ *
18
+ * @module agent/context-manager
19
+ */
20
+
21
+ import { getTextContent, type LLMMessage } from '../llm/types';
22
+ import { getConfig } from '../state/config';
23
+
24
+ // ---------------------------------------------------------------------------
25
+ // Public Types
26
+ // ---------------------------------------------------------------------------
27
+
28
+ /** Detailed breakdown of how the context window budget is being used. */
29
+ export interface ContextBreakdown {
30
+ /** Tokens consumed by the base system prompt (excluding NIMBUS.md). */
31
+ systemPrompt: number;
32
+ /** Tokens consumed by NIMBUS.md instructions within the system prompt. */
33
+ nimbusInstructions: number;
34
+ /** Tokens consumed by all conversation messages. */
35
+ messages: number;
36
+ /** Tokens consumed by tool definition schemas. */
37
+ toolDefinitions: number;
38
+ /** Sum of all token categories. */
39
+ total: number;
40
+ /** Total available budget (model context window size). */
41
+ budget: number;
42
+ /** Percentage of budget currently in use (0-100). */
43
+ usagePercent: number;
44
+ }
45
+
46
+ /** Result of a compaction operation. */
47
+ export interface CompactionResult {
48
+ /** Token count of the messages that were summarized. */
49
+ originalTokens: number;
50
+ /** Token count of the compacted message array. */
51
+ compactedTokens: number;
52
+ /** Tokens saved by compaction (originalTokens - summary tokens). */
53
+ savedTokens: number;
54
+ /** Whether a proper LLM summary was produced (false = fallback used). */
55
+ summaryPreserved: boolean;
56
+ }
57
+
58
+ /** Configuration options for the context manager. */
59
+ export interface ContextManagerOptions {
60
+ /** Max context window tokens (default: auto-detected from model, fallback 200000). */
61
+ maxContextTokens?: number;
62
+ /** Model identifier — used to auto-detect context window size. */
63
+ model?: string;
64
+ /** Threshold percentage to trigger auto-compact (0.0 - 1.0, default: 0.85). */
65
+ autoCompactThreshold?: number;
66
+ /** Number of recent messages to always preserve during compaction (default: 5). */
67
+ preserveRecentMessages?: number;
68
+ /** NIMBUS.md section keys that should always remain in context. */
69
+ alwaysInContext?: string[];
70
+ }
71
+
72
+ // ---------------------------------------------------------------------------
73
+ // Per-Model Context Window Sizes
74
+ // ---------------------------------------------------------------------------
75
+
76
+ /**
77
+ * Known context window sizes (in tokens) for popular models.
78
+ *
79
+ * When a model is not listed here, the manager falls back to the
80
+ * `maxContextTokens` option (default: 200 000).
81
+ */
82
+ const MODEL_CONTEXT_WINDOWS: Record<string, number> = {
83
+ // Anthropic
84
+ 'claude-opus-4-20250514': 200_000,
85
+ 'claude-sonnet-4-20250514': 200_000,
86
+ 'claude-haiku-4-20250514': 200_000,
87
+ 'claude-3-5-sonnet-20241022': 200_000,
88
+ 'claude-3-5-haiku-20241022': 200_000,
89
+ 'claude-3-opus-20240229': 200_000,
90
+ 'claude-3-sonnet-20240229': 200_000,
91
+ 'claude-3-haiku-20240307': 200_000,
92
+
93
+ // OpenAI
94
+ 'gpt-4o': 128_000,
95
+ 'gpt-4o-mini': 128_000,
96
+ 'gpt-4-turbo': 128_000,
97
+ 'gpt-4': 8_192,
98
+ 'gpt-3.5-turbo': 16_385,
99
+ o1: 200_000,
100
+ 'o1-mini': 128_000,
101
+ 'o1-preview': 128_000,
102
+ 'o3-mini': 200_000,
103
+
104
+ // Google
105
+ 'gemini-2.0-flash-exp': 1_048_576,
106
+ 'gemini-1.5-pro': 2_097_152,
107
+ 'gemini-1.5-flash': 1_048_576,
108
+
109
+ // Groq (Llama)
110
+ 'llama-3.1-70b-versatile': 131_072,
111
+ 'llama-3.1-8b-instant': 131_072,
112
+ 'llama-3.3-70b-versatile': 131_072,
113
+
114
+ // DeepSeek
115
+ 'deepseek-chat': 64_000,
116
+ 'deepseek-coder': 64_000,
117
+ 'deepseek-reasoner': 64_000,
118
+
119
+ // Local (Ollama defaults — dynamic lookup can override)
120
+ 'llama3.2': 128_000,
121
+ mistral: 32_768,
122
+ codellama: 16_384,
123
+ };
124
+
125
+ /**
126
+ * Look up the context window size for a model identifier.
127
+ *
128
+ * Tries exact match first, then prefix match (for versioned model IDs
129
+ * like `claude-sonnet-4-20250514`), then returns `null` if unknown.
130
+ */
131
+ export function getModelContextWindow(model: string): number | null {
132
+ // Exact match
133
+ if (MODEL_CONTEXT_WINDOWS[model] !== undefined) {
134
+ return MODEL_CONTEXT_WINDOWS[model];
135
+ }
136
+
137
+ // Prefix match: e.g., "gpt-4o-2024-08-06" should match "gpt-4o"
138
+ for (const [key, value] of Object.entries(MODEL_CONTEXT_WINDOWS)) {
139
+ if (model.startsWith(key)) {
140
+ return value;
141
+ }
142
+ }
143
+
144
+ return null;
145
+ }
146
+
147
+ // ---------------------------------------------------------------------------
148
+ // Token Estimation Utilities
149
+ // ---------------------------------------------------------------------------
150
+
151
+ /**
152
+ * Rough token estimate based on character count.
153
+ *
154
+ * Uses the common heuristic of ~4 characters per token, which is a
155
+ * reasonable average across English text and source code.
156
+ *
157
+ * @param text - The text to estimate.
158
+ * @returns Approximate token count (rounded up).
159
+ */
160
+ export function estimateTokens(text: string): number {
161
+ return Math.ceil(text.length / 4);
162
+ }
163
+
164
+ /**
165
+ * Estimate token count for a single LLM message.
166
+ *
167
+ * Accounts for the message content, structural overhead (role, framing),
168
+ * and any tool calls embedded in the message.
169
+ *
170
+ * @param message - The LLM message to estimate.
171
+ * @returns Approximate token count.
172
+ */
173
+ export function estimateMessageTokens(message: LLMMessage): number {
174
+ let tokens = 0;
175
+
176
+ tokens += estimateTokens(getTextContent(message.content));
177
+
178
+ // Add overhead for role and message structure
179
+ tokens += 4;
180
+
181
+ // Tool calls add extra tokens for name, arguments, and JSON structure
182
+ if (message.toolCalls) {
183
+ for (const tc of message.toolCalls) {
184
+ tokens += estimateTokens(tc.function.name);
185
+ tokens += estimateTokens(tc.function.arguments);
186
+ tokens += 10; // structural overhead per tool call
187
+ }
188
+ }
189
+
190
+ return tokens;
191
+ }
192
+
193
+ // ---------------------------------------------------------------------------
194
+ // ContextManager Class
195
+ // ---------------------------------------------------------------------------
196
+
197
+ /**
198
+ * Manages context window budget and auto-compaction decisions.
199
+ *
200
+ * Create one instance per agent session. The manager does not hold
201
+ * conversation state itself -- it operates on message arrays passed in
202
+ * by the caller.
203
+ */
204
+ export class ContextManager {
205
+ private maxContextTokens: number;
206
+ private autoCompactThreshold: number;
207
+ private preserveRecentMessages: number;
208
+ private alwaysInContext: string[];
209
+
210
+ constructor(options?: ContextManagerOptions) {
211
+ // Try loading from config DB, fall back to options/defaults
212
+ const configThreshold = getConfigSafe('context.auto_compact_threshold');
213
+
214
+ // Auto-detect context window from model if provided, then options, then default
215
+ const modelWindow = options?.model ? getModelContextWindow(options.model) : null;
216
+ this.maxContextTokens = options?.maxContextTokens ?? modelWindow ?? 200_000;
217
+ this.autoCompactThreshold = configThreshold ?? options?.autoCompactThreshold ?? 0.85;
218
+ this.preserveRecentMessages = options?.preserveRecentMessages ?? 5;
219
+ this.alwaysInContext = options?.alwaysInContext ?? [];
220
+ }
221
+
222
+ /**
223
+ * Check whether auto-compaction should be triggered.
224
+ *
225
+ * Returns `true` if the estimated token usage is at or above the
226
+ * configured threshold percentage of the context window.
227
+ *
228
+ * @param systemPrompt - The full system prompt string.
229
+ * @param messages - Current conversation messages.
230
+ * @param toolDefinitionsTokens - Pre-computed token count for tool schemas.
231
+ * @returns `true` if compaction should run.
232
+ */
233
+ shouldCompact(
234
+ systemPrompt: string,
235
+ messages: LLMMessage[],
236
+ toolDefinitionsTokens: number
237
+ ): boolean {
238
+ const usage = this.calculateUsage(systemPrompt, messages, toolDefinitionsTokens);
239
+ return usage.usagePercent >= this.autoCompactThreshold * 100;
240
+ }
241
+
242
+ /**
243
+ * Calculate a detailed context usage breakdown.
244
+ *
245
+ * Separates the system prompt into base instructions and NIMBUS.md
246
+ * content (if present), and sums up messages and tool definitions
247
+ * to produce a full picture of context window consumption.
248
+ *
249
+ * @param systemPrompt - The full system prompt string.
250
+ * @param messages - Current conversation messages.
251
+ * @param toolDefinitionsTokens - Pre-computed token count for tool schemas.
252
+ * @returns A {@link ContextBreakdown} with per-category token counts.
253
+ */
254
+ calculateUsage(
255
+ systemPrompt: string,
256
+ messages: LLMMessage[],
257
+ toolDefinitionsTokens: number
258
+ ): ContextBreakdown {
259
+ const systemPromptTokens = estimateTokens(systemPrompt);
260
+
261
+ // Separate NIMBUS.md instructions if they appear in system prompt
262
+ const nimbusMarker = '# NIMBUS.md';
263
+ const nimbusIdx = systemPrompt.indexOf(nimbusMarker);
264
+ let nimbusInstructionsTokens = 0;
265
+ let baseSystemTokens = systemPromptTokens;
266
+
267
+ if (nimbusIdx >= 0) {
268
+ const nimbusContent = systemPrompt.slice(nimbusIdx);
269
+ nimbusInstructionsTokens = estimateTokens(nimbusContent);
270
+ baseSystemTokens = systemPromptTokens - nimbusInstructionsTokens;
271
+ }
272
+
273
+ const messagesTokens = messages.reduce((sum, msg) => sum + estimateMessageTokens(msg), 0);
274
+
275
+ const total = systemPromptTokens + messagesTokens + toolDefinitionsTokens;
276
+ const usagePercent =
277
+ this.maxContextTokens > 0 ? Math.round((total / this.maxContextTokens) * 100) : 0;
278
+
279
+ return {
280
+ systemPrompt: baseSystemTokens,
281
+ nimbusInstructions: nimbusInstructionsTokens,
282
+ messages: messagesTokens,
283
+ toolDefinitions: toolDefinitionsTokens,
284
+ total,
285
+ budget: this.maxContextTokens,
286
+ usagePercent,
287
+ };
288
+ }
289
+
290
+ /**
291
+ * Select which messages to preserve during compaction.
292
+ *
293
+ * Preservation rules:
294
+ * - The first message is always kept (initial user context).
295
+ * - The last N messages are always kept (recent conversation).
296
+ * - Tool messages near the recent window are kept (active tool state).
297
+ * - Previous compaction summary blocks are always kept.
298
+ * - Everything else is marked for summarization.
299
+ *
300
+ * @param messages - The full conversation message array.
301
+ * @returns An object with `preserved` and `toSummarize` arrays.
302
+ */
303
+ selectPreservedMessages(messages: LLMMessage[]): {
304
+ preserved: LLMMessage[];
305
+ toSummarize: LLMMessage[];
306
+ } {
307
+ if (messages.length <= this.preserveRecentMessages + 1) {
308
+ return { preserved: [...messages], toSummarize: [] };
309
+ }
310
+
311
+ const preserved: LLMMessage[] = [];
312
+ const toSummarize: LLMMessage[] = [];
313
+
314
+ for (let i = 0; i < messages.length; i++) {
315
+ const msg = messages[i];
316
+ const isFirst = i === 0;
317
+ const isRecent = i >= messages.length - this.preserveRecentMessages;
318
+ const hasActiveTools =
319
+ msg.role === 'tool' && i >= messages.length - this.preserveRecentMessages - 2;
320
+
321
+ // Always preserve summary blocks (from previous compactions)
322
+ const isSummary = getTextContent(msg.content).startsWith('[Context Summary]');
323
+
324
+ if (isFirst || isRecent || hasActiveTools || isSummary) {
325
+ preserved.push(msg);
326
+ } else {
327
+ toSummarize.push(msg);
328
+ }
329
+ }
330
+
331
+ return { preserved, toSummarize };
332
+ }
333
+
334
+ /**
335
+ * Build the compacted message array by inserting a summary.
336
+ *
337
+ * Places the summary as a user message immediately after the first
338
+ * preserved message, then appends all remaining preserved messages.
339
+ * The summary is wrapped with `[Context Summary]` markers so future
340
+ * compaction passes can identify and preserve it.
341
+ *
342
+ * @param preserved - Messages to keep verbatim.
343
+ * @param summary - The LLM-generated (or fallback) summary text.
344
+ * @returns A new message array ready to replace the original.
345
+ */
346
+ buildCompactedMessages(preserved: LLMMessage[], summary: string): LLMMessage[] {
347
+ const result: LLMMessage[] = [];
348
+
349
+ // Keep the first preserved message (typically the first user message)
350
+ if (preserved.length > 0) {
351
+ result.push(preserved[0]);
352
+ }
353
+
354
+ // Insert the summary as a user message with a clear marker
355
+ result.push({
356
+ role: 'user' as const,
357
+ content: `[Context Summary] The following is a summary of the earlier conversation:\n\n${summary}\n\n---\nThe conversation continues below.`,
358
+ });
359
+
360
+ // Append remaining preserved messages
361
+ for (let i = 1; i < preserved.length; i++) {
362
+ result.push(preserved[i]);
363
+ }
364
+
365
+ return result;
366
+ }
367
+
368
+ /**
369
+ * Get the current configuration values.
370
+ *
371
+ * Useful for displaying context status in the TUI.
372
+ */
373
+ getConfig(): {
374
+ maxContextTokens: number;
375
+ autoCompactThreshold: number;
376
+ preserveRecentMessages: number;
377
+ } {
378
+ return {
379
+ maxContextTokens: this.maxContextTokens,
380
+ autoCompactThreshold: this.autoCompactThreshold,
381
+ preserveRecentMessages: this.preserveRecentMessages,
382
+ };
383
+ }
384
+
385
+ /**
386
+ * Update the max context tokens.
387
+ *
388
+ * Call this when the model changes mid-session so the compaction
389
+ * threshold adjusts to the new model's context window.
390
+ *
391
+ * @param tokens - The new maximum context window size.
392
+ */
393
+ setMaxContextTokens(tokens: number): void {
394
+ this.maxContextTokens = tokens;
395
+ }
396
+
397
+ /**
398
+ * Update the context window based on a model identifier.
399
+ *
400
+ * Looks up the model's known context window size. If the model is
401
+ * not in the built-in map, the current budget is left unchanged.
402
+ *
403
+ * @param model - The model identifier (e.g., "gpt-4o", "claude-sonnet-4-20250514").
404
+ * @returns `true` if the budget was updated, `false` if model is unknown.
405
+ */
406
+ setModel(model: string): boolean {
407
+ // Strip provider prefix (e.g., "openai/gpt-4o" → "gpt-4o")
408
+ const stripped = model.includes('/') ? model.split('/').slice(1).join('/') : model;
409
+ const window = getModelContextWindow(stripped);
410
+ if (window !== null) {
411
+ this.maxContextTokens = window;
412
+ return true;
413
+ }
414
+ return false;
415
+ }
416
+ }
417
+
418
+ // ---------------------------------------------------------------------------
419
+ // Internal Helpers
420
+ // ---------------------------------------------------------------------------
421
+
422
+ /**
423
+ * Safely read a config value without crashing if the DB is not ready.
424
+ *
425
+ * During early initialization the SQLite database may not yet be open.
426
+ * This wrapper catches any error and returns `null` so the constructor
427
+ * can fall back to provided options or built-in defaults.
428
+ */
429
+ function getConfigSafe(key: string): any | null {
430
+ try {
431
+ return getConfig(key);
432
+ } catch {
433
+ return null;
434
+ }
435
+ }