npm - @nuvin/nuvin-core - Versions diffs - 1.1.2 → 1.3.0 - Mend

@nuvin/nuvin-core 1.1.2 → 1.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (4) hide show

package/dist/index.js CHANGED Viewed

@@ -36,6 +36,345 @@ var AgentEventTypes = {
   SubAgentCompleted: "sub_agent_completed"
 };
+// metrics.ts
+var createEmptySnapshot = () => ({
+  totalTokens: 0,
+  totalPromptTokens: 0,
+  totalCompletionTokens: 0,
+  totalCachedTokens: 0,
+  totalReasoningTokens: 0,
+  requestCount: 0,
+  llmCallCount: 0,
+  toolCallCount: 0,
+  totalTimeMs: 0,
+  totalCost: 0,
+  currentTokens: 0,
+  currentPromptTokens: 0,
+  currentCompletionTokens: 0,
+  currentCachedTokens: 0,
+  currentCost: 0
+});
+var NoopMetricsPort = class {
+  recordLLMCall(_usage, _cost) {
+  }
+  recordToolCall() {
+  }
+  recordRequestComplete(_responseTimeMs) {
+  }
+  setContextWindow(_limit, _usage) {
+  }
+  reset() {
+  }
+  getSnapshot() {
+    return createEmptySnapshot();
+  }
+};
+var InMemoryMetricsPort = class {
+  snapshot = createEmptySnapshot();
+  onChange;
+  constructor(onChange) {
+    this.onChange = onChange;
+  }
+  emit() {
+    this.onChange?.({ ...this.snapshot });
+  }
+  recordLLMCall(usage, cost) {
+    const prompt = usage.prompt_tokens ?? 0;
+    const completion = usage.completion_tokens ?? 0;
+    const total = usage.total_tokens ?? prompt + completion;
+    const cached = usage.prompt_tokens_details?.cached_tokens ?? 0;
+    const reasoning = usage.reasoning_tokens ?? usage.completion_tokens_details?.reasoning_tokens ?? 0;
+    const actualCost = cost ?? usage.cost ?? 0;
+    this.snapshot.totalTokens += total;
+    this.snapshot.totalPromptTokens += prompt;
+    this.snapshot.totalCompletionTokens += completion;
+    this.snapshot.totalCachedTokens += cached;
+    this.snapshot.totalReasoningTokens += reasoning;
+    this.snapshot.totalCost += actualCost;
+    this.snapshot.llmCallCount += 1;
+    this.snapshot.currentTokens = total;
+    this.snapshot.currentPromptTokens = prompt;
+    this.snapshot.currentCompletionTokens = completion;
+    this.snapshot.currentCachedTokens = cached;
+    this.snapshot.currentCost = actualCost;
+    this.emit();
+  }
+  recordToolCall() {
+    this.snapshot.toolCallCount += 1;
+    this.emit();
+  }
+  recordRequestComplete(responseTimeMs) {
+    this.snapshot.requestCount += 1;
+    this.snapshot.totalTimeMs += responseTimeMs;
+    this.emit();
+  }
+  setContextWindow(limit, usage) {
+    this.snapshot.contextWindowLimit = limit;
+    this.snapshot.contextWindowUsage = usage;
+    this.emit();
+  }
+  reset() {
+    this.snapshot = createEmptySnapshot();
+    this.emit();
+  }
+  getSnapshot() {
+    return { ...this.snapshot };
+  }
+  setOnChange(fn) {
+    this.onChange = fn;
+  }
+};
+// clock.ts
+var SystemClock = class {
+  now() {
+    return Date.now();
+  }
+  iso(dateMs) {
+    return new Date(dateMs ?? Date.now()).toISOString();
+  }
+};
+// id.ts
+var SimpleId = class {
+  uuid() {
+    return "xxxxxxxx-xxxx-4xxx-yxxx-xxxxxxxxxxxx".replace(/[xy]/g, (c) => {
+      const r = Math.random() * 16 | 0;
+      const v = c === "x" ? r : r & 3 | 8;
+      return v.toString(16);
+    });
+  }
+};
+// cost.ts
+var SimpleCost = class {
+  estimate(_model, usage) {
+    return usage?.cost;
+  }
+};
+// reminders.ts
+var NoopReminders = class {
+  enhance(content, _opts) {
+    return [content];
+  }
+};
+// context.ts
+var toProviderContent = (content) => {
+  if (content === null || content === void 0) {
+    return "";
+  }
+  if (typeof content === "string") {
+    return content;
+  }
+  if (content.type === "parts") {
+    const providerParts = [];
+    for (const part of content.parts) {
+      if (part.type === "text") {
+        if (part.text.length > 0) {
+          providerParts.push({ type: "text", text: part.text });
+        }
+        continue;
+      }
+      const label = part.altText ?? (part.name ? `Image attachment: ${part.name}` : void 0);
+      if (label) {
+        providerParts.push({ type: "text", text: label });
+      }
+      const url = `data:${part.mimeType};base64,${part.data}`;
+      providerParts.push({ type: "image_url", image_url: { url } });
+    }
+    return providerParts.length > 0 ? providerParts : [];
+  }
+  return [];
+};
+var SimpleContextBuilder = class {
+  toProviderMessages(history, systemPrompt, newUserContent) {
+    const transformed = [];
+    for (const m of history) {
+      const providerContent = toProviderContent(m.content);
+      if (m.role === "user") {
+        transformed.push({ role: "user", content: providerContent ?? "" });
+      } else if (m.role === "assistant") {
+        if (m.tool_calls && m.tool_calls.length > 0) {
+          transformed.push({
+            ...m,
+            role: "assistant",
+            content: providerContent ?? null,
+            tool_calls: m.tool_calls
+          });
+        } else {
+          transformed.push({
+            ...m,
+            role: "assistant",
+            content: providerContent ?? ""
+          });
+        }
+      } else if (m.role === "tool") {
+        if (m.tool_call_id) {
+          transformed.push({
+            role: "tool",
+            content: typeof providerContent === "string" ? providerContent : providerContent ?? "",
+            tool_call_id: m.tool_call_id,
+            name: m.name
+          });
+        }
+      }
+    }
+    const userMsgs = newUserContent.map((c) => ({
+      role: "user",
+      content: toProviderContent(c) ?? ""
+    }));
+    return [{ role: "system", content: systemPrompt }, ...transformed, ...userMsgs];
+  }
+};
+// persistent/memory.ts
+var InMemoryMemory = class {
+  store = /* @__PURE__ */ new Map();
+  async get(key) {
+    return this.store.get(key) ?? [];
+  }
+  async set(key, items) {
+    this.store.set(key, [...items]);
+  }
+  async append(key, items) {
+    const existing = this.store.get(key) ?? [];
+    this.store.set(key, [...existing, ...items]);
+  }
+  async delete(key) {
+    this.store.delete(key);
+  }
+  async keys() {
+    return Array.from(this.store.keys());
+  }
+  async clear() {
+    this.store.clear();
+  }
+  async exportSnapshot() {
+    const snap = {};
+    for (const [k, v] of this.store.entries()) snap[k] = [...v];
+    return snap;
+  }
+  async importSnapshot(snapshot) {
+    this.store.clear();
+    for (const [k, v] of Object.entries(snapshot)) this.store.set(k, [...v]);
+  }
+};
+var JsonFileMemoryPersistence = class {
+  constructor(filename = "history.json") {
+    this.filename = filename;
+  }
+  async load() {
+    try {
+      const fs10 = await import("fs");
+      if (!fs10.existsSync(this.filename)) return {};
+      const text = fs10.readFileSync(this.filename, "utf-8");
+      const data = JSON.parse(text);
+      return typeof data === "object" && data ? data : {};
+    } catch {
+      console.warn(`Failed to load memory from ${this.filename}`);
+      return {};
+    }
+  }
+  async save(snapshot) {
+    try {
+      const fs10 = await import("fs");
+      const path9 = await import("path");
+      const dir = path9.dirname(this.filename);
+      if (dir && dir !== "." && !fs10.existsSync(dir)) {
+        fs10.mkdirSync(dir, { recursive: true });
+      }
+      fs10.writeFileSync(this.filename, JSON.stringify(snapshot, null, 2), "utf-8");
+    } catch (err2) {
+      console.warn(`Failed to save memory to ${this.filename}`, err2);
+    }
+  }
+};
+var PersistedMemory = class {
+  constructor(persistence) {
+    this.persistence = persistence;
+  }
+  inner = new InMemoryMemory();
+  initialized = false;
+  async ensureInitialized() {
+    if (this.initialized) return;
+    const snap = await this.persistence.load();
+    if (snap && typeof snap === "object") await this.inner.importSnapshot(snap);
+    this.initialized = true;
+  }
+  async save() {
+    const snap = await this.inner.exportSnapshot();
+    await this.persistence.save(snap);
+  }
+  async get(key) {
+    await this.ensureInitialized();
+    return this.inner.get(key);
+  }
+  async set(key, items) {
+    await this.ensureInitialized();
+    await this.inner.set(key, items);
+    await this.save();
+  }
+  async append(key, items) {
+    await this.ensureInitialized();
+    await this.inner.append(key, items);
+    await this.save();
+  }
+  async delete(key) {
+    await this.ensureInitialized();
+    await this.inner.delete(key);
+    await this.save();
+  }
+  async keys() {
+    await this.ensureInitialized();
+    return this.inner.keys();
+  }
+  async clear() {
+    await this.ensureInitialized();
+    await this.inner.clear();
+    await this.save();
+  }
+  async exportSnapshot() {
+    await this.ensureInitialized();
+    return this.inner.exportSnapshot();
+  }
+  async importSnapshot(snapshot) {
+    await this.ensureInitialized();
+    await this.inner.importSnapshot(snapshot);
+    await this.save();
+  }
+};
+// events.ts
+var NoopEventPort = class {
+  emit(_event) {
+  }
+};
+var PersistingConsoleEventPort = class {
+  memory;
+  maxPerConversation;
+  writeQueue = Promise.resolve();
+  constructor(opts) {
+    this.memory = opts?.memory ?? new PersistedMemory(new JsonFileMemoryPersistence(opts?.filename || "events.json"));
+    this.maxPerConversation = opts?.maxPerConversation ?? 500;
+  }
+  async emit(event) {
+    this.writeQueue = this.writeQueue.then(async () => {
+      try {
+        const key = event?.conversationId ?? "default";
+        const existing = await this.memory.get(key);
+        const next = [...existing, { ...event }];
+        const max = this.maxPerConversation;
+        const trimmed = max > 0 && next.length > max ? next.slice(next.length - max) : next;
+        await this.memory.set(key, trimmed);
+      } catch {
+      }
+    });
+    return this.writeQueue;
+  }
+};
 // orchestrator.ts
 var removeAttachmentTokens = (value, attachments) => {
   return attachments.reduce((acc, attachment) => {
@@ -107,9 +446,29 @@ var resolveDisplayText = (text, attachments, provided) => {
 var AgentOrchestrator = class {
   constructor(cfg, deps) {
     this.cfg = cfg;
-    this.deps = deps;
+    this.memory = deps.memory;
+    this.tools = deps.tools;
+    this.llm = deps.llm;
+    this.context = deps.context ?? this.context;
+    this.ids = deps.ids ?? this.ids;
+    this.clock = deps.clock ?? this.clock;
+    this.cost = deps.cost ?? this.cost;
+    this.reminders = deps.reminders ?? this.reminders;
+    this.metrics = deps.metrics ?? this.metrics;
+    this.events = deps.events ?? this.events;
   }
   pendingApprovals = /* @__PURE__ */ new Map();
+  context = new SimpleContextBuilder();
+  ids = new SimpleId();
+  clock = new SystemClock();
+  cost = new SimpleCost();
+  reminders = new NoopReminders();
+  // private llm: LLMPort;
+  metrics = new NoopMetricsPort();
+  events = new NoopEventPort();
+  llm;
+  tools;
+  memory;
   /**
    * Updates the agent configuration dynamically after initialization.
    * This allows for runtime changes to model, provider, and other settings.
@@ -122,26 +481,26 @@ var AgentOrchestrator = class {
    * This preserves conversation history, MCP connections, and other state.
    */
   setLLM(newLLM) {
-    this.deps.llm = newLLM;
+    this.llm = newLLM;
   }
   /**
    * Updates the tool port without reinitializing the entire orchestrator.
    * This preserves conversation history and other state while adding/removing tools.
    */
   setTools(newTools) {
-    this.deps.tools = newTools;
+    this.tools = newTools;
   }
   /**
    * Gets the current tool port.
    */
   getTools() {
-    return this.deps.tools;
+    return this.tools;
   }
   /**
    * Gets the current LLM port.
    */
   getLLM() {
-    return this.deps.llm;
+    return this.llm;
   }
   /**
    * Gets the current agent configuration.
@@ -155,14 +514,26 @@ var AgentOrchestrator = class {
    * MCP servers, and other state.
    */
   setMemory(newMemory) {
-    this.deps.memory = newMemory;
+    this.memory = newMemory;
   }
   /**
    * Updates the event port without reinitializing the entire orchestrator.
    * This is useful when switching to a new session with a different event log file.
    */
   setEvents(newEvents) {
-    this.deps.events = newEvents;
+    this.events = newEvents;
+  }
+  /**
+   * Updates the metrics port without reinitializing the entire orchestrator.
+   */
+  setMetrics(newMetrics) {
+    this.metrics = newMetrics;
+  }
+  /**
+   * Gets the current metrics port.
+   */
+  getMetrics() {
+    return this.metrics;
   }
   /**
    * Determines if a tool should bypass approval requirements.
@@ -175,10 +546,10 @@ var AgentOrchestrator = class {
   }
   async handleToolDenial(denialMessage, conversationId, messageId, accumulatedMessages, turnHistory, originalToolCalls, assistantContent, usage) {
     const assistantMsg = {
-      id: this.deps.ids.uuid(),
+      id: this.ids.uuid(),
       role: "assistant",
       content: assistantContent ?? null,
-      timestamp: this.deps.clock.iso(),
+      timestamp: this.clock.iso(),
       tool_calls: originalToolCalls,
       usage
     };
@@ -201,15 +572,15 @@ var AgentOrchestrator = class {
         id: toolCall.id,
         role: "tool",
         content: toolDenialResult,
-        timestamp: this.deps.clock.iso(),
+        timestamp: this.clock.iso(),
         tool_call_id: toolCall.id,
         name: toolCall.function.name
       };
       turnHistory.push(toolMsg);
       toolResultMsgs.push(toolMsg);
     }
-    await this.deps.memory.append(conversationId, [assistantMsg, ...toolResultMsgs]);
-    await this.deps.events?.emit({
+    await this.memory.append(conversationId, [assistantMsg, ...toolResultMsgs]);
+    await this.events?.emit({
       type: AgentEventTypes.AssistantMessage,
       conversationId,
       messageId,
@@ -247,15 +618,19 @@ var AgentOrchestrator = class {
   }
   async send(content, opts = {}) {
     const convo = opts.conversationId ?? "default";
-    const t0 = this.deps.clock.now();
-    const msgId = this.deps.ids.uuid();
-    const history = await this.deps.memory.get(convo);
+    const t0 = this.clock.now();
+    const msgId = this.ids.uuid();
+    const history = await this.memory.get(convo);
     let providerMsgs;
     let userMessages;
     let userDisplay;
     let enhanced;
+    const _llm = this.getLLM();
+    if (!_llm) {
+      throw new Error("LLM provider not set");
+    }
     if (opts.retry) {
-      providerMsgs = this.deps.context.toProviderMessages(history, this.cfg.systemPrompt, []);
+      providerMsgs = this.context.toProviderMessages(history, this.cfg.systemPrompt, []);
       userMessages = [];
       userDisplay = "[Retry]";
       enhanced = [];
@@ -266,7 +641,7 @@ var AgentOrchestrator = class {
         attachments: Array.isArray(content.attachments) ? content.attachments : []
       };
       const attachments = normalized.attachments;
-      enhanced = this.deps.reminders.enhance(normalized.text, { conversationId: convo });
+      enhanced = this.reminders.enhance(normalized.text, { conversationId: convo });
       const enhancedCombined = enhanced.join("\n");
       const messageParts = buildMessageParts(enhancedCombined, attachments);
       let userContent;
@@ -279,16 +654,16 @@ var AgentOrchestrator = class {
       } else {
         userContent = enhancedCombined;
       }
-      providerMsgs = this.deps.context.toProviderMessages(history, this.cfg.systemPrompt, [userContent]);
+      providerMsgs = this.context.toProviderMessages(history, this.cfg.systemPrompt, [userContent]);
       userDisplay = resolveDisplayText(normalized.text, attachments, normalized.displayText);
-      const userTimestamp = this.deps.clock.iso();
-      userMessages = [{ id: this.deps.ids.uuid(), role: "user", content: userContent, timestamp: userTimestamp }];
-      await this.deps.memory.append(convo, userMessages);
+      const userTimestamp = this.clock.iso();
+      userMessages = [{ id: this.ids.uuid(), role: "user", content: userContent, timestamp: userTimestamp }];
+      await this.memory.append(convo, userMessages);
     }
     if (opts.signal?.aborted) throw new Error("Aborted");
-    const toolDefs = this.deps.tools.getToolDefinitions(this.cfg.enabledTools ?? []);
+    const toolDefs = this.tools.getToolDefinitions(this.cfg.enabledTools ?? []);
     const toolNames = toolDefs.map((t) => t.function.name);
-    await this.deps.events?.emit({
+    await this.events?.emit({
       type: AgentEventTypes.MessageStarted,
       conversationId: convo,
       messageId: msgId,
@@ -315,17 +690,166 @@ var AgentOrchestrator = class {
     let toolApprovalDenied = false;
     let denialMessage = "";
     let finalResponseSaved = false;
-    try {
-      if (opts.stream && typeof this.deps.llm.streamCompletion === "function") {
+    if (opts.stream && typeof _llm.streamCompletion === "function") {
+      let isFirstChunk = true;
+      result = await _llm.streamCompletion(
+        params,
+        {
+          onChunk: async (delta, usage) => {
+            streamedAssistantContent += delta;
+            const cleanDelta = isFirstChunk ? delta.replace(/^\n+/, "") : delta;
+            isFirstChunk = false;
+            const chunkEvent = {
+              type: AgentEventTypes.AssistantChunk,
+              conversationId: convo,
+              messageId: msgId,
+              delta: cleanDelta,
+              ...usage && { usage }
+            };
+            await this.events?.emit(chunkEvent);
+          },
+          onStreamFinish: async (finishReason, usage) => {
+            if (usage) {
+              const cost = this.cost.estimate(this.cfg.model, usage);
+              this.metrics?.recordLLMCall?.(usage, cost);
+            }
+            const finishEvent = {
+              type: AgentEventTypes.StreamFinish,
+              conversationId: convo,
+              messageId: msgId,
+              ...finishReason && { finishReason },
+              ...usage && { usage }
+            };
+            await this.events?.emit(finishEvent);
+          }
+        },
+        opts.signal
+      );
+    } else {
+      result = await _llm.generateCompletion(params, opts.signal);
+      if (result.usage) {
+        const cost = this.cost.estimate(this.cfg.model, result.usage);
+        this.metrics?.recordLLMCall?.(result.usage, cost);
+      }
+    }
+    if (!result.tool_calls?.length && result.content && !finalResponseSaved) {
+      const content2 = opts.stream ? streamedAssistantContent : result.content;
+      const assistantMsg = {
+        id: msgId,
+        role: "assistant",
+        content: content2,
+        timestamp: this.clock.iso(),
+        usage: result.usage
+      };
+      await this.memory.append(convo, [assistantMsg]);
+      finalResponseSaved = true;
+      if (content2.trim()) {
+        const messageEvent = {
+          type: AgentEventTypes.AssistantMessage,
+          conversationId: convo,
+          messageId: msgId,
+          content: content2,
+          ...result.usage && { usage: result.usage }
+        };
+        await this.events?.emit(messageEvent);
+      }
+    }
+    while (result.tool_calls?.length) {
+      if (result.content?.trim()) {
+        const messageEvent = {
+          type: AgentEventTypes.AssistantMessage,
+          conversationId: convo,
+          messageId: msgId,
+          content: result.content,
+          ...result.usage && { usage: result.usage }
+        };
+        await this.events?.emit(messageEvent);
+      }
+      if (opts.signal?.aborted) throw new Error("Aborted");
+      await this.events?.emit({
+        type: AgentEventTypes.ToolCalls,
+        conversationId: convo,
+        messageId: msgId,
+        toolCalls: result.tool_calls,
+        usage: result.usage
+      });
+      const approvalResult = await this.processToolApproval(
+        result.tool_calls,
+        convo,
+        msgId,
+        accumulatedMessages,
+        turnHistory,
+        result.content,
+        result.usage
+      );
+      if (approvalResult.wasDenied) {
+        denialMessage = approvalResult.denialMessage || "";
+        toolApprovalDenied = true;
+        break;
+      }
+      const approvedCalls = approvalResult.approvedCalls;
+      const invocations = this.toInvocations(approvedCalls);
+      if (opts.signal?.aborted) throw new Error("Aborted");
+      const toolResults = await this.tools.executeToolCalls(
+        invocations,
+        {
+          conversationId: convo,
+          agentId: this.cfg.id,
+          messageId: msgId,
+          eventPort: this.events
+        },
+        this.cfg.maxToolConcurrency ?? 3,
+        opts.signal
+      );
+      allToolResults.push(...toolResults);
+      const assistantMsg = {
+        id: this.ids.uuid(),
+        role: "assistant",
+        content: result.content ?? null,
+        timestamp: this.clock.iso(),
+        tool_calls: approvedCalls,
+        usage: result.usage
+      };
+      const toolResultMsgs = [];
+      for (const tr of toolResults) {
+        const contentStr = tr.status === "error" ? String(tr.result) : typeof tr.result === "string" ? tr.result : JSON.stringify(tr.result);
+        toolResultMsgs.push({
+          id: tr.id,
+          role: "tool",
+          content: contentStr,
+          timestamp: this.clock.iso(),
+          tool_call_id: tr.id,
+          name: tr.name
+        });
+        this.metrics?.recordToolCall?.();
+        await this.events?.emit({
+          type: AgentEventTypes.ToolResult,
+          conversationId: convo,
+          messageId: msgId,
+          result: tr
+        });
+      }
+      await this.memory.append(convo, [assistantMsg, ...toolResultMsgs]);
+      const { usage: _usage, ...extraField } = result;
+      accumulatedMessages.push({
+        ...extraField,
+        role: "assistant",
+        content: result.content ?? null,
+        tool_calls: approvedCalls
+      });
+      for (const tr of toolResults) {
+        const contentStr = tr.status === "error" ? String(tr.result) : typeof tr.result === "string" ? tr.result : JSON.stringify(tr.result);
+        accumulatedMessages.push({ role: "tool", content: contentStr, tool_call_id: tr.id, name: tr.name });
+      }
+      if (opts.signal?.aborted) throw new Error("Aborted");
+      streamedAssistantContent = "";
+      if (opts.stream && typeof _llm.streamCompletion === "function") {
         let isFirstChunk = true;
-        result = await this.deps.llm.streamCompletion(
-          params,
+        result = await _llm.streamCompletion(
+          { ...params, messages: accumulatedMessages },
           {
             onChunk: async (delta, usage) => {
-              try {
-                streamedAssistantContent += delta;
-              } catch {
-              }
+              streamedAssistantContent += delta;
               const cleanDelta = isFirstChunk ? delta.replace(/^\n+/, "") : delta;
               isFirstChunk = false;
               const chunkEvent = {
@@ -335,9 +859,13 @@ var AgentOrchestrator = class {
                 delta: cleanDelta,
                 ...usage && { usage }
               };
-              await this.deps.events?.emit(chunkEvent);
+              await this.events?.emit(chunkEvent);
             },
             onStreamFinish: async (finishReason, usage) => {
+              if (usage) {
+                const cost = this.cost.estimate(this.cfg.model, usage);
+                this.metrics?.recordLLMCall?.(usage, cost);
+              }
               const finishEvent = {
                 type: AgentEventTypes.StreamFinish,
                 conversationId: convo,
@@ -345,24 +873,28 @@ var AgentOrchestrator = class {
                 ...finishReason && { finishReason },
                 ...usage && { usage }
               };
-              await this.deps.events?.emit(finishEvent);
+              await this.events?.emit(finishEvent);
             }
           },
           opts.signal
         );
       } else {
-        result = await this.deps.llm.generateCompletion(params, opts.signal);
+        result = await _llm.generateCompletion({ ...params, messages: accumulatedMessages }, opts.signal);
+        if (result.usage) {
+          const cost = this.cost.estimate(this.cfg.model, result.usage);
+          this.metrics?.recordLLMCall?.(result.usage, cost);
+        }
       }
       if (!result.tool_calls?.length && result.content && !finalResponseSaved) {
         const content2 = opts.stream ? streamedAssistantContent : result.content;
-        const assistantMsg = {
+        const assistantMsg2 = {
           id: msgId,
           role: "assistant",
           content: content2,
-          timestamp: this.deps.clock.iso(),
+          timestamp: this.clock.iso(),
           usage: result.usage
         };
-        await this.deps.memory.append(convo, [assistantMsg]);
+        await this.memory.append(convo, [assistantMsg2]);
         finalResponseSaved = true;
         if (content2.trim()) {
           const messageEvent = {
@@ -372,199 +904,56 @@ var AgentOrchestrator = class {
             content: content2,
             ...result.usage && { usage: result.usage }
           };
-          await this.deps.events?.emit(messageEvent);
-        }
-      }
-      while (result.tool_calls?.length) {
-        if (result.content?.trim()) {
-          const messageEvent = {
-            type: AgentEventTypes.AssistantMessage,
-            conversationId: convo,
-            messageId: msgId,
-            content: result.content,
-            ...result.usage && { usage: result.usage }
-          };
-          await this.deps.events?.emit(messageEvent);
-        }
-        if (opts.signal?.aborted) throw new Error("Aborted");
-        await this.deps.events?.emit({
-          type: AgentEventTypes.ToolCalls,
-          conversationId: convo,
-          messageId: msgId,
-          toolCalls: result.tool_calls,
-          usage: result.usage
-        });
-        const approvalResult = await this.processToolApproval(
-          result.tool_calls,
-          convo,
-          msgId,
-          accumulatedMessages,
-          turnHistory,
-          result.content,
-          result.usage
-        );
-        if (approvalResult.wasDenied) {
-          denialMessage = approvalResult.denialMessage || "";
-          toolApprovalDenied = true;
-          break;
-        }
-        const approvedCalls = approvalResult.approvedCalls;
-        const invocations = this.toInvocations(approvedCalls);
-        if (opts.signal?.aborted) throw new Error("Aborted");
-        const toolResults = await this.deps.tools.executeToolCalls(
-          invocations,
-          {
-            conversationId: convo,
-            agentId: this.cfg.id,
-            messageId: msgId,
-            eventPort: this.deps.events
-          },
-          this.cfg.maxToolConcurrency ?? 3,
-          opts.signal
-        );
-        allToolResults.push(...toolResults);
-        const assistantMsg = {
-          id: this.deps.ids.uuid(),
-          role: "assistant",
-          content: result.content ?? null,
-          timestamp: this.deps.clock.iso(),
-          tool_calls: approvedCalls,
-          usage: result.usage
-        };
-        const toolResultMsgs = [];
-        for (const tr of toolResults) {
-          const contentStr = tr.status === "error" ? String(tr.result) : typeof tr.result === "string" ? tr.result : JSON.stringify(tr.result);
-          toolResultMsgs.push({
-            id: tr.id,
-            role: "tool",
-            content: contentStr,
-            timestamp: this.deps.clock.iso(),
-            tool_call_id: tr.id,
-            name: tr.name
-          });
-          await this.deps.events?.emit({
-            type: AgentEventTypes.ToolResult,
-            conversationId: convo,
-            messageId: msgId,
-            result: tr
-          });
-        }
-        await this.deps.memory.append(convo, [assistantMsg, ...toolResultMsgs]);
-        accumulatedMessages.push({ role: "assistant", content: result.content ?? null, tool_calls: approvedCalls });
-        for (const tr of toolResults) {
-          const contentStr = tr.status === "error" ? String(tr.result) : typeof tr.result === "string" ? tr.result : JSON.stringify(tr.result);
-          accumulatedMessages.push({ role: "tool", content: contentStr, tool_call_id: tr.id, name: tr.name });
-        }
-        if (opts.signal?.aborted) throw new Error("Aborted");
-        streamedAssistantContent = "";
-        if (opts.stream && typeof this.deps.llm.streamCompletion === "function") {
-          let isFirstChunk = true;
-          result = await this.deps.llm.streamCompletion(
-            { ...params, messages: accumulatedMessages },
-            {
-              onChunk: async (delta, usage) => {
-                try {
-                  streamedAssistantContent += delta;
-                } catch {
-                }
-                const cleanDelta = isFirstChunk ? delta.replace(/^\n+/, "") : delta;
-                isFirstChunk = false;
-                const chunkEvent = {
-                  type: AgentEventTypes.AssistantChunk,
-                  conversationId: convo,
-                  messageId: msgId,
-                  delta: cleanDelta,
-                  ...usage && { usage }
-                };
-                await this.deps.events?.emit(chunkEvent);
-              },
-              onStreamFinish: async (finishReason, usage) => {
-                const finishEvent = {
-                  type: AgentEventTypes.StreamFinish,
-                  conversationId: convo,
-                  messageId: msgId,
-                  ...finishReason && { finishReason },
-                  ...usage && { usage }
-                };
-                await this.deps.events?.emit(finishEvent);
-              }
-            },
-            opts.signal
-          );
-        } else {
-          result = await this.deps.llm.generateCompletion({ ...params, messages: accumulatedMessages }, opts.signal);
-        }
-        if (!result.tool_calls?.length && result.content && !finalResponseSaved) {
-          const content2 = opts.stream ? streamedAssistantContent : result.content;
-          const assistantMsg2 = {
-            id: msgId,
-            role: "assistant",
-            content: content2,
-            timestamp: this.deps.clock.iso(),
-            usage: result.usage
-          };
-          await this.deps.memory.append(convo, [assistantMsg2]);
-          finalResponseSaved = true;
-          if (content2.trim()) {
-            const messageEvent = {
-              type: AgentEventTypes.AssistantMessage,
-              conversationId: convo,
-              messageId: msgId,
-              content: content2,
-              ...result.usage && { usage: result.usage }
-            };
-            await this.deps.events?.emit(messageEvent);
-          }
+          await this.events?.emit(messageEvent);
         }
       }
-      const t1 = this.deps.clock.now();
-      const timestamp = this.deps.clock.iso();
-      const shouldEmitFinalMessage = result.content?.trim() && !toolApprovalDenied && !finalResponseSaved;
-      if (shouldEmitFinalMessage) {
-        const messageEvent = {
-          type: AgentEventTypes.AssistantMessage,
-          conversationId: convo,
-          messageId: msgId,
-          content: result.content,
-          ...result.usage && { usage: result.usage }
-        };
-        await this.deps.events?.emit(messageEvent);
-      }
-      const responseContent = toolApprovalDenied ? denialMessage : result.content;
-      const resp = {
-        id: msgId,
-        content: responseContent,
-        role: MessageRoles.Assistant,
-        timestamp,
-        metadata: {
-          model: this.cfg.model,
-          provider: "echo",
-          agentId: this.cfg.id,
-          responseTime: t1 - t0,
-          promptTokens: result.usage?.prompt_tokens,
-          completionTokens: result.usage?.completion_tokens,
-          totalTokens: result.usage?.total_tokens,
-          estimatedCost: this.deps.cost.estimate(this.cfg.model, result.usage),
-          toolCalls: allToolResults.length
-        }
-      };
-      await this.deps.events?.emit({
-        type: AgentEventTypes.Done,
+    }
+    const t1 = this.clock.now();
+    const timestamp = this.clock.iso();
+    this.metrics?.recordRequestComplete?.(t1 - t0);
+    const shouldEmitFinalMessage = result.content?.trim() && !toolApprovalDenied && !finalResponseSaved;
+    if (shouldEmitFinalMessage) {
+      const messageEvent = {
+        type: AgentEventTypes.AssistantMessage,
         conversationId: convo,
         messageId: msgId,
-        responseTimeMs: t1 - t0,
-        usage: result.usage
-      });
-      return resp;
-    } catch (err2) {
-      throw err2;
-    }
+        content: result.content,
+        ...result.usage && { usage: result.usage }
+      };
+      await this.events?.emit(messageEvent);
+    }
+    const responseContent = toolApprovalDenied ? denialMessage : result.content;
+    const resp = {
+      id: msgId,
+      content: responseContent,
+      role: MessageRoles.Assistant,
+      timestamp,
+      metadata: {
+        model: this.cfg.model,
+        provider: "echo",
+        agentId: this.cfg.id,
+        responseTime: t1 - t0,
+        promptTokens: result.usage?.prompt_tokens,
+        completionTokens: result.usage?.completion_tokens,
+        totalTokens: result.usage?.total_tokens,
+        estimatedCost: this.cost.estimate(this.cfg.model, result.usage),
+        toolCalls: allToolResults.length
+      }
+    };
+    await this.events?.emit({
+      type: AgentEventTypes.Done,
+      conversationId: convo,
+      messageId: msgId,
+      responseTimeMs: t1 - t0,
+      usage: result.usage
+    });
+    return resp;
   }
   async waitForToolApproval(toolCalls, conversationId, messageId) {
-    const approvalId = this.deps.ids.uuid();
+    const approvalId = this.ids.uuid();
     return new Promise((resolve6, reject) => {
       this.pendingApprovals.set(approvalId, { resolve: resolve6, reject });
-      this.deps.events?.emit({
+      this.events?.emit({
         type: AgentEventTypes.ToolApprovalRequired,
         conversationId,
         messageId,
@@ -593,71 +982,11 @@ var AgentOrchestrator = class {
       let parameters = {};
       try {
         parameters = JSON.parse(tc.function.arguments || "{}");
-      } catch {
-        parameters = {};
-      }
-      return { id: tc.id, name: tc.function.name, parameters };
-    });
-  }
-};
-// context.ts
-var toProviderContent = (content) => {
-  if (content === null || content === void 0) {
-    return "";
-  }
-  if (typeof content === "string") {
-    return content;
-  }
-  if (content.type === "parts") {
-    const providerParts = [];
-    for (const part of content.parts) {
-      if (part.type === "text") {
-        if (part.text.length > 0) {
-          providerParts.push({ type: "text", text: part.text });
-        }
-        continue;
-      }
-      const label = part.altText ?? (part.name ? `Image attachment: ${part.name}` : void 0);
-      if (label) {
-        providerParts.push({ type: "text", text: label });
-      }
-      const url = `data:${part.mimeType};base64,${part.data}`;
-      providerParts.push({ type: "image_url", image_url: { url } });
-    }
-    return providerParts.length > 0 ? providerParts : [];
-  }
-  return [];
-};
-var SimpleContextBuilder = class {
-  toProviderMessages(history, systemPrompt, newUserContent) {
-    const transformed = [];
-    for (const m of history) {
-      const providerContent = toProviderContent(m.content);
-      if (m.role === "user") {
-        transformed.push({ role: "user", content: providerContent ?? "" });
-      } else if (m.role === "assistant") {
-        if (m.tool_calls && m.tool_calls.length > 0) {
-          transformed.push({ role: "assistant", content: providerContent ?? null, tool_calls: m.tool_calls });
-        } else {
-          transformed.push({ role: "assistant", content: providerContent ?? "" });
-        }
-      } else if (m.role === "tool") {
-        if (m.tool_call_id) {
-          transformed.push({
-            role: "tool",
-            content: typeof providerContent === "string" ? providerContent : providerContent ?? "",
-            tool_call_id: m.tool_call_id,
-            name: m.name
-          });
-        }
+      } catch {
+        parameters = {};
       }
-    }
-    const userMsgs = newUserContent.map((c) => ({
-      role: "user",
-      content: toProviderContent(c) ?? ""
-    }));
-    return [{ role: "system", content: systemPrompt }, ...transformed, ...userMsgs];
+      return { id: tc.id, name: tc.function.name, parameters };
+    });
   }
 };
@@ -922,7 +1251,12 @@ async function buildTree(dir, rootDir, gitignore, options, depth, fileCount) {
   if (depth >= options.maxDepth || fileCount.count >= options.maxFiles) {
     return [];
   }
-  const entries = await fs2.readdir(dir, { withFileTypes: true });
+  let entries;
+  try {
+    entries = await fs2.readdir(dir, { withFileTypes: true });
+  } catch {
+    return [];
+  }
   const lines = [];
   const sortedEntries = entries.sort((a, b) => {
     if (a.isDirectory() && !b.isDirectory()) return -1;
@@ -966,123 +1300,6 @@ async function generateFolderTree(rootDir, options = {}) {
   return [header, ...lines].join("\n");
 }
-// persistent/memory.ts
-var InMemoryMemory = class {
-  store = /* @__PURE__ */ new Map();
-  async get(key) {
-    return this.store.get(key) ?? [];
-  }
-  async set(key, items) {
-    this.store.set(key, [...items]);
-  }
-  async append(key, items) {
-    const existing = this.store.get(key) ?? [];
-    this.store.set(key, [...existing, ...items]);
-  }
-  async delete(key) {
-    this.store.delete(key);
-  }
-  async keys() {
-    return Array.from(this.store.keys());
-  }
-  async clear() {
-    this.store.clear();
-  }
-  async exportSnapshot() {
-    const snap = {};
-    for (const [k, v] of this.store.entries()) snap[k] = [...v];
-    return snap;
-  }
-  async importSnapshot(snapshot) {
-    this.store.clear();
-    for (const [k, v] of Object.entries(snapshot)) this.store.set(k, [...v]);
-  }
-};
-var JsonFileMemoryPersistence = class {
-  constructor(filename = "history.json") {
-    this.filename = filename;
-  }
-  async load() {
-    try {
-      const fs10 = await import("fs");
-      if (!fs10.existsSync(this.filename)) return {};
-      const text = fs10.readFileSync(this.filename, "utf-8");
-      const data = JSON.parse(text);
-      return typeof data === "object" && data ? data : {};
-    } catch {
-      console.warn(`Failed to load memory from ${this.filename}`);
-      return {};
-    }
-  }
-  async save(snapshot) {
-    try {
-      const fs10 = await import("fs");
-      const path9 = await import("path");
-      const dir = path9.dirname(this.filename);
-      if (dir && dir !== "." && !fs10.existsSync(dir)) {
-        fs10.mkdirSync(dir, { recursive: true });
-      }
-      fs10.writeFileSync(this.filename, JSON.stringify(snapshot, null, 2), "utf-8");
-    } catch (err2) {
-      console.warn(`Failed to save memory to ${this.filename}`, err2);
-    }
-  }
-};
-var PersistedMemory = class {
-  constructor(persistence) {
-    this.persistence = persistence;
-  }
-  inner = new InMemoryMemory();
-  initialized = false;
-  async ensureInitialized() {
-    if (this.initialized) return;
-    const snap = await this.persistence.load();
-    if (snap && typeof snap === "object") await this.inner.importSnapshot(snap);
-    this.initialized = true;
-  }
-  async save() {
-    const snap = await this.inner.exportSnapshot();
-    await this.persistence.save(snap);
-  }
-  async get(key) {
-    await this.ensureInitialized();
-    return this.inner.get(key);
-  }
-  async set(key, items) {
-    await this.ensureInitialized();
-    await this.inner.set(key, items);
-    await this.save();
-  }
-  async append(key, items) {
-    await this.ensureInitialized();
-    await this.inner.append(key, items);
-    await this.save();
-  }
-  async delete(key) {
-    await this.ensureInitialized();
-    await this.inner.delete(key);
-    await this.save();
-  }
-  async keys() {
-    await this.ensureInitialized();
-    return this.inner.keys();
-  }
-  async clear() {
-    await this.ensureInitialized();
-    await this.inner.clear();
-    await this.save();
-  }
-  async exportSnapshot() {
-    await this.ensureInitialized();
-    return this.inner.exportSnapshot();
-  }
-  async importSnapshot(snapshot) {
-    await this.ensureInitialized();
-    await this.inner.importSnapshot(snapshot);
-    await this.save();
-  }
-};
 // persistent/metadata-memory.ts
 var MemoryPortMetadataAdapter = class {
   constructor(memory, prefix = "__metadata__") {
@@ -1217,6 +1434,27 @@ var ConversationStore = class {
     };
     await this.metadataMemory.set(conversationId, updatedMetadata);
   }
+  async recordRequestMetrics(conversationId, metrics) {
+    const metadata = await this.metadataMemory.get(conversationId);
+    const updatedMetadata = {
+      ...metadata,
+      promptTokens: (metadata?.promptTokens ?? 0) + (metrics.promptTokens ?? 0),
+      completionTokens: (metadata?.completionTokens ?? 0) + (metrics.completionTokens ?? 0),
+      totalTokens: (metadata?.totalTokens ?? 0) + (metrics.totalTokens ?? 0),
+      requestCount: (metadata?.requestCount ?? 0) + 1,
+      toolCallCount: (metadata?.toolCallCount ?? 0) + (metrics.toolCalls ?? 0),
+      totalTimeMs: (metadata?.totalTimeMs ?? 0) + (metrics.responseTimeMs ?? 0),
+      totalPrice: (metadata?.totalPrice ?? 0) + (metrics.cost ?? 0),
+      contextWindow: {
+        promptTokens: metrics.promptTokens,
+        completionTokens: metrics.completionTokens,
+        totalTokens: metrics.totalTokens
+      },
+      updatedAt: (/* @__PURE__ */ new Date()).toISOString()
+    };
+    await this.metadataMemory.set(conversationId, updatedMetadata);
+    return updatedMetadata;
+  }
   async updateTopic(conversationId, topic) {
     const metadata = await this.metadataMemory.get(conversationId);
     const updatedMetadata = {
@@ -1279,41 +1517,6 @@ var ConversationContext = class {
   }
 };
-// id.ts
-var SimpleId = class {
-  uuid() {
-    return "xxxxxxxx-xxxx-4xxx-yxxx-xxxxxxxxxxxx".replace(/[xy]/g, (c) => {
-      const r = Math.random() * 16 | 0;
-      const v = c === "x" ? r : r & 3 | 8;
-      return v.toString(16);
-    });
-  }
-};
-// clock.ts
-var SystemClock = class {
-  now() {
-    return Date.now();
-  }
-  iso(dateMs) {
-    return new Date(dateMs ?? Date.now()).toISOString();
-  }
-};
-// cost.ts
-var SimpleCost = class {
-  estimate(_model, usage) {
-    return usage?.cost;
-  }
-};
-// reminders.ts
-var NoopReminders = class {
-  enhance(content, _opts) {
-    return [content];
-  }
-};
 // todo-store.ts
 var TodoStore = class {
   constructor(memory) {
@@ -3612,9 +3815,12 @@ var AgentFilePersistence = class {
    * Load all agents from the agents directory
    */
   async loadAll() {
-    this.ensureAgentsDir();
     const agents = [];
     try {
+      this.ensureAgentsDir();
+      if (!fs8.existsSync(this.agentsDir)) {
+        return agents;
+      }
       const files = fs8.readdirSync(this.agentsDir);
       const yamlFiles = files.filter((f) => f.endsWith(".yaml") || f.endsWith(".yml"));
       for (const file of yamlFiles) {
@@ -3627,8 +3833,7 @@ var AgentFilePersistence = class {
           console.warn(`Failed to load agent from ${file}:`, error);
         }
       }
-    } catch (error) {
-      console.warn("Failed to read agents directory:", error);
+    } catch (_error) {
     }
     return agents;
   }
@@ -3717,6 +3922,7 @@ var AgentFilePersistence = class {
 function mergeChoices(choices) {
   const contentParts = [];
   const mergedToolCalls = [];
+  const extraFields = {};
   const collectText = (value) => {
     if (typeof value === "string") {
       const trimmed = value.trim();
@@ -3737,10 +3943,20 @@ function mergeChoices(choices) {
     if (!msg) continue;
     collectText(msg.content);
     if (Array.isArray(msg.tool_calls)) mergedToolCalls.push(...msg.tool_calls);
+    const knownKeys = ["content", "tool_calls", "role"];
+    for (const key of Object.keys(msg)) {
+      if (!knownKeys.includes(key)) {
+        extraFields[key] = msg[key];
+      }
+    }
   }
   const content = contentParts.join("\n\n");
   const tool_calls = mergedToolCalls.length ? mergedToolCalls : void 0;
-  return { content, ...tool_calls ? { tool_calls } : {} };
+  return {
+    content,
+    ...tool_calls ? { tool_calls } : {},
+    ...extraFields
+  };
 }
 function normalizeUsage(usage) {
   if (!usage) return void 0;
@@ -3748,6 +3964,7 @@ function normalizeUsage(usage) {
   const prompt_tokens = usage.prompt_tokens ?? (typeof usageObj.input_tokens === "number" ? usageObj.input_tokens : void 0);
   const completion_tokens = usage.completion_tokens ?? (typeof usageObj.output_tokens === "number" ? usageObj.output_tokens : void 0);
   const total_tokens = usage.total_tokens ?? (prompt_tokens != null && completion_tokens != null ? prompt_tokens + completion_tokens : void 0);
+  const cost = usage.cost ?? (typeof usageObj.estimated_cost === "number" ? usageObj.estimated_cost : void 0);
   return {
     prompt_tokens,
     completion_tokens,
@@ -3755,7 +3972,7 @@ function normalizeUsage(usage) {
     ...usage.reasoning_tokens !== void 0 && { reasoning_tokens: usage.reasoning_tokens },
     ...usage.prompt_tokens_details && { prompt_tokens_details: usage.prompt_tokens_details },
     ...usage.completion_tokens_details && { completion_tokens_details: usage.completion_tokens_details },
-    ...usage.cost !== void 0 && { cost: usage.cost },
+    ...cost !== void 0 && { cost },
     ...usage.cost_details && { cost_details: usage.cost_details }
   };
 }
@@ -3901,6 +4118,7 @@ var BaseLLM = class {
     const mergedToolCalls = [];
     let usage;
     let lastFinishReason;
+    const extraFields = {};
     const flushEvent = (rawEvent) => {
       const lines = rawEvent.split("\n");
       const dataLines = [];
@@ -3941,6 +4159,16 @@ var BaseLLM = class {
               handlers.onChunk?.(textDelta);
             }
           }
+          const knownKeys = ["role", "content", "tool_calls"];
+          for (const key of Object.keys(delta)) {
+            if (knownKeys.includes(key)) continue;
+            const val = delta[key];
+            if (typeof val === "string") {
+              extraFields[key] = (extraFields[key] || "") + val;
+            } else if (val !== void 0 && val !== null) {
+              extraFields[key] = val;
+            }
+          }
           const toolDeltas = Array.isArray(delta.tool_calls) ? delta.tool_calls : [];
           for (const td of toolDeltas) {
             let toolCall;
@@ -3948,6 +4176,7 @@ var BaseLLM = class {
               toolCall = mergedToolCalls.find((tc) => tc.id === td.id);
               if (!toolCall) {
                 toolCall = {
+                  ...td,
                   id: td.id,
                   type: "function",
                   function: { name: td.function?.name ?? "", arguments: "" }
@@ -3994,7 +4223,12 @@ var BaseLLM = class {
     if (buffer.trim()) flushEvent(buffer);
     content = content.replace(/^\n+/, "");
     const tool_calls = mergedToolCalls.length ? mergedToolCalls : void 0;
-    return { content, ...tool_calls ? { tool_calls } : {}, ...usage ? { usage } : {} };
+    return {
+      content,
+      ...tool_calls ? { tool_calls } : {},
+      ...usage ? { usage } : {},
+      ...extraFields
+    };
   }
 };
@@ -4364,8 +4598,9 @@ var GithubAuthTransport = class {
       method: "GET",
       headers: {
         Authorization: `Bearer ${this.accessToken}`,
-        "user-agent": "GitHubCopilotChat/0.31.3",
-        "editor-version": "vscode/1.104.2",
+        "user-agent": "GitHubCopilotChat/0.33.1",
+        "editor-version": "vscode/1.106.1",
+        "x-github-api-version": "2025-10-01",
         accept: "application/json"
       },
       signal
@@ -4454,11 +4689,12 @@ var GithubAuthTransport = class {
     return res;
   }
   async postStream(url, body, headers, signal) {
-    if (!this.apiKey && this.accessToken) {
+    let hdrs = this.makeAuthHeaders({ Accept: "text/event-stream", ...headers || {} }, body);
+    if ((!this.apiKey || !hdrs.Authorization) && this.accessToken) {
       await this.exchangeToken(signal);
+      hdrs = this.makeAuthHeaders({ Accept: "text/event-stream", ...headers || {} }, body);
     }
     const fullUrl = this.buildFullUrl(url);
-    const hdrs = this.makeAuthHeaders({ Accept: "text/event-stream", ...headers || {} }, body);
     let res = await this.inner.postStream(fullUrl, body, hdrs, signal);
     if (res.status === 401 && this.accessToken) {
       await this.exchangeToken(signal);
@@ -4529,6 +4765,105 @@ function createTransport(inner, defaultBaseUrl, apiKey, baseUrl, version) {
   return new SimpleBearerAuthTransport(inner, defaultBaseUrl, apiKey, baseUrl, version);
 }
+// llm-providers/model-limits.ts
+function normalizeModelLimits(provider, model) {
+  switch (provider.toLowerCase()) {
+    case "github": {
+      const capabilities = model.capabilities;
+      const limits = capabilities?.limits;
+      const contextWindow = limits?.max_context_window_tokens;
+      if (!contextWindow) return null;
+      return {
+        contextWindow,
+        maxOutput: limits?.max_output_tokens
+      };
+    }
+    case "deepinfra": {
+      const metadata = model.metadata;
+      const contextLength = metadata?.context_length;
+      if (!contextLength) return null;
+      return {
+        contextWindow: contextLength,
+        maxOutput: metadata?.max_tokens
+      };
+    }
+    case "moonshot": {
+      const contextLength = model.context_length;
+      if (!contextLength) return null;
+      return { contextWindow: contextLength };
+    }
+    case "openrouter": {
+      const topProvider = model.top_provider;
+      const contextLength = model.context_length ?? topProvider?.context_length;
+      if (!contextLength) return null;
+      return {
+        contextWindow: contextLength,
+        maxOutput: topProvider?.max_completion_tokens
+      };
+    }
+    default: {
+      const contextLength = model.context_length;
+      if (!contextLength) return null;
+      return { contextWindow: contextLength };
+    }
+  }
+}
+var FALLBACK_LIMITS = {
+  zai: {
+    "glm-4.6": { contextWindow: 2e5, maxOutput: 128e3 }
+  },
+  openrouter: {
+    "anthropic/claude-sonnet-4": { contextWindow: 2e5, maxOutput: 16e3 },
+    "anthropic/claude-3.5-sonnet": { contextWindow: 2e5, maxOutput: 8192 },
+    "openai/gpt-4o": { contextWindow: 128e3, maxOutput: 16384 },
+    "openai/gpt-4.1": { contextWindow: 128e3, maxOutput: 32768 },
+    "openai/gpt-4o-mini": { contextWindow: 128e3, maxOutput: 16384 },
+    "google/gemini-pro-1.5": { contextWindow: 2097152, maxOutput: 8192 },
+    "meta-llama/llama-3.1-70b-instruct": { contextWindow: 131072, maxOutput: 131072 }
+  },
+  github: {
+    "gpt-4.1": { contextWindow: 128e3, maxOutput: 16384 },
+    "gpt-4o": { contextWindow: 128e3, maxOutput: 16384 },
+    "gpt-4o-mini": { contextWindow: 128e3, maxOutput: 16384 },
+    "claude-sonnet-4": { contextWindow: 2e5, maxOutput: 16e3 },
+    "claude-3.5-sonnet": { contextWindow: 2e5, maxOutput: 8192 },
+    o1: { contextWindow: 2e5, maxOutput: 1e5 },
+    "o1-mini": { contextWindow: 128e3, maxOutput: 65536 }
+  },
+  deepinfra: {
+    "meta-llama/Meta-Llama-3.1-70B-Instruct": { contextWindow: 131072, maxOutput: 131072 },
+    "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo": { contextWindow: 131072, maxOutput: 131072 },
+    "Qwen/Qwen2.5-72B-Instruct": { contextWindow: 131072, maxOutput: 131072 }
+  },
+  moonshot: {
+    "moonshot-v1-8k": { contextWindow: 8192 },
+    "moonshot-v1-32k": { contextWindow: 32768 },
+    "moonshot-v1-128k": { contextWindow: 131072 },
+    "kimi-k2-turbo-preview": { contextWindow: 262144 }
+  },
+  anthropic: {
+    "claude-sonnet-4-5": { contextWindow: 2e5, maxOutput: 16e3 },
+    "claude-3-5-sonnet-20241022": { contextWindow: 2e5, maxOutput: 8192 },
+    "claude-3-opus-20240229": { contextWindow: 2e5, maxOutput: 4096 },
+    "claude-3-haiku-20240307": { contextWindow: 2e5, maxOutput: 4096 }
+  }
+};
+function getFallbackLimits(provider, model) {
+  const providerLimits = FALLBACK_LIMITS[provider.toLowerCase()];
+  if (!providerLimits) return null;
+  return providerLimits[model] ?? null;
+}
+function normalizeModelInfo(provider, model) {
+  const id = model.id;
+  const name = model.name ?? id;
+  const limits = normalizeModelLimits(provider, model);
+  return {
+    id,
+    name,
+    ...limits ? { limits } : {}
+  };
+}
 // llm-providers/llm-github.ts
 var GithubLLM = class extends BaseLLM {
   opts;
@@ -4552,6 +4887,49 @@ var GithubLLM = class extends BaseLLM {
       accessToken: this.opts.accessToken
     });
   }
+  async getModels(signal) {
+    const res = await this.getTransport().get("/models", void 0, signal);
+    if (!res.ok) {
+      const text = await res.text();
+      throw new LLMError(text || `Failed to fetch models: ${res.status}`, res.status);
+    }
+    const body = await res.json();
+    return body.data.map((m) => normalizeModelInfo("github", m));
+  }
+  handleError(error, model) {
+    if (error instanceof LLMError) {
+      try {
+        const errorBody = JSON.parse(error.message);
+        if (errorBody?.error?.code === "unsupported_api_for_model") {
+          throw new LLMError(
+            `The model '${model}' is not supported for chat completions. Please select a different model using '/model'.`,
+            error.statusCode,
+            false
+            // Not retryable
+          );
+        }
+      } catch (e) {
+        if (e instanceof LLMError && e.message.includes("not supported")) {
+          throw e;
+        }
+      }
+    }
+    throw error;
+  }
+  async generateCompletion(params, signal) {
+    try {
+      return await super.generateCompletion(params, signal);
+    } catch (error) {
+      this.handleError(error, params.model);
+    }
+  }
+  async streamCompletion(params, handlers, signal) {
+    try {
+      return await super.streamCompletion(params, handlers, signal);
+    } catch (error) {
+      this.handleError(error, params.model);
+    }
+  }
 };
 // llm-providers/llm-anthropic-aisdk.ts
@@ -5049,11 +5427,13 @@ var GenericLLM = class extends BaseLLM {
   opts;
   includeUsage;
   modelConfig;
+  providerName;
   constructor(baseUrl, modelConfig, opts = {}) {
-    const { enablePromptCaching = false, includeUsage = false, ...restOpts } = opts;
+    const { enablePromptCaching = false, includeUsage = false, providerName = "unknown", ...restOpts } = opts;
     super(opts.apiUrl || baseUrl, { enablePromptCaching });
     this.includeUsage = includeUsage;
     this.modelConfig = modelConfig;
+    this.providerName = providerName;
     this.opts = restOpts;
   }
   createTransport() {
@@ -5071,7 +5451,10 @@ var GenericLLM = class extends BaseLLM {
       throw new Error("Provider does not support getModels");
     }
     if (Array.isArray(this.modelConfig)) {
-      return this.modelConfig.map((m) => typeof m === "string" ? { id: m } : m);
+      return this.modelConfig.map((m) => {
+        const raw = typeof m === "string" ? { id: m } : m;
+        return normalizeModelInfo(this.providerName, raw);
+      });
     }
     if (typeof this.modelConfig === "string") {
       const transport2 = this.createTransport();
@@ -5081,7 +5464,7 @@ var GenericLLM = class extends BaseLLM {
         throw new Error(`Failed to fetch models: ${res2.status} ${text}`);
       }
       const data2 = await res2.json();
-      return data2.data;
+      return data2.data.map((m) => normalizeModelInfo(this.providerName, m));
     }
     const transport = this.createTransport();
     const res = await transport.get("/models", void 0, signal);
@@ -5090,7 +5473,7 @@ var GenericLLM = class extends BaseLLM {
       throw new Error(`Failed to fetch models: ${res.status} ${text}`);
     }
     const data = await res.json();
-    return data.data;
+    return data.data.map((m) => normalizeModelInfo(this.providerName, m));
   }
   async generateCompletion(params, signal) {
     let enhancedParams = params;
@@ -5149,6 +5532,7 @@ function createLLM(providerName, options = {}, customProviders) {
   const modelConfig = normalizeModelConfig(config);
   return new GenericLLM(config.baseUrl, modelConfig, {
     ...options,
+    providerName: config.name,
     enablePromptCaching: options.enablePromptCaching ?? config.features.promptCaching,
     includeUsage: options.includeUsage ?? config.features.includeUsage
   });
@@ -5434,31 +5818,6 @@ function isValidConfig(value) {
   }
   return true;
 }
-// events.ts
-var PersistingConsoleEventPort = class {
-  memory;
-  maxPerConversation;
-  writeQueue = Promise.resolve();
-  constructor(opts) {
-    this.memory = opts?.memory ?? new PersistedMemory(new JsonFileMemoryPersistence(opts?.filename || "events.json"));
-    this.maxPerConversation = opts?.maxPerConversation ?? 500;
-  }
-  async emit(event) {
-    this.writeQueue = this.writeQueue.then(async () => {
-      try {
-        const key = event?.conversationId ?? "default";
-        const existing = await this.memory.get(key);
-        const next = [...existing, { ...event }];
-        const max = this.maxPerConversation;
-        const trimmed = max > 0 && next.length > max ? next.slice(next.length - max) : next;
-        await this.memory.set(key, trimmed);
-      } catch {
-      }
-    });
-    return this.writeQueue;
-  }
-};
 export {
   AGENT_CREATOR_SYSTEM_PROMPT,
   AgentEventTypes,
@@ -5482,11 +5841,13 @@ export {
   GithubLLM,
   InMemoryMemory,
   InMemoryMetadata,
+  InMemoryMetricsPort,
   JsonFileMemoryPersistence,
   LLMError,
   LLMResolver,
   MCPToolPort,
   MemoryPortMetadataAdapter,
+  NoopMetricsPort,
   NoopReminders,
   PersistedMemory,
   PersistingConsoleEventPort,
@@ -5499,10 +5860,14 @@ export {
   buildAgentCreationPrompt,
   buildInjectedSystem,
   canonicalizeTerminalPaste,
+  createEmptySnapshot,
   createLLM,
   generateFolderTree,
   getAvailableProviders,
+  getFallbackLimits,
   loadMCPConfig,
+  normalizeModelInfo,
+  normalizeModelLimits,
   normalizeNewlines,
   renderTemplate,
   resolveBackspaces,