npm - @vellumai/assistant - Versions diffs - 0.8.2 → 0.8.3 - Mend

@vellumai/assistant 0.8.2 → 0.8.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (231)

package/ARCHITECTURE.md +11 -12
package/docker-entrypoint.sh +13 -1
package/docker-init-apt-root.sh +79 -6
package/openapi.yaml +336 -21
package/package.json +1 -1
package/src/__tests__/agent-loop-exit-reason.test.ts +272 -0
package/src/__tests__/agent-loop-provider-error-recording.test.ts +195 -0
package/src/__tests__/compactor-tail-resolution.test.ts +107 -1
package/src/__tests__/config-get-vision-flag.test.ts +136 -0
package/src/__tests__/config-loader-backfill.test.ts +115 -18
package/src/__tests__/context-token-estimator.test.ts +30 -65
package/src/__tests__/conversation-agent-loop.test.ts +57 -1
package/src/__tests__/conversation-media-retry.test.ts +19 -8
package/src/__tests__/conversation-runtime-assembly.test.ts +26 -4
package/src/__tests__/date-context.test.ts +45 -0
package/src/__tests__/external-plugin-loader.test.ts +91 -19
package/src/__tests__/guardian-action-no-hardcoded-copy.test.ts +0 -1
package/src/__tests__/guardian-dispatch.test.ts +1 -0
package/src/__tests__/heartbeat-service.test.ts +24 -164
package/src/__tests__/helpers/channel-test-adapter.ts +0 -2
package/src/__tests__/host-app-control-proxy.test.ts +241 -0
package/src/__tests__/host-proxy-preactivation.test.ts +200 -13
package/src/__tests__/injector-background-turn.test.ts +153 -0
package/src/__tests__/injector-chain.test.ts +5 -0
package/src/__tests__/lifecycle-memory-v2-seed.test.ts +9 -2
package/src/__tests__/llm-callsite-catalog.test.ts +25 -0
package/src/__tests__/llm-catalog-parity.test.ts +3 -0
package/src/__tests__/llm-request-log-agent-loop-exit-reason.test.ts +116 -0
package/src/__tests__/llm-request-log-error-payload.test.ts +138 -0
package/src/__tests__/llm-request-log-source-clickhouse.test.ts +2 -0
package/src/__tests__/llm-resolver.test.ts +255 -2
package/src/__tests__/managed-profile-guard.test.ts +10 -0
package/src/__tests__/notification-decision-fallback.test.ts +0 -91
package/src/__tests__/notification-decision-strategy.test.ts +14 -31
package/src/__tests__/notification-deep-link.test.ts +15 -0
package/src/__tests__/notification-guardian-path.test.ts +1 -2
package/src/__tests__/notification-platform-adapter.test.ts +5 -4
package/src/__tests__/notification-telegram-adapter.test.ts +1 -0
package/src/__tests__/notification-vellum-adapter.test.ts +113 -0
package/src/__tests__/openai-provider.test.ts +218 -3
package/src/__tests__/openai-responses-cutover-guard.test.ts +3 -3
package/src/__tests__/openrouter-provider-only.test.ts +51 -3
package/src/__tests__/openrouter-token-estimation.test.ts +34 -25
package/src/__tests__/platform-proxy-context.test.ts +6 -1
package/src/__tests__/plugin-tool-contribution.test.ts +3 -3
package/src/__tests__/plugin-types.test.ts +2 -2
package/src/__tests__/provider-catalog-visibility.test.ts +16 -0
package/src/__tests__/provider-platform-proxy-integration.test.ts +27 -25
package/src/__tests__/secret-routes-platform-proxy.test.ts +1 -1
package/src/__tests__/system-prompt.test.ts +6 -73
package/src/__tests__/workspace-migration-087-memory-router-balanced-profile.test.ts +228 -0
package/src/a2a/__tests__/agent-card.test.ts +98 -0
package/src/a2a/__tests__/e2e-a2a-channel.test.ts +597 -0
package/src/a2a/__tests__/protocol-helpers.test.ts +113 -0
package/src/a2a/__tests__/task-store.test.ts +246 -0
package/src/a2a/agent-card.ts +58 -0
package/src/a2a/feature-gate.ts +8 -0
package/src/a2a/protocol-constants.ts +21 -0
package/src/a2a/protocol-errors.ts +50 -0
package/src/a2a/protocol-types.ts +162 -0
package/src/a2a/task-store.ts +168 -0
package/src/agent/loop.ts +167 -18
package/src/channels/config.ts +9 -0
package/src/channels/types.ts +14 -0
package/src/cli/{__tests__ → commands/__tests__}/notifications.test.ts +201 -28
package/src/cli/commands/__tests__/schedules.test.ts +469 -0
package/src/cli/commands/notifications.ts +65 -35
package/src/cli/commands/plugins.ts +67 -0
package/src/cli/commands/schedules.ts +297 -5
package/src/cli/lib/__tests__/search-plugins.test.ts +261 -0
package/src/cli/lib/install-from-github.ts +8 -9
package/src/cli/lib/search-plugins.ts +163 -0
package/src/cli/program.ts +14 -0
package/src/config/assistant-feature-flags.ts +24 -54
package/src/config/bundled-skills/app-builder/SKILL.md +117 -1
package/src/config/bundled-skills/phone-calls/SKILL.md +1 -1
package/src/config/call-site-defaults.ts +105 -0
package/src/config/feature-flag-registry.json +21 -29
package/src/config/llm-resolver.ts +52 -1
package/src/config/schema.ts +2 -0
package/src/config/schemas/__tests__/memory-v2.test.ts +3 -3
package/src/config/schemas/channels.ts +9 -0
package/src/config/schemas/conversations.ts +10 -0
package/src/config/schemas/heartbeat.ts +14 -0
package/src/config/schemas/llm.ts +1 -3
package/src/config/schemas/memory-retrospective.ts +1 -1
package/src/config/schemas/memory-v2.ts +4 -4
package/src/config/schemas/memory.ts +3 -1
package/src/config/seed-inference-profiles.ts +99 -29
package/src/context/compactor.ts +72 -12
package/src/context/token-estimator.ts +32 -34
package/src/daemon/__tests__/conversation-lifecycle-auto-analyze.test.ts +3 -22
package/src/daemon/conversation-agent-loop-handlers.ts +78 -0
package/src/daemon/conversation-agent-loop.ts +29 -2
package/src/daemon/conversation-runtime-assembly.ts +9 -0
package/src/daemon/conversation.ts +0 -7
package/src/daemon/date-context.ts +40 -0
package/src/daemon/guardian-action-generators.ts +1 -125
package/src/daemon/handlers/__tests__/config-a2a-complete.test.ts +248 -0
package/src/daemon/handlers/__tests__/config-a2a-invite.test.ts +154 -0
package/src/daemon/handlers/__tests__/config-a2a-redeem.test.ts +133 -0
package/src/daemon/handlers/__tests__/config-a2a.test.ts +95 -0
package/src/daemon/handlers/config-a2a.ts +289 -0
package/src/daemon/handlers/conversations.ts +1 -0
package/src/daemon/host-app-control-proxy.ts +69 -18
package/src/daemon/host-proxy-preactivation.ts +85 -18
package/src/daemon/lifecycle.ts +49 -61
package/src/daemon/memory-v2-startup.ts +49 -13
package/src/daemon/message-types/notifications.ts +21 -0
package/src/daemon/pkb-reminder-builder.test.ts +10 -53
package/src/daemon/pkb-reminder-builder.ts +4 -19
package/src/daemon/process-message.ts +3 -0
package/src/daemon/skill-memory-refresh.ts +5 -1
package/src/daemon/wake-target-adapter.ts +2 -0
package/src/export/__tests__/transcript-formatter.test.ts +121 -0
package/src/export/transcript-formatter.ts +54 -20
package/src/heartbeat/__tests__/heartbeat-service.test.ts +44 -0
package/src/heartbeat/heartbeat-service.ts +34 -191
package/src/home/__tests__/feed-types.test.ts +40 -0
package/src/home/feed-types.ts +14 -2
package/src/ipc/cli-client.ts +147 -45
package/src/memory/__tests__/conversation-queries.test.ts +220 -0
package/src/memory/__tests__/memory-retrospective-enqueue.test.ts +2 -50
package/src/memory/__tests__/memory-retrospective-job.test.ts +87 -4
package/src/memory/conversation-queries.ts +87 -1
package/src/memory/conversation-title-service.ts +26 -4
package/src/memory/db-init.ts +6 -0
package/src/memory/graph/__tests__/conversation-graph-memory-v2-routing.test.ts +84 -3
package/src/memory/graph/conversation-graph-memory.ts +18 -6
package/src/memory/graph/tools.ts +6 -37
package/src/memory/invite-store.ts +53 -0
package/src/memory/llm-request-log-source-clickhouse.ts +7 -2
package/src/memory/llm-request-log-store.ts +92 -1
package/src/memory/memory-retrospective-enqueue.ts +1 -20
package/src/memory/memory-retrospective-job.ts +33 -6
package/src/memory/migrations/250-provider-connection-base-url-and-models.ts +28 -0
package/src/memory/migrations/251-a2a-tasks.ts +49 -0
package/src/memory/migrations/252-llm-request-log-agent-loop-exit-reason.ts +32 -0
package/src/memory/migrations/index.ts +3 -0
package/src/memory/migrations/registry.ts +8 -0
package/src/memory/schema/a2a.ts +15 -0
package/src/memory/schema/index.ts +1 -0
package/src/memory/schema/inference.ts +2 -0
package/src/memory/schema/infrastructure.ts +1 -0
package/src/memory/v2/__tests__/activation-store.test.ts +25 -23
package/src/memory/v2/__tests__/cli-command-store.test.ts +404 -0
package/src/memory/v2/__tests__/frontmatter-sweep.test.ts +25 -4
package/src/memory/v2/__tests__/injection.test.ts +190 -3
package/src/memory/v2/__tests__/static-context.test.ts +12 -1
package/src/memory/v2/activation-store.ts +14 -16
package/src/memory/v2/cli-command-content.ts +19 -0
package/src/memory/v2/cli-command-store.ts +304 -0
package/src/memory/v2/frontmatter-sweep.ts +7 -1
package/src/memory/v2/injection.ts +49 -20
package/src/memory/v2/page-index.ts +38 -13
package/src/memory/v2/static-context.ts +4 -4
package/src/memory/v2/types.ts +23 -0
package/src/messaging/providers/a2a/__tests__/deliver.test.ts +274 -0
package/src/messaging/providers/a2a/deliver.ts +156 -0
package/src/messaging/providers/gmail/client.ts +9 -2
package/src/messaging/providers/index.ts +11 -2
package/src/notifications/__tests__/broadcaster.test.ts +203 -0
package/src/notifications/__tests__/decision-engine.test.ts +283 -0
package/src/notifications/__tests__/deterministic-checks.test.ts +286 -0
package/src/notifications/__tests__/emit-signal-home-feed.test.ts +1 -0
package/src/notifications/__tests__/home-feed-side-effect.test.ts +430 -7
package/src/notifications/adapters/macos.ts +12 -2
package/src/notifications/broadcaster.ts +29 -4
package/src/notifications/copy-composer.ts +17 -64
package/src/notifications/decision-engine.ts +111 -44
package/src/notifications/deterministic-checks.ts +96 -0
package/src/notifications/emit-signal.ts +1 -0
package/src/notifications/home-feed-side-effect.ts +85 -6
package/src/notifications/signal.ts +0 -4
package/src/notifications/types.ts +8 -0
package/src/oauth/platform-connection.test.ts +43 -3
package/src/oauth/platform-connection.ts +13 -4
package/src/plugins/defaults/injectors.ts +38 -19
package/src/plugins/external-plugin-loader.ts +82 -10
package/src/plugins/types.ts +16 -7
package/src/prompts/__tests__/system-prompt.test.ts +6 -51
package/src/prompts/__tests__/task-progress-hint-section.test.ts +4 -8
package/src/prompts/system-prompt.ts +0 -8
package/src/prompts/templates/BOOTSTRAP.md +5 -5
package/src/prompts/templates/system-sections.ts +0 -9
package/src/providers/__tests__/inference.test.ts +2 -0
package/src/providers/call-site-routing.ts +24 -6
package/src/providers/connection-resolution.ts +63 -13
package/src/providers/inference/__tests__/adapter-factory-openai-compatible.test.ts +74 -0
package/src/providers/inference/__tests__/connections-openai-compatible.test.ts +175 -0
package/src/providers/inference/__tests__/connections-status-label.test.ts +15 -0
package/src/providers/inference/adapter-factory.ts +9 -20
package/src/providers/inference/auth.ts +12 -0
package/src/providers/inference/backfill.ts +14 -1
package/src/providers/inference/connections.ts +85 -5
package/src/providers/inference/resolve-auth.ts +2 -0
package/src/providers/model-catalog.ts +199 -244
package/src/providers/model-intents.ts +3 -3
package/src/providers/openai/__tests__/chat-completions-provider-reasoning.test.ts +235 -0
package/src/providers/openai/chat-completions-provider.ts +159 -6
package/src/providers/openrouter/client.ts +42 -4
package/src/providers/platform-proxy/constants.ts +3 -4
package/src/providers/provider-catalog-visibility.ts +3 -1
package/src/providers/provider-send-message.ts +27 -12
package/src/providers/registry.ts +30 -1
package/src/runtime/agent-wake.ts +61 -1
package/src/runtime/auth/route-policy.ts +13 -0
package/src/runtime/http-server.ts +7 -16
package/src/runtime/http-types.ts +0 -47
package/src/runtime/routes/__tests__/consolidation-routes.test.ts +258 -0
package/src/runtime/routes/__tests__/conversation-query-routes.test.ts +66 -4
package/src/runtime/routes/__tests__/inference-provider-connection-routes.test.ts +275 -44
package/src/runtime/routes/__tests__/llm-call-sites-routes.test.ts +12 -0
package/src/runtime/routes/channel-availability-routes.ts +5 -0
package/src/runtime/routes/consolidation-routes.ts +100 -0
package/src/runtime/routes/conversation-query-routes.ts +70 -11
package/src/runtime/routes/conversation-routes.ts +7 -0
package/src/runtime/routes/index.ts +2 -0
package/src/runtime/routes/inference-provider-connection-routes.ts +134 -1
package/src/runtime/routes/integrations/a2a.ts +235 -0
package/src/runtime/routes/llm-call-sites-routes.ts +11 -1
package/src/runtime/routes/subagents-routes.ts +41 -0
package/src/subagent/manager.ts +2 -0
package/src/tools/memory/register.ts +1 -9
package/src/tools/registry.ts +2 -2
package/src/tools/types.ts +37 -2
package/src/workspace/migrations/087-memory-router-balanced-profile.ts +91 -0
package/src/workspace/migrations/registry.ts +2 -0
package/src/__tests__/guardian-action-conversation-turn.test.ts +0 -441
package/src/memory/graph/__tests__/remember-description.test.ts +0 -55
package/src/runtime/guardian-action-conversation-turn.ts +0 -99

package/src/providers/openai/__tests__/chat-completions-provider-reasoning.test.ts ADDED Viewed

@@ -0,0 +1,235 @@
+import { describe, expect, test } from "bun:test";
+import { OpenAIChatCompletionsProvider } from "../chat-completions-provider.js";
+// Fixture shape for one `reasoning_details[]` entry. Every field is optional
+// so a test can build a text-only, summary-only, or encrypted entry.
+type ReasoningDetail = {
+  type?: string;
+  summary?: string | null;
+  text?: string | null;
+};
+// Fixture shape for a streamed delta: regular `content` plus the three
+// reasoning field variants exercised by the tests in this file (`reasoning`,
+// `reasoning_content`, `reasoning_details`).
+type MockChunkDelta = {
+  content?: string | null;
+  reasoning?: string | null;
+  reasoning_content?: string | null;
+  reasoning_details?: ReasoningDetail[] | null;
+};
+// Fixture shape for one streamed chunk: a list of choices (each with a delta
+// and an optional finish reason), plus optional model name and token usage.
+type MockChunk = {
+  choices: Array<{ delta: MockChunkDelta; finish_reason?: string | null }>;
+  model?: string;
+  usage?: {
+    prompt_tokens: number;
+    completion_tokens: number;
+  };
+};
+/**
+ * Wraps the canned `chunks` in an object whose async iterator yields them
+ * one by one, in array order.
+ */
+function makeStream(chunks: MockChunk[]): AsyncIterable<MockChunk> {
+  return {
+    async *[Symbol.asyncIterator]() {
+      for (const c of chunks) yield c;
+    },
+  };
+}
+/**
+ * Builds an `OpenAIChatCompletionsProvider` (constructed with "test-key" /
+ * "test-model") whose `client` is replaced by a stub, so that
+ * `chat.completions.create` resolves to a stream of the given `chunks`.
+ *
+ * Returns the provider together with a fresh, empty `events` array that the
+ * caller is expected to hand to `runStream` for event capture.
+ */
+function stubProvider(chunks: MockChunk[]): {
+  provider: OpenAIChatCompletionsProvider;
+  events: Array<{ type: string; thinking?: string; text?: string }>;
+} {
+  const provider = new OpenAIChatCompletionsProvider("test-key", "test-model");
+  // Swap the SDK client for a stub whose chat.completions.create returns our
+  // canned async iterable.
+  (provider as unknown as { client: unknown }).client = {
+    chat: {
+      completions: {
+        create: async () => makeStream(chunks),
+      },
+    },
+  };
+  const events: Array<{ type: string; thinking?: string; text?: string }> = [];
+  // NOTE(review): nothing visible in this test file reads `__events` back;
+  // the same array is returned below and passed to runStream explicitly.
+  // Confirm whether this assignment is still needed.
+  (provider as unknown as { __events: typeof events }).__events = events;
+  return { provider, events };
+}
+/**
+ * Sends a single user text message ("hi") through `provider.sendMessage`,
+ * appending every payload delivered to `onEvent` to `events`.
+ *
+ * Resolves to `{ thinking }`, where `thinking` is the `thinking` string of the
+ * first content block in the response whose type is "thinking", or "" when
+ * the response has no such block.
+ */
+async function runStream(
+  provider: OpenAIChatCompletionsProvider,
+  events: Array<{ type: string; thinking?: string; text?: string }>,
+): Promise<{
+  thinking: string;
+}> {
+  const response = await provider.sendMessage(
+    [{ role: "user", content: [{ type: "text", text: "hi" }] }],
+    undefined,
+    undefined,
+    {
+      // Record each streamed event so tests can inspect the delta sequence.
+      onEvent: (e) => {
+        events.push(e as { type: string; thinking?: string; text?: string });
+      },
+    },
+  );
+  const thinkingBlock = response.content.find((b) => b.type === "thinking") as
+    | { type: "thinking"; thinking: string }
+    | undefined;
+  return { thinking: thinkingBlock?.thinking ?? "" };
+}
+describe("OpenAIChatCompletionsProvider reasoning parsing", () => {
+  // Two chunks carrying only `reasoning_content` should produce two
+  // thinking_delta events and a thinking block equal to their concatenation.
+  test("emits flat reasoning_content once (Fireworks/DeepSeek/Together/Groq shape)", async () => {
+    const { provider, events } = stubProvider([
+      { choices: [{ delta: { reasoning_content: "hello " } }] },
+      { choices: [{ delta: { reasoning_content: "world" } }] },
+      {
+        choices: [{ delta: {}, finish_reason: "stop" }],
+        usage: { prompt_tokens: 1, completion_tokens: 2 },
+      },
+    ]);
+    const { thinking } = await runStream(provider, events);
+    const deltas = events.filter((e) => e.type === "thinking_delta");
+    expect(deltas.map((d) => d.thinking)).toEqual(["hello ", "world"]);
+    expect(thinking).toBe("hello world");
+  });
+  // Two chunks carrying only the flat `reasoning` field should produce two
+  // thinking_delta events and a thinking block equal to their concatenation.
+  test("emits flat reasoning once (OpenRouter non-Kimi shape)", async () => {
+    const { provider, events } = stubProvider([
+      { choices: [{ delta: { reasoning: "step " } }] },
+      { choices: [{ delta: { reasoning: "two" } }] },
+      {
+        choices: [{ delta: {}, finish_reason: "stop" }],
+        usage: { prompt_tokens: 1, completion_tokens: 2 },
+      },
+    ]);
+    const { thinking } = await runStream(provider, events);
+    const deltas = events.filter((e) => e.type === "thinking_delta");
+    expect(deltas.map((d) => d.thinking)).toEqual(["step ", "two"]);
+    expect(thinking).toBe("step two");
+  });
+  // The first chunk supplies a `reasoning.text` entry through its `text`
+  // field, the second a `reasoning.summary` entry through its `summary`
+  // field. Both are expected to surface as thinking deltas, in order.
+  test("emits reasoning_details once when only details present", async () => {
+    const { provider, events } = stubProvider([
+      {
+        choices: [
+          {
+            delta: {
+              reasoning_details: [{ type: "reasoning.text", text: "alpha " }],
+            },
+          },
+        ],
+      },
+      {
+        choices: [
+          {
+            delta: {
+              reasoning_details: [
+                { type: "reasoning.summary", summary: "beta" },
+              ],
+            },
+          },
+        ],
+      },
+      {
+        choices: [{ delta: {}, finish_reason: "stop" }],
+        usage: { prompt_tokens: 1, completion_tokens: 2 },
+      },
+    ]);
+    const { thinking } = await runStream(provider, events);
+    const deltas = events.filter((e) => e.type === "thinking_delta");
+    expect(deltas.map((d) => d.thinking)).toEqual(["alpha ", "beta"]);
+    expect(thinking).toBe("alpha beta");
+  });
+  // The only reasoning in the stream is a `reasoning.encrypted` entry, so the
+  // expectation is zero thinking_delta events and no thinking block
+  // (runStream reports "" when the response has none).
+  test("skips reasoning.encrypted entries entirely", async () => {
+    const { provider, events } = stubProvider([
+      {
+        choices: [
+          {
+            delta: {
+              reasoning_details: [
+                { type: "reasoning.encrypted", text: "opaque" },
+              ],
+            },
+          },
+        ],
+      },
+      {
+        choices: [{ delta: {}, finish_reason: "stop" }],
+        usage: { prompt_tokens: 1, completion_tokens: 2 },
+      },
+    ]);
+    const { thinking } = await runStream(provider, events);
+    const deltas = events.filter((e) => e.type === "thinking_delta");
+    expect(deltas).toEqual([]);
+    expect(thinking).toBe("");
+  });
+  // The same delta carries flat `reasoning` text and an encrypted-only
+  // details array. The flat text is expected to be emitted, and the encrypted
+  // payload ("opaque") must not appear.
+  test("falls back to flat reasoning when details carry only encrypted entries", async () => {
+    const { provider, events } = stubProvider([
+      {
+        choices: [
+          {
+            delta: {
+              reasoning: "visible ",
+              reasoning_details: [
+                { type: "reasoning.encrypted", text: "opaque" },
+              ],
+            },
+          },
+        ],
+      },
+      {
+        choices: [{ delta: {}, finish_reason: "stop" }],
+        usage: { prompt_tokens: 1, completion_tokens: 2 },
+      },
+    ]);
+    const { thinking } = await runStream(provider, events);
+    const deltas = events.filter((e) => e.type === "thinking_delta");
+    expect(deltas.map((d) => d.thinking)).toEqual(["visible "]);
+    expect(thinking).toBe("visible ");
+  });
+  test("does NOT double-emit when Kimi K2.6 mirrors text into both fields", async () => {
+    // OpenRouter Kimi K2.6 with `reasoning.summary` set sends the same token
+    // in both `delta.reasoning` and `delta.reasoning_details[].text`. The
+    // structured field is preferred and the flat field is skipped, so each
+    // token appears exactly once in the output stream.
+    const { provider, events } = stubProvider([
+      {
+        choices: [
+          {
+            delta: {
+              reasoning: "it ",
+              reasoning_details: [{ type: "reasoning.text", text: "it " }],
+            },
+          },
+        ],
+      },
+      {
+        choices: [
+          {
+            delta: {
+              reasoning: "worked",
+              reasoning_details: [{ type: "reasoning.text", text: "worked" }],
+            },
+          },
+        ],
+      },
+      {
+        choices: [
+          {
+            delta: {
+              reasoning: "!",
+              reasoning_details: [{ type: "reasoning.text", text: "!" }],
+            },
+          },
+        ],
+      },
+      {
+        choices: [{ delta: {}, finish_reason: "stop" }],
+        usage: { prompt_tokens: 1, completion_tokens: 3 },
+      },
+    ]);
+    const { thinking } = await runStream(provider, events);
+    const deltas = events.filter((e) => e.type === "thinking_delta");
+    // Three mirrored chunks went in, so exactly three deltas are expected
+    // (not six), and the joined thinking text has no repeated tokens.
+    expect(deltas.map((d) => d.thinking)).toEqual(["it ", "worked", "!"]);
+    expect(thinking).toBe("it worked!");
+  });
+});

package/src/providers/openai/chat-completions-provider.ts CHANGED Viewed

@@ -69,6 +69,10 @@ export interface OpenAIChatCompletionsProviderOptions {
    *  document `low|medium|high` (e.g. Fireworks) should set this to "high" so
    *  Vellum's `xhigh`/`max` tiers don't 4xx upstream. */
   maxReasoningEffort?: "high" | "xhigh";
+  /** Parse `<think>...</think>` tags from the content stream into thinking
+   *  blocks. MiniMax and similar providers embed reasoning inside XML-style
+   *  tags in the regular content field rather than using `reasoning_content`. */
+  parseThinkTags?: boolean;
 }
 /** Map our internal effort values to OpenAI's reasoning_effort parameter.
@@ -76,7 +80,7 @@ export interface OpenAIChatCompletionsProviderOptions {
  *  passed through explicitly because OpenAI defaults `reasoning_effort` to
  *  "medium" when the field is omitted — the user's opt-out is only honored
  *  when we send it on the wire. */
-const EFFORT_TO_REASONING_EFFORT: Record<
+export const EFFORT_TO_REASONING_EFFORT: Record<
   string,
   NonNullable<
     OpenAI.Chat.Completions.ChatCompletionCreateParams["reasoning_effort"]
@@ -97,6 +101,13 @@ const OPENAI_SUPPORTED_IMAGE_TYPES = new Set([
   "image/webp",
 ]);
+/**
+ * Returns how many trailing characters of `text` match the start of `tag`.
+ *
+ * Only proper prefixes of `tag` are considered (at most `tag.length - 1`
+ * characters, and never more than `text.length`). Candidates are tried from
+ * longest to shortest, so the longest match wins. Returns 0 when `text` does
+ * not end with any such prefix.
+ */
+function partialTagSuffix(text: string, tag: string): number {
+  for (let len = Math.min(text.length, tag.length - 1); len > 0; len--) {
+    if (text.endsWith(tag.substring(0, len))) return len;
+  }
+  return 0;
+}
 /**
  * OpenAI-compatible chat-completions transport.
  *
@@ -113,6 +124,7 @@ export class OpenAIChatCompletionsProvider implements Provider {
   private extraCreateParams: Record<string, unknown>;
   private maxReasoningEffort: "high" | "xhigh";
   private requestHeaders: Record<string, string>;
+  private parseThinkTags: boolean;
   constructor(
     apiKey: string,
@@ -130,6 +142,7 @@ export class OpenAIChatCompletionsProvider implements Provider {
     this.extraCreateParams = options.extraCreateParams ?? {};
     this.maxReasoningEffort = options.maxReasoningEffort ?? "xhigh";
     this.requestHeaders = options.requestHeaders ?? {};
+    this.parseThinkTags = options.parseThinkTags ?? false;
   }
   async sendMessage(
@@ -163,10 +176,17 @@ export class OpenAIChatCompletionsProvider implements Provider {
         params.max_completion_tokens = maxTokens;
       }
+      // Subclasses (OpenRouter) may already have nested effort under
+      // `reasoning.effort` via `buildExtraCreateParams`. Skip the flat
+      // `reasoning_effort` assignment in that case to avoid sending both forms,
+      // which OpenRouter rejects on reasoning models.
+      const nestedReasoningEffort = (
+        params as { reasoning?: { effort?: unknown } }
+      ).reasoning?.effort;
       const reasoningEffort = effort
         ? EFFORT_TO_REASONING_EFFORT[effort]
         : undefined;
-      if (reasoningEffort) {
+      if (reasoningEffort && typeof nestedReasoningEffort !== "string") {
         params.reasoning_effort =
           reasoningEffort === "xhigh" && this.maxReasoningEffort === "high"
             ? "high"
@@ -189,6 +209,68 @@ export class OpenAIChatCompletionsProvider implements Provider {
       // Accumulate the response from chunks
       let contentText = "";
+      let reasoningText = "";
+      let insideThinkBlock = false;
+      let pendingContent = "";
+      // Drains `pendingContent`, splitting it on `<think>` / `</think>`:
+      // text outside a think block is appended to `contentText` and emitted
+      // as `text_delta`; text inside is appended to `reasoningText` and
+      // emitted as `thinking_delta`. The tags themselves are dropped.
+      //
+      // When `final` is false, a trailing fragment that could be the start of
+      // the tag currently being searched for is held back in `pendingContent`
+      // so a tag split across chunks is still recognised. When `final` is
+      // true nothing is held back and all remaining text is emitted.
+      const flushPendingContent = (final: boolean): void => {
+        while (pendingContent.length > 0) {
+          if (insideThinkBlock) {
+            const closeIdx = pendingContent.indexOf("</think>");
+            if (closeIdx >= 0) {
+              // Closing tag found: everything before it is reasoning.
+              const thinking = pendingContent.substring(0, closeIdx);
+              if (thinking) {
+                reasoningText += thinking;
+                onEvent?.({ type: "thinking_delta", thinking });
+              }
+              insideThinkBlock = false;
+              // Skip past the tag and keep looping over what follows it.
+              pendingContent = pendingContent.substring(
+                closeIdx + "</think>".length,
+              );
+            } else {
+              // No complete closing tag yet. Emit all but a possible partial
+              // `</think>` at the end (nothing is withheld on the final pass).
+              const partial = final
+                ? 0
+                : partialTagSuffix(pendingContent, "</think>");
+              const safeLen = pendingContent.length - partial;
+              if (safeLen > 0) {
+                const thinking = pendingContent.substring(0, safeLen);
+                reasoningText += thinking;
+                onEvent?.({ type: "thinking_delta", thinking });
+              }
+              pendingContent =
+                partial > 0 ? pendingContent.substring(safeLen) : "";
+              // Nothing more can be decided until further input arrives.
+              break;
+            }
+          } else {
+            const openIdx = pendingContent.indexOf("<think>");
+            if (openIdx >= 0) {
+              // Opening tag found: everything before it is regular content.
+              const text = pendingContent.substring(0, openIdx);
+              if (text) {
+                contentText += text;
+                onEvent?.({ type: "text_delta", text });
+              }
+              insideThinkBlock = true;
+              // Skip past the tag and keep looping over what follows it.
+              pendingContent = pendingContent.substring(
+                openIdx + "<think>".length,
+              );
+            } else {
+              // No complete opening tag yet. Emit all but a possible partial
+              // `<think>` at the end (nothing is withheld on the final pass).
+              const partial = final
+                ? 0
+                : partialTagSuffix(pendingContent, "<think>");
+              const safeLen = pendingContent.length - partial;
+              if (safeLen > 0) {
+                const t = pendingContent.substring(0, safeLen);
+                contentText += t;
+                onEvent?.({ type: "text_delta", text: t });
+              }
+              pendingContent =
+                partial > 0 ? pendingContent.substring(safeLen) : "";
+              // Nothing more can be decided until further input arrives.
+              break;
+            }
+          }
+        }
+      };
       const toolCallMap = new Map<
         number,
         { id: string; name: string; args: string }
@@ -216,8 +298,62 @@ export class OpenAIChatCompletionsProvider implements Provider {
           const choice = chunk.choices[0];
           if (choice) {
             if (choice.delta.content) {
-              contentText += choice.delta.content;
-              onEvent?.({ type: "text_delta", text: choice.delta.content });
+              if (this.parseThinkTags) {
+                pendingContent += choice.delta.content;
+                flushPendingContent(false);
+              } else {
+                contentText += choice.delta.content;
+                onEvent?.({ type: "text_delta", text: choice.delta.content });
+              }
+            }
+            // Compatibility providers disagree on the field name: Fireworks /
+            // DeepSeek / Together / Groq stream `reasoning_content`; OpenRouter
+            // (per its ChatAssistantMessage spec) streams `reasoning`, and for
+            // reasoning summaries (e.g. Kimi K2.6) also populates
+            // `delta.reasoning_details[]` (entries are `reasoning.summary`,
+            // `reasoning.text`, or opaque `reasoning.encrypted`).
+            //
+            // Kimi K2.6 mirrors the same token into BOTH `delta.reasoning` and
+            // `delta.reasoning_details[].text` per chunk — prefer details when
+            // they carry visible text, otherwise fall through to the flat
+            // field. The encrypted-only case must fall through too, so the
+            // flat `reasoning` field isn't silently dropped.
+            const deltaWithReasoning = choice.delta as {
+              reasoning?: string | null;
+              reasoning_content?: string | null;
+              reasoning_details?: Array<{
+                type?: string;
+                summary?: string | null;
+                text?: string | null;
+              }> | null;
+            };
+            let sawVisibleDetail = false;
+            const reasoningDetails = deltaWithReasoning.reasoning_details;
+            if (Array.isArray(reasoningDetails)) {
+              for (const entry of reasoningDetails) {
+                if (entry.type === "reasoning.encrypted") continue;
+                const piece = entry.summary ?? entry.text;
+                if (piece) {
+                  sawVisibleDetail = true;
+                  reasoningText += piece;
+                  onEvent?.({ type: "thinking_delta", thinking: piece });
+                }
+              }
+            }
+            if (!sawVisibleDetail) {
+              const reasoningContent =
+                deltaWithReasoning.reasoning_content ??
+                deltaWithReasoning.reasoning;
+              if (reasoningContent) {
+                reasoningText += reasoningContent;
+                onEvent?.({
+                  type: "thinking_delta",
+                  thinking: reasoningContent,
+                });
+              }
             }
             if (choice.delta.tool_calls) {
@@ -260,10 +396,27 @@ export class OpenAIChatCompletionsProvider implements Provider {
         cleanupTimeout();
       }
+      if (this.parseThinkTags && pendingContent) {
+        flushPendingContent(true);
+      }
       // Build content blocks
+      const finalReasoning = this.parseThinkTags
+        ? reasoningText.trim()
+        : reasoningText;
+      const finalContent = this.parseThinkTags
+        ? contentText.trim()
+        : contentText;
       const content: ContentBlock[] = [];
-      if (contentText) {
-        content.push({ type: "text", text: contentText });
+      if (finalReasoning) {
+        content.push({
+          type: "thinking",
+          thinking: finalReasoning,
+          signature: "",
+        });
+      }
+      if (finalContent) {
+        content.push({ type: "text", text: finalContent });
       }
       for (const [, tc] of toolCallMap) {
         let input: Record<string, unknown>;

package/src/providers/openrouter/client.ts CHANGED Viewed

@@ -1,6 +1,9 @@
 import { ProviderError } from "../../util/errors.js";
 import { AnthropicProvider } from "../anthropic/client.js";
-import { OpenAIChatCompletionsProvider } from "../openai/chat-completions-provider.js";
+import {
+  EFFORT_TO_REASONING_EFFORT,
+  OpenAIChatCompletionsProvider,
+} from "../openai/chat-completions-provider.js";
 import { isThinkingConfigEnabled } from "../thinking-config.js";
 import type {
   Message,
@@ -53,6 +56,25 @@ export function extractOnlyList(config: unknown): string[] {
   return only.filter((x): x is string => typeof x === "string" && x.length > 0);
 }
+// OpenRouter's `reasoning.summary` field controls whether reasoning models emit
+// a human-readable summary alongside (or instead of) encrypted reasoning blocks.
+// Models like Kimi K2.6 return only encrypted `reasoning_details` unless a
+// summary level is requested, so the stream carries no visible thinking content.
+// Default to "detailed" so users see thinking by default; allow per-call
+// override via `config.openrouter.reasoning.summary`. Per OpenRouter's
+// ChatRequestReasoning schema, valid values are "auto" | "concise" | "detailed".
+const VALID_REASONING_SUMMARIES = new Set(["auto", "concise", "detailed"]);
+/**
+ * Reads `config.openrouter.reasoning.summary` and returns it only when it is
+ * a string contained in `VALID_REASONING_SUMMARIES`. Returns `undefined` when
+ * the config or any intermediate key is missing, or when the value is not one
+ * of the accepted strings.
+ */
+function extractReasoningSummaryOverride(config: unknown): string | undefined {
+  const cfg = config as
+    | { openrouter?: { reasoning?: { summary?: unknown } } }
+    | undefined;
+  const summary = cfg?.openrouter?.reasoning?.summary;
+  return typeof summary === "string" && VALID_REASONING_SUMMARIES.has(summary)
+    ? summary
+    : undefined;
+}
 /**
  * Rewrite `options.config` for the Anthropic-compat path so OpenRouter's
  * `provider: { only: [...] }` body field travels through `AnthropicProvider`'s
@@ -160,14 +182,30 @@ export class OpenRouterProvider extends OpenAIChatCompletionsProvider {
   // OpenRouter's unified `reasoning` parameter controls extended thinking on
   // its OpenAI-compatible endpoint. Anthropic models skip this path entirely and
   // go through AnthropicProvider, which receives the native `thinking` object.
+  //
+  // `effort` nests under `reasoning` here (rather than flat `reasoning_effort`)
+  // because OpenRouter's documented `ChatRequestReasoning` shape is the union of
+  // { effort, summary }. `summary` is needed for models like Kimi K2.6 that
+  // would otherwise return only encrypted reasoning blocks; when thinking is
+  // enabled we send "detailed" unless `config.openrouter.reasoning.summary` overrides it.
   protected override buildExtraCreateParams(
     options?: SendMessageOptions,
   ): Record<string, unknown> {
     const config = options?.config as Record<string, unknown> | undefined;
     const thinkingEnabled = isThinkingConfigEnabled(config?.thinking);
-    const extras: Record<string, unknown> = {
-      reasoning: { enabled: thinkingEnabled },
-    };
+    const effort = config?.effort as string | undefined;
+    const mappedEffort = effort
+      ? EFFORT_TO_REASONING_EFFORT[effort]
+      : undefined;
+    const summaryOverride = extractReasoningSummaryOverride(config);
+    const reasoning: Record<string, unknown> = { enabled: thinkingEnabled };
+    if (mappedEffort) {
+      reasoning.effort = mappedEffort;
+    }
+    if (thinkingEnabled) {
+      reasoning.summary = summaryOverride ?? "detailed";
+    }
+    const extras: Record<string, unknown> = { reasoning };
     const only = extractOnlyList(config);
     if (only.length > 0) {
       const existingProvider = (config?.provider ?? {}) as Record<

package/src/providers/platform-proxy/constants.ts CHANGED Viewed

@@ -43,14 +43,13 @@ export const PLATFORM_PROVIDER_META: Record<string, ManagedProviderMeta> = {
   },
   fireworks: {
     name: "fireworks",
-    managed: false,
+    managed: true,
+    proxyPath: "/v1/runtime-proxy/fireworks",
   },
   openrouter: {
     name: "openrouter",
     managed: false,
   },
   ollama: { name: "ollama", managed: false },
-  zai: { name: "zai", managed: false },
-  deepseek: { name: "deepseek", managed: false },
-  minimax: { name: "minimax", managed: false },
+  "openai-compatible": { name: "openai-compatible", managed: false },
 };

package/src/providers/provider-catalog-visibility.ts CHANGED Viewed

@@ -32,5 +32,7 @@ export function getVisibleProviderCatalog(
       if (visibleModels.length === entry.models.length) return entry;
       return { ...entry, models: visibleModels };
     })
-    .filter((entry) => entry.models.length > 0);
+    .filter(
+      (entry) => entry.models.length > 0 || entry.defaultModel === "",
+    );
 }

package/src/providers/provider-send-message.ts CHANGED Viewed

@@ -7,8 +7,10 @@
 import { resolveCallSiteConfig } from "../config/llm-resolver.js";
 import { getConfig } from "../config/loader.js";
 import type { LLMCallSite } from "../config/schemas/llm.js";
+import { getDb } from "../memory/db-connection.js";
 import { getLogger } from "../util/logger.js";
 import { tryResolveProviderForConnectionName } from "./connection-resolution.js";
+import { listConnections } from "./inference/connections.js";
 import { initializeProviders, listProviders } from "./registry.js";
 import type {
   ContentBlock,
@@ -110,22 +112,35 @@ export async function resolveConfiguredProvider(
   const resolved = resolveCallSiteConfig(callSite, config.llm, opts);
   const inferenceProvider = resolved.provider;
-  const connectionName = resolved.provider_connection;
+  let connectionName = resolved.provider_connection;
   // Connection-aware path: every dispatch goes through `provider_connection`.
   // The boot-time backfill ensures every profile has one in production.
-  // When unset (test envs that skip backfill, freshly-installed configs
-  // not yet backfilled, or users who manually cleared the field), we
-  // return null so callsites with deterministic fallbacks (invite
-  // instructions, telegram username resolution, etc.) keep working.
-  // Hard config errors — connection lookup failure, provider mismatch —
-  // still throw via `tryResolveProviderForConnectionName` below.
+  // When unset (a profile that picks a provider with the "Any active"
+  // connection, test envs that skip backfill, freshly-installed configs not
+  // yet backfilled, or users who manually cleared the field), use the first
+  // active connection listed for the provider before falling back to null.
   if (!connectionName) {
-    log.debug(
-      { callSite, inferenceProvider },
-      "resolveCallSiteConfig yielded no provider_connection — returning null so callsite can fall back",
-    );
-    return null;
+    if (inferenceProvider) {
+      try {
+        const candidates = listConnections(getDb(), {
+          provider: inferenceProvider,
+        });
+        const active = candidates.find((c) => c.status === "active");
+        if (active) {
+          connectionName = active.name;
+        }
+      } catch {
+        // Best-effort lookup: any error (e.g. DB not available) falls through to the null-return path below.
+      }
+    }
+    if (!connectionName) {
+      log.debug(
+        { callSite, inferenceProvider },
+        "resolveCallSiteConfig yielded no provider_connection — returning null so callsite can fall back",
+      );
+      return null;
+    }
   }
   const connectionProvider = await tryResolveProviderForConnectionName(