npm - @firstlovecenter/ai-chat - Versions diffs - 0.2.3 → 0.6.0 - Mend

@firstlovecenter/ai-chat 0.2.3 → 0.6.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (29)

package/CHANGELOG.md +57 -0
package/dist/drizzle/index.cjs +24 -0
package/dist/drizzle/index.cjs.map +1 -1
package/dist/drizzle/index.d.cts +36 -1
package/dist/drizzle/index.d.ts +36 -1
package/dist/drizzle/index.js +25 -1
package/dist/drizzle/index.js.map +1 -1
package/dist/prisma/index.cjs +7 -0
package/dist/prisma/index.cjs.map +1 -1
package/dist/prisma/index.d.cts +8 -1
package/dist/prisma/index.d.ts +8 -1
package/dist/prisma/index.js +7 -0
package/dist/prisma/index.js.map +1 -1
package/dist/server/index.cjs +353 -15
package/dist/server/index.cjs.map +1 -1
package/dist/server/index.d.cts +50 -4
package/dist/server/index.d.ts +50 -4
package/dist/server/index.js +353 -15
package/dist/server/index.js.map +1 -1
package/dist/{types-DNwFvL-C.d.cts → types-CQntnyDJ.d.cts} +24 -2
package/dist/{types-DNwFvL-C.d.ts → types-CQntnyDJ.d.ts} +24 -2
package/dist/ui/index.cjs +1024 -87
package/dist/ui/index.cjs.map +1 -1
package/dist/ui/index.d.cts +24 -12
package/dist/ui/index.d.ts +24 -12
package/dist/ui/index.js +1022 -88
package/dist/ui/index.js.map +1 -1
package/package.json +1 -1
package/prisma/chat-models.prisma +7 -0

package/dist/server/index.d.cts CHANGED

@@ -1,7 +1,8 @@
-import { S as SystemBlock, T as ToolSchema, a as ToolContext, b as ToolDefinition, P as PresentPayload, c as PersistencePort, A as AuthPort, d as ScopePort, e as ToolsPort, V as VertexPort, L as LoggerPort } from '../types-DNwFvL-C.cjs';
-export { f as AiSettings, g as AiSettingsPatch, h as AppendMessageInput, i as AuthFail, j as AuthOk, k as AuthResult, B as Block, C as ChartSpec, l as ChatMessage, m as ChatMessageRole, n as ChatSession, o as CreateSessionInput, p as ListSessionsOpts, q as TERMINAL_TOOL_NAME, r as ToolResult, s as err, t as ok } from '../types-DNwFvL-C.cjs';
+import { S as SystemBlock, T as ToolSchema, a as ToolContext, b as ToolDefinition, P as PresentPayload, c as PersistencePort, A as AuthPort, d as ScopePort, e as ToolsPort, V as VertexPort, L as LoggerPort } from '../types-CQntnyDJ.cjs';
+export { f as AiSettings, g as AiSettingsPatch, h as AppendMessageInput, i as AuthFail, j as AuthOk, k as AuthResult, B as Block, C as ChartSpec, l as ChatMessage, m as ChatMessageRole, n as ChatSession, o as CreateSessionInput, p as ListSessionsOpts, q as TERMINAL_TOOL_NAME, r as ToolResult, s as err, t as ok } from '../types-CQntnyDJ.cjs';
 import { GoogleAuth } from 'google-auth-library';
 export { GoogleAuth } from 'google-auth-library';
+import 'zod';
 /**
  * Provider-agnostic tool-calling abstraction.
@@ -302,6 +303,34 @@ declare function createAgentCustomRoutes<S>(ctx: AgentCustomRouteCtx<S>): {
     POST: (req: Request) => Promise<Response>;
 };
+/**
+ * Streaming-route hooks for the Vercel AI SDK chat.
+ *
+ * Identical to `AgentCustomHooks` — the lifecycle (pre-auth → auth →
+ * post-auth → resolve session → onSessionStart → stream → onSessionEnd)
+ * is the same. We re-alias rather than introducing a new type so consumers
+ * can plug a single hook bag into both routes.
+ */
+type AgentVercelHooks$1<S> = AgentCustomHooks$1<S>;
+type AgentVercelRouteCtx<S> = {
+    persistence: PersistencePort;
+    auth: AuthPort<S>;
+    scope: ScopePort<S>;
+    tools: ToolsPort;
+    vertex: VertexPort;
+    logger?: LoggerPort;
+    /**
+     * Optional lifecycle hooks. See `AgentCustomHooks` for the available
+     * extension points (shutdown gating, rate limiting, per-request
+     * resource setup/teardown).
+     */
+    hooks?: AgentVercelHooks$1<S>;
+};
+declare function createAgentVercelRoutes<S>(ctx: AgentVercelRouteCtx<S>): {
+    /** Next.js-compatible POST handler. */
+    POST: (req: Request) => Promise<Response>;
+};
 /**
  * `chat-sessions` route factory — host-agnostic CRUD for chat sessions.
  *
@@ -369,7 +398,7 @@ declare function createChatSessionsRoutes<S>(ctx: ChatSessionsRouteCtx<S>): {
 /**
  * `/api/admin/ai-settings` route factory — global AI configuration (super_admin only).
  *
- * Three patchable fields on the singleton settings row:
+ * Five patchable fields on the singleton settings row:
  *   - `tool_provider` — vendor that drives the agent tool loop. Validated
  *     against the registered `toolProviders` registry passed in via ctx.
  *   - `gcp_location` — the Vertex region every provider call hits. Stays
@@ -379,6 +408,15 @@ declare function createChatSessionsRoutes<S>(ctx: ChatSessionsRouteCtx<S>): {
  *     against the `chatInterfaces` registry passed in via ctx (the actual
  *     registry lives in `@firstlovecenter/ai-chat/ui` so the host wires it through;
  *     the route stays free of UI imports).
+ *   - `max_output_tokens` — caps the agent loop's per-turn output AND each
+ *     narrator's prose pass. Bounded `[256, 64000]` — anything below 256 can't
+ *     fit a useful response, anything above 64000 exceeds the headroom of any
+ *     model currently routed through Vertex.
+ *   - `role_prompt` — admin-editable persona string. Empty string and the
+ *     explicit JSON `null` both clear the override back to the host's static
+ *     `configureAiChat({ rolePrompt })` fallback; we canonicalise an empty/
+ *     whitespace-only string to `null` on write so the "no override" state has
+ *     a single representation in storage.
  *
  * Wire format is snake_case to preserve byte-for-byte parity with the
  * host route the package replaces — existing host UIs keep working
@@ -501,6 +539,7 @@ type AiChatRuntime<S = unknown> = {
     }) => Promise<AgentResult>;
     routes: {
         agentCustom: ReturnType<typeof createAgentCustomRoutes<S>>;
+        agentVercel: ReturnType<typeof createAgentVercelRoutes<S>>;
         chatSessions: ReturnType<typeof createChatSessionsRoutes<S>>;
         adminSettings: ReturnType<typeof createAdminSettingsRoutes<S>>;
     };
@@ -513,5 +552,12 @@ declare function configureAiChat<S = unknown>(opts: ConfigureAiChatOpts<S>): AiC
 type RouteHooks<S> = RouteHooks$1<S>;
 type AgentCustomHooks<S> = AgentCustomHooks$1<S>;
+/**
+ * Alias of `AgentCustomHooks` — the Vercel AI SDK chat reuses the same
+ * lifecycle (pre-auth → auth → post-auth → resolve session → onSessionStart
+ * → stream → onSessionEnd). Re-exported for callers that prefer the more
+ * specific name.
+ */
+type AgentVercelHooks<S> = AgentVercelHooks$1<S>;
-export { type AgentCustomHooks, type AgentInput, type AgentResult, type AiChatRuntime, AuthPort, BUILTIN_CHAT_INTERFACE_IDS, type ChatInterfaceRegistryEntry, type ConfigureAiChatOpts, DEFAULT_MAX_OUTPUT_TOKENS, DEFAULT_MAX_TOOL_TURNS, LoggerPort, PersistencePort, PresentPayload, type ProviderInitOpts, type RouteHooks, ScopePort, SystemBlock, ToolContext, ToolDefinition, type ToolProviderDef, ToolSchema, ToolsPort, type TranscriptEntry, VertexPort, configureAiChat, getToolProvider, runAgent, toolProviders };
+export { type AgentCustomHooks, type AgentInput, type AgentResult, type AgentVercelHooks, type AiChatRuntime, AuthPort, BUILTIN_CHAT_INTERFACE_IDS, type ChatInterfaceRegistryEntry, type ConfigureAiChatOpts, DEFAULT_MAX_OUTPUT_TOKENS, DEFAULT_MAX_TOOL_TURNS, LoggerPort, PersistencePort, PresentPayload, type ProviderInitOpts, type RouteHooks, ScopePort, SystemBlock, ToolContext, ToolDefinition, type ToolProviderDef, ToolSchema, ToolsPort, type TranscriptEntry, VertexPort, configureAiChat, getToolProvider, runAgent, toolProviders };

package/dist/server/index.d.ts CHANGED

@@ -1,7 +1,8 @@
-import { S as SystemBlock, T as ToolSchema, a as ToolContext, b as ToolDefinition, P as PresentPayload, c as PersistencePort, A as AuthPort, d as ScopePort, e as ToolsPort, V as VertexPort, L as LoggerPort } from '../types-DNwFvL-C.js';
-export { f as AiSettings, g as AiSettingsPatch, h as AppendMessageInput, i as AuthFail, j as AuthOk, k as AuthResult, B as Block, C as ChartSpec, l as ChatMessage, m as ChatMessageRole, n as ChatSession, o as CreateSessionInput, p as ListSessionsOpts, q as TERMINAL_TOOL_NAME, r as ToolResult, s as err, t as ok } from '../types-DNwFvL-C.js';
+import { S as SystemBlock, T as ToolSchema, a as ToolContext, b as ToolDefinition, P as PresentPayload, c as PersistencePort, A as AuthPort, d as ScopePort, e as ToolsPort, V as VertexPort, L as LoggerPort } from '../types-CQntnyDJ.js';
+export { f as AiSettings, g as AiSettingsPatch, h as AppendMessageInput, i as AuthFail, j as AuthOk, k as AuthResult, B as Block, C as ChartSpec, l as ChatMessage, m as ChatMessageRole, n as ChatSession, o as CreateSessionInput, p as ListSessionsOpts, q as TERMINAL_TOOL_NAME, r as ToolResult, s as err, t as ok } from '../types-CQntnyDJ.js';
 import { GoogleAuth } from 'google-auth-library';
 export { GoogleAuth } from 'google-auth-library';
+import 'zod';
 /**
  * Provider-agnostic tool-calling abstraction.
@@ -302,6 +303,34 @@ declare function createAgentCustomRoutes<S>(ctx: AgentCustomRouteCtx<S>): {
     POST: (req: Request) => Promise<Response>;
 };
+/**
+ * Streaming-route hooks for the Vercel AI SDK chat.
+ *
+ * Identical to `AgentCustomHooks` — the lifecycle (pre-auth → auth →
+ * post-auth → resolve session → onSessionStart → stream → onSessionEnd)
+ * is the same. We re-alias rather than introducing a new type so consumers
+ * can plug a single hook bag into both routes.
+ */
+type AgentVercelHooks$1<S> = AgentCustomHooks$1<S>;
+type AgentVercelRouteCtx<S> = {
+    persistence: PersistencePort;
+    auth: AuthPort<S>;
+    scope: ScopePort<S>;
+    tools: ToolsPort;
+    vertex: VertexPort;
+    logger?: LoggerPort;
+    /**
+     * Optional lifecycle hooks. See `AgentCustomHooks` for the available
+     * extension points (shutdown gating, rate limiting, per-request
+     * resource setup/teardown).
+     */
+    hooks?: AgentVercelHooks$1<S>;
+};
+declare function createAgentVercelRoutes<S>(ctx: AgentVercelRouteCtx<S>): {
+    /** Next.js-compatible POST handler. */
+    POST: (req: Request) => Promise<Response>;
+};
 /**
  * `chat-sessions` route factory — host-agnostic CRUD for chat sessions.
  *
@@ -369,7 +398,7 @@ declare function createChatSessionsRoutes<S>(ctx: ChatSessionsRouteCtx<S>): {
 /**
  * `/api/admin/ai-settings` route factory — global AI configuration (super_admin only).
  *
- * Three patchable fields on the singleton settings row:
+ * Five patchable fields on the singleton settings row:
  *   - `tool_provider` — vendor that drives the agent tool loop. Validated
  *     against the registered `toolProviders` registry passed in via ctx.
  *   - `gcp_location` — the Vertex region every provider call hits. Stays
@@ -379,6 +408,15 @@ declare function createChatSessionsRoutes<S>(ctx: ChatSessionsRouteCtx<S>): {
  *     against the `chatInterfaces` registry passed in via ctx (the actual
  *     registry lives in `@firstlovecenter/ai-chat/ui` so the host wires it through;
  *     the route stays free of UI imports).
+ *   - `max_output_tokens` — caps the agent loop's per-turn output AND each
+ *     narrator's prose pass. Bounded `[256, 64000]` — anything below 256 can't
+ *     fit a useful response, anything above 64000 exceeds the headroom of any
+ *     model currently routed through Vertex.
+ *   - `role_prompt` — admin-editable persona string. Empty string and the
+ *     explicit JSON `null` both clear the override back to the host's static
+ *     `configureAiChat({ rolePrompt })` fallback; we canonicalise an empty/
+ *     whitespace-only string to `null` on write so the "no override" state has
+ *     a single representation in storage.
  *
  * Wire format is snake_case to preserve byte-for-byte parity with the
  * host route the package replaces — existing host UIs keep working
@@ -501,6 +539,7 @@ type AiChatRuntime<S = unknown> = {
     }) => Promise<AgentResult>;
     routes: {
         agentCustom: ReturnType<typeof createAgentCustomRoutes<S>>;
+        agentVercel: ReturnType<typeof createAgentVercelRoutes<S>>;
         chatSessions: ReturnType<typeof createChatSessionsRoutes<S>>;
         adminSettings: ReturnType<typeof createAdminSettingsRoutes<S>>;
     };
@@ -513,5 +552,12 @@ declare function configureAiChat<S = unknown>(opts: ConfigureAiChatOpts<S>): AiC
 type RouteHooks<S> = RouteHooks$1<S>;
 type AgentCustomHooks<S> = AgentCustomHooks$1<S>;
+/**
+ * Alias of `AgentCustomHooks` — the Vercel AI SDK chat reuses the same
+ * lifecycle (pre-auth → auth → post-auth → resolve session → onSessionStart
+ * → stream → onSessionEnd). Re-exported for callers that prefer the more
+ * specific name.
+ */
+type AgentVercelHooks<S> = AgentVercelHooks$1<S>;
-export { type AgentCustomHooks, type AgentInput, type AgentResult, type AiChatRuntime, AuthPort, BUILTIN_CHAT_INTERFACE_IDS, type ChatInterfaceRegistryEntry, type ConfigureAiChatOpts, DEFAULT_MAX_OUTPUT_TOKENS, DEFAULT_MAX_TOOL_TURNS, LoggerPort, PersistencePort, PresentPayload, type ProviderInitOpts, type RouteHooks, ScopePort, SystemBlock, ToolContext, ToolDefinition, type ToolProviderDef, ToolSchema, ToolsPort, type TranscriptEntry, VertexPort, configureAiChat, getToolProvider, runAgent, toolProviders };
+export { type AgentCustomHooks, type AgentInput, type AgentResult, type AgentVercelHooks, type AiChatRuntime, AuthPort, BUILTIN_CHAT_INTERFACE_IDS, type ChatInterfaceRegistryEntry, type ConfigureAiChatOpts, DEFAULT_MAX_OUTPUT_TOKENS, DEFAULT_MAX_TOOL_TURNS, LoggerPort, PersistencePort, PresentPayload, type ProviderInitOpts, type RouteHooks, ScopePort, SystemBlock, ToolContext, ToolDefinition, type ToolProviderDef, ToolSchema, ToolsPort, type TranscriptEntry, VertexPort, configureAiChat, getToolProvider, runAgent, toolProviders };

package/dist/server/index.js CHANGED

@@ -1,5 +1,8 @@
 import { AnthropicVertex } from '@anthropic-ai/vertex-sdk';
 import { randomUUID } from 'crypto';
+import { StreamData, streamText, tool } from 'ai';
+import { createVertex } from '@ai-sdk/google-vertex';
+import { createVertexAnthropic } from '@ai-sdk/google-vertex/anthropic';
 export { GoogleAuth } from 'google-auth-library';
 // src/server/tools/types.ts
@@ -70,8 +73,8 @@ async function runAgent(input) {
     const toolResults = [];
     for (const tc of response.toolCalls) {
       transcript.push({ kind: "tool_use", name: tc.name, input: tc.input });
-      const tool = input.tools[tc.name];
-      if (!tool) {
+      const tool2 = input.tools[tc.name];
+      if (!tool2) {
         const errResult = {
           ok: false,
           error: { code: "UNKNOWN_TOOL", message: `Unknown tool: ${tc.name}` }
@@ -85,7 +88,7 @@ async function runAgent(input) {
         });
         continue;
       }
-      const result = await tool.execute(tc.input, {
+      const result = await tool2.execute(tc.input, {
         ...input.ctx,
         toolCallCount
       });
@@ -647,7 +650,7 @@ async function* streamClaudeNarration(opts) {
   });
   const stream = await client.messages.stream({
     model: opts.modelId,
-    max_tokens: 400,
+    max_tokens: opts.maxTokens,
     system: NARRATIVE_SYSTEM,
     messages: [{ role: "user", content: buildNarrativeUserMessage(opts.input) }]
   });
@@ -707,7 +710,7 @@ async function* streamGeminiNarration(opts) {
           parts: [{ text: buildNarrativeUserMessage(opts.input) }]
         }
       ],
-      generationConfig: { maxOutputTokens: 400, temperature: 0 }
+      generationConfig: { maxOutputTokens: opts.maxTokens, temperature: 0 }
     })
   });
   if (!res.ok || !res.body) {
@@ -783,7 +786,7 @@ async function* streamGrokNarration(opts) {
     },
     body: JSON.stringify({
       model: opts.modelId,
-      max_tokens: 400,
+      max_tokens: opts.maxTokens,
       stream: true,
       messages: [
         { role: "system", content: NARRATIVE_SYSTEM3 },
@@ -1006,7 +1009,8 @@ data: ${JSON.stringify(data)}
               ctx: toolContext,
               tools: tools.tools,
               systemBlocks,
-              provider
+              provider,
+              maxOutputTokens: aiSettings.maxOutputTokens
             });
             if (!agentResult.ok) {
               persistedError = agentResult.error;
@@ -1032,6 +1036,7 @@ data: ${JSON.stringify(data)}
                     projectId: vertex.projectId,
                     location: aiSettings.gcpLocation,
                     modelId: narratorModelId,
+                    maxTokens: aiSettings.maxOutputTokens,
                     input: {
                       question,
                       structured,
@@ -1135,6 +1140,297 @@ data: {}
     }
   };
 }
+function buildVercelTools(tools, ctx, data, onPresent) {
+  const result = {};
+  let toolCallCount = 0;
+  for (const [name, def] of Object.entries(tools)) {
+    if (!def.zodSchema) {
+      throw new Error(
+        `Tool '${name}' has no zodSchema; required for the Vercel AI SDK chat. Add a Zod schema to the tool definition (or remove it from the registry if the host only uses the custom SSE chat).`
+      );
+    }
+    if (name === TERMINAL_TOOL_NAME) {
+      result[name] = tool({
+        description: def.schema.description,
+        // The Zod schema doubles as the runtime parameter validator the SDK
+        // hands the model. We accept whatever Zod shape the host registered;
+        // the SDK uses it to validate the tool-call arguments before dispatch.
+        parameters: def.zodSchema,
+        execute: async (input) => {
+          if (toolCallCount < 2) {
+            return {
+              error: {
+                code: "SELF_VERIFY_REQUIRED",
+                message: "Per FR-8.3 you must run at least one CROSS-CHECK tool call (a different metric, a different period, or a run_sql sanity-check) before present. Make that extra call now, then call present again."
+              }
+            };
+          }
+          const payload = input;
+          for (let i = 0; i < payload.blocks.length; i++) {
+            data.append({
+              type: "block",
+              value: { index: i, ...payload.blocks[i] }
+            });
+          }
+          onPresent(payload);
+          return { ok: true };
+        }
+      });
+      continue;
+    }
+    result[name] = tool({
+      description: def.schema.description,
+      parameters: def.zodSchema,
+      execute: async (input) => {
+        const res = await def.execute(input, { ...ctx, toolCallCount });
+        toolCallCount += 1;
+        if (res.ok) return res.data;
+        return { error: res.error };
+      }
+    });
+  }
+  return result;
+}
+// src/server/routes/agent-vercel.ts
+var VALID_MODELS = /* @__PURE__ */ new Set(["claude", "gemini"]);
+function jsonError2(status, code, message) {
+  return new Response(JSON.stringify({ error: { code, message } }), {
+    status,
+    headers: { "Content-Type": "application/json" }
+  });
+}
+function defaultGenerateSessionId2() {
+  return randomUUID().replace(/-/g, "").slice(0, 16);
+}
+function createAgentVercelRoutes(ctx) {
+  const { persistence, auth, scope, tools, vertex, logger, hooks } = ctx;
+  return {
+    /** Next.js-compatible POST handler. */
+    POST: async (req) => {
+      if (hooks?.onRequest) {
+        const short = await hooks.onRequest(req);
+        if (short) return short;
+      }
+      const authResult = await auth.requireAuth(req);
+      if (!authResult.ok) return authResult.response;
+      const { scope: callerScope, userId } = authResult;
+      if (hooks?.onAuthenticated) {
+        const short = await hooks.onAuthenticated({
+          req,
+          scope: callerScope,
+          userId
+        });
+        if (short) return short;
+      }
+      const body = await req.json().catch(() => null);
+      const question = typeof body?.question === "string" ? body.question.trim() : "";
+      if (!question) {
+        return jsonError2(
+          400,
+          "VALIDATION_FAILED",
+          "question must be a non-empty string."
+        );
+      }
+      const rawChatSessionId = body?.chatSessionId;
+      const incomingChatSessionId = typeof rawChatSessionId === "number" && Number.isInteger(rawChatSessionId) ? rawChatSessionId : null;
+      const rawModel = body?.model;
+      const requestedModel = typeof rawModel === "string" && VALID_MODELS.has(rawModel) ? rawModel : null;
+      const aiSettings = await persistence.getAiSettings();
+      let chatSessionId;
+      if (incomingChatSessionId !== null) {
+        const owned = await persistence.getSession(
+          incomingChatSessionId,
+          userId
+        );
+        if (!owned) {
+          return jsonError2(404, "NOT_FOUND", "Chat session not found.");
+        }
+        chatSessionId = owned.id;
+      } else {
+        const created = await persistence.createSession({
+          userId,
+          title: question.slice(0, 200)
+        });
+        chatSessionId = created.id;
+      }
+      await persistence.appendMessage({
+        sessionId: chatSessionId,
+        role: "user",
+        question
+      });
+      const sessionId = hooks?.generateSessionId ? await hooks.generateSessionId({
+        scope: callerScope,
+        userId,
+        chatSessionId: incomingChatSessionId
+      }) : defaultGenerateSessionId2();
+      const scopeSummary = await scope.buildScopeSummary(callerScope);
+      const scopeLabel = await scope.resolveScopeLabel(callerScope);
+      const toolContext = {
+        scope: callerScope,
+        sessionId,
+        scopeSummary,
+        toolCallCount: 0
+      };
+      const systemBlocks = await tools.buildSystemBlocks(toolContext);
+      const provider = requestedModel ?? aiSettings.toolProvider;
+      if (!VALID_MODELS.has(provider)) {
+        return jsonError2(
+          400,
+          "INVALID_PROVIDER",
+          `Vercel chat only supports 'claude' or 'gemini'; got '${provider}'.`
+        );
+      }
+      const data = new StreamData();
+      let presentPayload = null;
+      let persistedError = null;
+      let sessionStarted = false;
+      try {
+        if (hooks?.onSessionStart) {
+          await hooks.onSessionStart({
+            scope: callerScope,
+            sessionId,
+            userId
+          });
+        }
+        sessionStarted = true;
+        const vercelTools = buildVercelTools(
+          tools.tools,
+          toolContext,
+          data,
+          (p) => {
+            presentPayload = p;
+          }
+        );
+        data.append({
+          type: "meta",
+          value: { chatSessionId, scopeLabel }
+        });
+        const system = systemBlocks.map((b) => b.text).join("\n\n");
+        const model = provider === "claude" ? createVertexAnthropic({
+          project: vertex.projectId,
+          location: vertex.defaultLocation,
+          googleAuthOptions: {}
+        })(vertex.modelIds.claude) : createVertex({
+          project: vertex.projectId,
+          location: aiSettings.gcpLocation,
+          googleAuthOptions: {}
+        })(vertex.modelIds.gemini);
+        const result = streamText({
+          model,
+          system,
+          messages: [{ role: "user", content: question }],
+          tools: vercelTools,
+          maxSteps: 12,
+          maxTokens: aiSettings.maxOutputTokens,
+          onFinish: async ({ text }) => {
+            try {
+              let blocks = presentPayload?.blocks ?? [];
+              const prose = {};
+              const trimmed = (text ?? "").trim();
+              if (presentPayload === null && trimmed) {
+                const topic = question.length > 80 ? question.slice(0, 77) + "..." : question;
+                const synthetic = {
+                  kind: "paragraph_brief",
+                  topic,
+                  key_facts: [trimmed]
+                };
+                blocks = [synthetic];
+                prose[0] = trimmed;
+                data.append({
+                  type: "block",
+                  value: { index: 0, ...synthetic }
+                });
+              } else if (text) {
+                const firstPbIdx = blocks.findIndex(
+                  (b) => b.kind === "paragraph_brief"
+                );
+                if (firstPbIdx >= 0) prose[firstPbIdx] = text;
+              }
+              await persistence.appendMessage({
+                sessionId: chatSessionId,
+                role: "assistant",
+                blocks: blocks.length ? blocks : null,
+                prose: Object.keys(prose).length ? prose : null,
+                errorJson: persistedError
+              });
+            } catch (err2) {
+              logger?.warn?.(
+                {
+                  chatSessionId,
+                  sessionId,
+                  err: err2.message
+                },
+                "[agent-vercel] failed to persist assistant turn"
+              );
+            } finally {
+              try {
+                await data.close();
+              } catch {
+              }
+            }
+          }
+        });
+        return result.toDataStreamResponse({ data });
+      } catch (e) {
+        const message = e.message ?? "Internal error";
+        persistedError = { code: "INTERNAL", message };
+        logger?.error?.(
+          { chatSessionId, sessionId, err: message },
+          "[agent-vercel] route errored"
+        );
+        try {
+          data.append({
+            type: "error",
+            value: { code: "INTERNAL", message }
+          });
+        } catch {
+        }
+        try {
+          await data.close();
+        } catch {
+        }
+        try {
+          await persistence.appendMessage({
+            sessionId: chatSessionId,
+            role: "assistant",
+            blocks: null,
+            prose: null,
+            errorJson: persistedError
+          });
+        } catch (err2) {
+          logger?.warn?.(
+            { chatSessionId, sessionId, err: err2.message },
+            "[agent-vercel] failed to persist error turn"
+          );
+        }
+        return jsonError2(500, "INTERNAL", message);
+      } finally {
+        if (hooks?.onSessionEnd) {
+          const cause = req.signal.aborted ? "abort" : persistedError ? "error" : "complete";
+          try {
+            await hooks.onSessionEnd({
+              scope: callerScope,
+              sessionId,
+              userId,
+              cause
+            });
+          } catch (err2) {
+            logger?.warn?.(
+              {
+                chatSessionId,
+                sessionId,
+                sessionStarted,
+                err: err2.message
+              },
+              "[agent-vercel] onSessionEnd hook failed"
+            );
+          }
+        }
+      }
+    }
+  };
+}
 // src/server/routes/chat-sessions.ts
 var DEFAULT_TITLE = "New chat";
@@ -1315,6 +1611,8 @@ function createChatSessionsRoutes(ctx) {
 // src/server/routes/admin-settings.ts
 var VALID_LOCATIONS = ["us-east5", "global"];
+var MIN_MAX_OUTPUT_TOKENS = 256;
+var MAX_MAX_OUTPUT_TOKENS = 64e3;
 function isStringRecord(v) {
   return typeof v === "object" && v !== null && !Array.isArray(v);
 }
@@ -1329,6 +1627,8 @@ function toWire(settings) {
     tool_provider: settings.toolProvider,
     gcp_location: settings.gcpLocation,
     chat_interface: settings.chatInterface,
+    max_output_tokens: settings.maxOutputTokens,
+    role_prompt: settings.rolePrompt,
     updated_at: settings.updatedAt ? settings.updatedAt.toISOString() : null,
     updated_by_user_id: settings.updatedByUserId
   };
@@ -1408,11 +1708,29 @@ function createAdminSettingsRoutes(ctx) {
       }
       patch.chatInterface = v;
     }
-    if (patch.toolProvider === void 0 && patch.gcpLocation === void 0 && patch.chatInterface === void 0) {
+    if ("max_output_tokens" in body) {
+      const v = body.max_output_tokens;
+      if (typeof v !== "number" || !Number.isInteger(v) || v < MIN_MAX_OUTPUT_TOKENS || v > MAX_MAX_OUTPUT_TOKENS) {
+        return jsonResponse({ error: "invalid_max_output_tokens" }, 400);
+      }
+      patch.maxOutputTokens = v;
+    }
+    if ("role_prompt" in body) {
+      const v = body.role_prompt;
+      if (v === null) {
+        patch.rolePrompt = null;
+      } else if (typeof v === "string") {
+        const trimmed = v.trim();
+        patch.rolePrompt = trimmed === "" ? null : trimmed;
+      } else {
+        return jsonResponse({ error: "invalid_role_prompt" }, 400);
+      }
+    }
+    if (patch.toolProvider === void 0 && patch.gcpLocation === void 0 && patch.chatInterface === void 0 && patch.maxOutputTokens === void 0 && !("rolePrompt" in patch)) {
       return jsonResponse(
         {
           error: "empty_patch",
-          message: "Body must set at least one of tool_provider, gcp_location, chat_interface."
+          message: "Body must set at least one of tool_provider, gcp_location, chat_interface, max_output_tokens, role_prompt."
         },
         400
       );
@@ -1437,16 +1755,27 @@ function configureAiChat(opts) {
   ];
   const getProvider = (id) => toolProviders2.find((p) => p.id === id) ?? getToolProvider(id);
   const chatInterfaces = opts.chatInterfaces ?? BUILTIN_CHAT_INTERFACE_IDS.map((id) => ({ id }));
-  const tools = opts.rolePrompt ? {
+  const staticRolePrompt = opts.rolePrompt;
+  const tools = {
     tools: opts.tools.tools,
     async buildSystemBlocks(ctx) {
       const inner = await opts.tools.buildSystemBlocks(ctx);
-      const rolePrompt = opts.rolePrompt;
-      const role = typeof rolePrompt === "function" ? await rolePrompt(ctx) : rolePrompt;
-      if (!role || !role.trim()) return inner;
+      let role = null;
+      try {
+        const settings = await opts.persistence.getAiSettings();
+        if (settings.rolePrompt && settings.rolePrompt.trim()) {
+          role = settings.rolePrompt;
+        }
+      } catch {
+      }
+      if (!role && staticRolePrompt) {
+        const resolved = typeof staticRolePrompt === "function" ? await staticRolePrompt(ctx) : staticRolePrompt;
+        if (resolved && resolved.trim()) role = resolved;
+      }
+      if (!role) return inner;
       return [{ text: role, cached: true }, ...inner];
     }
-  } : opts.tools;
+  };
   const runAgentBound = async ({
     question,
     ctx,
@@ -1495,6 +1824,15 @@ function configureAiChat(opts) {
     resolveNarratorId: opts.resolveNarratorId,
     hooks: opts.hooks
   });
+  const agentVercel = createAgentVercelRoutes({
+    persistence: opts.persistence,
+    auth: opts.auth,
+    scope: opts.scope,
+    tools,
+    vertex: opts.vertex,
+    logger: opts.logger,
+    hooks: opts.hooks
+  });
   const chatSessions = createChatSessionsRoutes({
     persistence: opts.persistence,
     auth: opts.auth,
@@ -1511,7 +1849,7 @@ function configureAiChat(opts) {
   });
   return {
     runAgent: runAgentBound,
-    routes: { agentCustom, chatSessions, adminSettings },
+    routes: { agentCustom, agentVercel, chatSessions, adminSettings },
     registries: { toolProviders: toolProviders2, chatInterfaces }
   };
 }