npm - @firstlovecenter/ai-chat - Versions diffs - 0.6.1 → 0.8.0 - Mend

@firstlovecenter/ai-chat 0.6.1 → 0.8.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (29) hide show

package/CHANGELOG.md +50 -0
package/dist/drizzle/index.cjs +14 -0
package/dist/drizzle/index.cjs.map +1 -1
package/dist/drizzle/index.d.cts +18 -1
package/dist/drizzle/index.d.ts +18 -1
package/dist/drizzle/index.js +14 -0
package/dist/drizzle/index.js.map +1 -1
package/dist/prisma/index.cjs +6 -0
package/dist/prisma/index.cjs.map +1 -1
package/dist/prisma/index.d.cts +4 -1
package/dist/prisma/index.d.ts +4 -1
package/dist/prisma/index.js +6 -0
package/dist/prisma/index.js.map +1 -1
package/dist/server/index.cjs +169 -12
package/dist/server/index.cjs.map +1 -1
package/dist/server/index.d.cts +27 -3
package/dist/server/index.d.ts +27 -3
package/dist/server/index.js +169 -12
package/dist/server/index.js.map +1 -1
package/dist/{types-CQntnyDJ.d.cts → types-BnwUkqKb.d.cts} +8 -0
package/dist/{types-CQntnyDJ.d.ts → types-BnwUkqKb.d.ts} +8 -0
package/dist/ui/index.cjs +137 -98
package/dist/ui/index.cjs.map +1 -1
package/dist/ui/index.d.cts +15 -2
package/dist/ui/index.d.ts +15 -2
package/dist/ui/index.js +137 -98
package/dist/ui/index.js.map +1 -1
package/package.json +1 -1
package/prisma/chat-models.prisma +5 -0

package/dist/server/index.d.cts CHANGED Viewed

@@ -1,5 +1,5 @@
-import { S as SystemBlock, T as ToolSchema, a as ToolContext, b as ToolDefinition, P as PresentPayload, c as PersistencePort, A as AuthPort, d as ScopePort, e as ToolsPort, V as VertexPort, L as LoggerPort } from '../types-CQntnyDJ.cjs';
-export { f as AiSettings, g as AiSettingsPatch, h as AppendMessageInput, i as AuthFail, j as AuthOk, k as AuthResult, B as Block, C as ChartSpec, l as ChatMessage, m as ChatMessageRole, n as ChatSession, o as CreateSessionInput, p as ListSessionsOpts, q as TERMINAL_TOOL_NAME, r as ToolResult, s as err, t as ok } from '../types-CQntnyDJ.cjs';
+import { S as SystemBlock, T as ToolSchema, a as ToolContext, b as ToolDefinition, P as PresentPayload, c as PersistencePort, A as AuthPort, d as ScopePort, e as ToolsPort, V as VertexPort, L as LoggerPort } from '../types-BnwUkqKb.cjs';
+export { f as AiSettings, g as AiSettingsPatch, h as AppendMessageInput, i as AuthFail, j as AuthOk, k as AuthResult, B as Block, C as ChartSpec, l as ChatMessage, m as ChatMessageRole, n as ChatSession, o as CreateSessionInput, p as ListSessionsOpts, q as TERMINAL_TOOL_NAME, r as ToolResult, s as err, t as ok } from '../types-BnwUkqKb.cjs';
 import { GoogleAuth } from 'google-auth-library';
 export { GoogleAuth } from 'google-auth-library';
 import 'zod';
@@ -55,6 +55,14 @@ type NormalizedToolResult = {
 type NormalizedMessage = {
     role: 'user';
     text: string;
+    /**
+     * Cache hint: when true, the producing route is asking the provider
+     * to mark this message's content with a cache breakpoint so the
+     * full prefix becomes cacheable on a subsequent request. Anthropic
+     * applies `cache_control: ephemeral`; Vertex Gemini ignores the
+     * flag (its prefix cache works automatically).
+     */
+    cached?: boolean;
 } | {
     role: 'assistant';
     /** Free text the model emitted (zero-or-more text blocks joined as-is). */
@@ -69,6 +77,8 @@ type NormalizedMessage = {
      * thought_signature`. Other adapters can ignore.
      */
     providerData?: unknown;
+    /** See `user.cached`. */
+    cached?: boolean;
 } | {
     role: 'tool';
     results: NormalizedToolResult[];
@@ -155,6 +165,16 @@ type AgentInput<S = unknown> = {
     systemBlocks: SystemBlock[];
     /** Constructed ToolProvider — caller resolves the right one via toolProviders[id].createProvider({...}). */
     provider: ToolProvider;
+    /**
+     * Conversation history to seed the prompt with, in chronological order.
+     * Hosts pass this to give the model memory across turns in a chat session
+     * (so a follow-up like "summarize that" resolves the antecedent). The
+     * route handler is responsible for fetching prior `chat_messages` and
+     * normalising them; see `historyToNormalizedMessages` in `./history`.
+     * Tool-call provenance is intentionally not replayed — assistant turns
+     * here should be plain text only.
+     */
+    priorMessages?: NormalizedMessage[];
     /** Optional caps. Default both. */
     maxToolTurns?: number;
     maxOutputTokens?: number;
@@ -398,7 +418,7 @@ declare function createChatSessionsRoutes<S>(ctx: ChatSessionsRouteCtx<S>): {
 /**
  * `/api/admin/ai-settings` route factory — global AI configuration (super_admin only).
  *
- * Five patchable fields on the singleton settings row:
+ * Six patchable fields on the singleton settings row:
  *   - `tool_provider` — vendor that drives the agent tool loop. Validated
  *     against the registered `toolProviders` registry passed in via ctx.
  *   - `gcp_location` — the Vertex region every provider call hits. Stays
@@ -417,6 +437,10 @@ declare function createChatSessionsRoutes<S>(ctx: ChatSessionsRouteCtx<S>): {
  *     `configureAiChat({ rolePrompt })` fallback; we canonicalise an empty/
  *     whitespace-only string to `null` on write so the "no override" state has
  *     a single representation in storage.
+ *   - `gcp_project_id` — admin-editable GCP project override. Empty string and
+ *     the explicit JSON `null` both clear the override back to the host's
+ *     static `VertexPort.projectId`. Validated against GCP's project-id
+ *     format (`[a-z][-a-z0-9]{4,28}[a-z0-9]`) when non-null.
  *
  * Wire format is snake_case to preserve byte-for-byte parity with the
  * host route the package replaces — existing host UIs keep working

package/dist/server/index.d.ts CHANGED Viewed

@@ -1,5 +1,5 @@
-import { S as SystemBlock, T as ToolSchema, a as ToolContext, b as ToolDefinition, P as PresentPayload, c as PersistencePort, A as AuthPort, d as ScopePort, e as ToolsPort, V as VertexPort, L as LoggerPort } from '../types-CQntnyDJ.js';
-export { f as AiSettings, g as AiSettingsPatch, h as AppendMessageInput, i as AuthFail, j as AuthOk, k as AuthResult, B as Block, C as ChartSpec, l as ChatMessage, m as ChatMessageRole, n as ChatSession, o as CreateSessionInput, p as ListSessionsOpts, q as TERMINAL_TOOL_NAME, r as ToolResult, s as err, t as ok } from '../types-CQntnyDJ.js';
+import { S as SystemBlock, T as ToolSchema, a as ToolContext, b as ToolDefinition, P as PresentPayload, c as PersistencePort, A as AuthPort, d as ScopePort, e as ToolsPort, V as VertexPort, L as LoggerPort } from '../types-BnwUkqKb.js';
+export { f as AiSettings, g as AiSettingsPatch, h as AppendMessageInput, i as AuthFail, j as AuthOk, k as AuthResult, B as Block, C as ChartSpec, l as ChatMessage, m as ChatMessageRole, n as ChatSession, o as CreateSessionInput, p as ListSessionsOpts, q as TERMINAL_TOOL_NAME, r as ToolResult, s as err, t as ok } from '../types-BnwUkqKb.js';
 import { GoogleAuth } from 'google-auth-library';
 export { GoogleAuth } from 'google-auth-library';
 import 'zod';
@@ -55,6 +55,14 @@ type NormalizedToolResult = {
 type NormalizedMessage = {
     role: 'user';
     text: string;
+    /**
+     * Cache hint: when true, the producing route is asking the provider
+     * to mark this message's content with a cache breakpoint so the
+     * full prefix becomes cacheable on a subsequent request. Anthropic
+     * applies `cache_control: ephemeral`; Vertex Gemini ignores the
+     * flag (its prefix cache works automatically).
+     */
+    cached?: boolean;
 } | {
     role: 'assistant';
     /** Free text the model emitted (zero-or-more text blocks joined as-is). */
@@ -69,6 +77,8 @@ type NormalizedMessage = {
      * thought_signature`. Other adapters can ignore.
      */
     providerData?: unknown;
+    /** See `user.cached`. */
+    cached?: boolean;
 } | {
     role: 'tool';
     results: NormalizedToolResult[];
@@ -155,6 +165,16 @@ type AgentInput<S = unknown> = {
     systemBlocks: SystemBlock[];
     /** Constructed ToolProvider — caller resolves the right one via toolProviders[id].createProvider({...}). */
     provider: ToolProvider;
+    /**
+     * Conversation history to seed the prompt with, in chronological order.
+     * Hosts pass this to give the model memory across turns in a chat session
+     * (so a follow-up like "summarize that" resolves the antecedent). The
+     * route handler is responsible for fetching prior `chat_messages` and
+     * normalising them; see `historyToNormalizedMessages` in `./history`.
+     * Tool-call provenance is intentionally not replayed — assistant turns
+     * here should be plain text only.
+     */
+    priorMessages?: NormalizedMessage[];
     /** Optional caps. Default both. */
     maxToolTurns?: number;
     maxOutputTokens?: number;
@@ -398,7 +418,7 @@ declare function createChatSessionsRoutes<S>(ctx: ChatSessionsRouteCtx<S>): {
 /**
  * `/api/admin/ai-settings` route factory — global AI configuration (super_admin only).
  *
- * Five patchable fields on the singleton settings row:
+ * Six patchable fields on the singleton settings row:
  *   - `tool_provider` — vendor that drives the agent tool loop. Validated
  *     against the registered `toolProviders` registry passed in via ctx.
  *   - `gcp_location` — the Vertex region every provider call hits. Stays
@@ -417,6 +437,10 @@ declare function createChatSessionsRoutes<S>(ctx: ChatSessionsRouteCtx<S>): {
  *     `configureAiChat({ rolePrompt })` fallback; we canonicalise an empty/
  *     whitespace-only string to `null` on write so the "no override" state has
  *     a single representation in storage.
+ *   - `gcp_project_id` — admin-editable GCP project override. Empty string and
+ *     the explicit JSON `null` both clear the override back to the host's
+ *     static `VertexPort.projectId`. Validated against GCP's project-id
+ *     format (`[a-z][-a-z0-9]{4,28}[a-z0-9]`) when non-null.
  *
  * Wire format is snake_case to preserve byte-for-byte parity with the
  * host route the package replaces — existing host UIs keep working

package/dist/server/index.js CHANGED Viewed

@@ -23,7 +23,10 @@ async function runAgent(input) {
   const maxOutputTokens = input.maxOutputTokens ?? DEFAULT_MAX_OUTPUT_TOKENS;
   const transcript = [];
   transcript.push({ kind: "user", text: input.question });
-  const messages = [{ role: "user", text: input.question }];
+  const messages = [
+    ...input.priorMessages ?? [],
+    { role: "user", text: input.question }
+  ];
   const system = input.systemBlocks;
   const toolSchemas = Object.values(input.tools).map((t) => t.schema);
   let toolCallCount = 0;
@@ -216,11 +219,28 @@ function toAnthropicMessages(messages) {
   const out = [];
   for (const msg of messages) {
     if (msg.role === "user") {
-      out.push({ role: "user", content: msg.text });
+      if (msg.cached) {
+        out.push({
+          role: "user",
+          content: [
+            {
+              type: "text",
+              text: msg.text,
+              cache_control: { type: "ephemeral" }
+            }
+          ]
+        });
+      } else {
+        out.push({ role: "user", content: msg.text });
+      }
     } else if (msg.role === "assistant") {
       const blocks = [];
       if (msg.text) {
-        blocks.push({ type: "text", text: msg.text });
+        const textBlock = { type: "text", text: msg.text };
+        if (msg.cached && msg.toolCalls.length === 0) {
+          textBlock.cache_control = { type: "ephemeral" };
+        }
+        blocks.push(textBlock);
       }
       for (const tc of msg.toolCalls) {
         blocks.push({
@@ -572,6 +592,87 @@ var toolProviders = [
 function getToolProvider(id) { // Looks up a registered tool provider by its `id`.
   return toolProviders.find((p) => p.id === id); // `find` yields undefined when no entry matches
 }
+// src/server/history.ts
+var DEFAULT_MAX_HISTORY_PAIRS = 20; // fallback for `opts.maxPairs` in historyToNormalizedMessages
+var DEFAULT_MAX_TEXT_CHARS = 4e3; // fallback for `opts.maxTextChars` (4000) in historyToNormalizedMessages
+function historyToNormalizedMessages(rows, opts = {}) { // Converts stored chat rows into a flat user/assistant message list, in row order, for use as prior history.
+  const maxPairs = opts.maxPairs ?? DEFAULT_MAX_HISTORY_PAIRS; // most-recent pairs to keep; a value <= 0 keeps every pair (see the slice below)
+  const maxTextChars = opts.maxTextChars ?? DEFAULT_MAX_TEXT_CHARS; // per-message cap handed to truncate()
+  const pairs = [];
+  let i = 0;
+  while (i < rows.length) {
+    const row = rows[i];
+    if (row.role !== "user" || !row.question) { // only a user row with a non-empty question can open a pair
+      i += 1;
+      continue;
+    }
+    const next = rows[i + 1];
+    if (next?.role !== "assistant") { // a user row not immediately followed by an assistant row is dropped
+      i += 1;
+      continue;
+    }
+    const assistantText = truncate(
+      assistantMessageToText(next),
+      maxTextChars
+    );
+    if (assistantText) { // an empty reply (e.g. a row with errorJson) drops the whole pair, question included
+      pairs.push([
+        { role: "user", text: truncate(row.question, maxTextChars) },
+        { role: "assistant", text: assistantText, toolCalls: [] } // tool calls are never replayed; always an empty list
+      ]);
+    }
+    i += 2; // both rows of the candidate pair are consumed whether or not it was kept
+  }
+  const kept = maxPairs > 0 ? pairs.slice(-maxPairs) : pairs;
+  return kept.flat(); // flatten the [user, assistant] pairs into one array
+}
+function truncate(text, max) { // Caps `text` at `max` UTF-16 code units; a non-positive `max` disables the cap.
+  if (max <= 0 || text.length <= max) return text;
+  return text.slice(0, max); // NOTE(review): slicing by code unit can split a surrogate pair at the cut — confirm this is acceptable
+}
+function assistantMessageToText(row) { // Derives plain text for a stored assistant row; returns "" when the row carries an error.
+  if (row.errorJson) return ""; // any truthy errorJson suppresses the row's text entirely
+  const proseText = proseToText(row.prose);
+  if (proseText) return proseText; // prose wins; blocks are only the fallback
+  const blockText = blocksToText(row.blocks);
+  return blockText;
+}
+function proseToText(prose) { // Joins the string values of a numerically keyed object in ascending key order, separated by blank lines.
+  if (!prose || typeof prose !== "object") return ""; // null, undefined and primitives yield no text
+  const entries = Object.entries(prose).map(([k, v]) => [Number(k), typeof v === "string" ? v : ""]).filter(([k, v]) => Number.isFinite(k) && v.length > 0).sort(([a], [b]) => a - b); // non-string or empty values and keys that do not convert to a finite number are discarded
+  return entries.map(([, v]) => v).join("\n\n").trim();
+}
+function blocksToText(blocks) { // Flattens an array of presentation blocks into plain text; block kinds not listed below contribute nothing.
+  if (!Array.isArray(blocks)) return "";
+  const parts = [];
+  for (const raw of blocks) {
+    if (!raw || typeof raw !== "object") continue; // skip null and primitive entries
+    const b = raw;
+    switch (b.kind) {
+      case "paragraph_brief": {
+        const facts = (b.key_facts ?? []).filter((f) => f && f.trim()); // NOTE(review): assumes key_facts is an array of strings; other stored shapes would throw here — confirm against the block schema
+        if (b.topic) parts.push(b.topic);
+        if (facts.length) parts.push(facts.join("\n"));
+        break;
+      }
+      case "list": {
+        const items = (b.items ?? []).filter((s) => s && s.trim()); // NOTE(review): same assumption as key_facts — items must be an array of strings
+        if (b.title) parts.push(b.title);
+        if (items.length) parts.push(items.map((s) => `- ${s}`).join("\n")); // rendered as a dash-prefixed list
+        break;
+      }
+      case "chart":
+      case "table":
+        if (b.title) parts.push(`[${b.title}]`); // only a bracketed title is emitted; no other chart/table fields are read
+        break;
+      case "callout":
+        if (b.text) parts.push(b.text);
+        break;
+    }
+  }
+  return parts.join("\n\n").trim();
+}
 function vertexHost2(location) { // Builds an aiplatform.googleapis.com hostname for the given location.
   return location === "global" ? "aiplatform.googleapis.com" : `${location}-aiplatform.googleapis.com`; // "global" maps to the unprefixed host; any other location becomes a hostname prefix
 }
@@ -912,13 +1013,25 @@ function createAgentCustomRoutes(ctx) {
       const rawChatSessionId = body?.chatSessionId;
       const incomingChatSessionId = typeof rawChatSessionId === "number" && Number.isInteger(rawChatSessionId) ? rawChatSessionId : null;
       const aiSettings = await persistence.getAiSettings();
+      const effectiveProjectId = aiSettings.gcpProjectId ?? vertex.projectId;
       let chatSessionId;
+      let priorMessages = [];
       if (incomingChatSessionId !== null) {
         const owned = await persistence.getSession(incomingChatSessionId, userId);
         if (!owned) {
           return jsonError(404, "NOT_FOUND", "Chat session not found.");
         }
         chatSessionId = owned.id;
+        const stored = await persistence.listMessagesForSession(chatSessionId, userId);
+        priorMessages = historyToNormalizedMessages(stored);
+        if (priorMessages.length > 0) {
+          const last = priorMessages[priorMessages.length - 1];
+          if (last.role === "assistant" && last.toolCalls.length === 0) {
+            priorMessages[priorMessages.length - 1] = { ...last, cached: true };
+          } else if (last.role === "user") {
+            priorMessages[priorMessages.length - 1] = { ...last, cached: true };
+          }
+        }
       } else {
         const created = await persistence.createSession({
           userId,
@@ -955,7 +1068,7 @@ function createAgentCustomRoutes(ctx) {
       }
       const provider = def.createProvider({
         auth: vertex.auth,
-        projectId: vertex.projectId,
+        projectId: effectiveProjectId,
         defaultLocation: vertex.defaultLocation,
         modelIds: vertex.modelIds,
         location: aiSettings.gcpLocation
@@ -1006,6 +1119,7 @@ data: ${JSON.stringify(data)}
             send("meta", { chatSessionId, scopeLabel });
             const agentResult = await runAgent({
               question,
+              priorMessages,
               ctx: toolContext,
               tools: tools.tools,
               systemBlocks,
@@ -1033,7 +1147,7 @@ data: ${JSON.stringify(data)}
                   }
                   for await (const token of narratorFn({
                     auth: vertex.auth,
-                    projectId: vertex.projectId,
+                    projectId: effectiveProjectId,
                     location: aiSettings.gcpLocation,
                     modelId: narratorModelId,
                     maxTokens: aiSettings.maxOutputTokens,
@@ -1224,7 +1338,17 @@ function createAgentVercelRoutes(ctx) {
         if (short) return short;
       }
       const body = await req.json().catch(() => null);
-      const question = typeof body?.question === "string" ? body.question.trim() : "";
+      let question = typeof body?.question === "string" ? body.question.trim() : "";
+      if (!question && Array.isArray(body?.messages)) {
+        const msgs = body.messages;
+        for (let i = msgs.length - 1; i >= 0; i -= 1) {
+          const m = msgs[i];
+          if (m && m.role === "user" && typeof m.content === "string") {
+            question = m.content.trim();
+            break;
+          }
+        }
+      }
       if (!question) {
         return jsonError2(
           400,
@@ -1237,7 +1361,9 @@ function createAgentVercelRoutes(ctx) {
       const rawModel = body?.model;
       const requestedModel = typeof rawModel === "string" && VALID_MODELS.has(rawModel) ? rawModel : null;
       const aiSettings = await persistence.getAiSettings();
+      const effectiveProjectId = aiSettings.gcpProjectId ?? vertex.projectId;
       let chatSessionId;
+      let priorMessages = [];
       if (incomingChatSessionId !== null) {
         const owned = await persistence.getSession(
           incomingChatSessionId,
@@ -1247,6 +1373,11 @@ function createAgentVercelRoutes(ctx) {
           return jsonError2(404, "NOT_FOUND", "Chat session not found.");
         }
         chatSessionId = owned.id;
+        const stored = await persistence.listMessagesForSession(
+          chatSessionId,
+          userId
+        );
+        priorMessages = historyToNormalizedMessages(stored);
       } else {
         const created = await persistence.createSession({
           userId,
@@ -1308,18 +1439,24 @@ function createAgentVercelRoutes(ctx) {
         });
         const system = systemBlocks.map((b) => b.text).join("\n\n");
         const model = provider === "claude" ? createVertexAnthropic({
-          project: vertex.projectId,
+          project: effectiveProjectId,
           location: vertex.defaultLocation,
           googleAuthOptions: {}
         })(vertex.modelIds.claude) : createVertex({
-          project: vertex.projectId,
+          project: effectiveProjectId,
           location: aiSettings.gcpLocation,
           googleAuthOptions: {}
         })(vertex.modelIds.gemini);
+        const priorCoreMessages = priorMessages.filter(
+          (m) => m.role === "user" || m.role === "assistant"
+        ).map((m) => ({ role: m.role, content: m.text }));
         const result = streamText({
           model,
           system,
-          messages: [{ role: "user", content: question }],
+          messages: [
+            ...priorCoreMessages,
+            { role: "user", content: question }
+          ],
           tools: vercelTools,
           maxSteps: 12,
           maxTokens: aiSettings.maxOutputTokens,
@@ -1613,6 +1750,7 @@ function createChatSessionsRoutes(ctx) {
 var VALID_LOCATIONS = ["us-east5", "global"];
 var MIN_MAX_OUTPUT_TOKENS = 256;
 var MAX_MAX_OUTPUT_TOKENS = 64e3;
+var GCP_PROJECT_ID_REGEX = /^[a-z][-a-z0-9]{4,28}[a-z0-9]$/; // lowercase letter first, then 4-28 of [-a-z0-9], ending in a lowercase letter or digit: 6-30 characters in total
 function isStringRecord(v) { // True for any non-null, non-array object.
   return typeof v === "object" && v !== null && !Array.isArray(v); // NOTE(review): despite the name, neither key nor value types are checked here
 }
@@ -1629,6 +1767,7 @@ function toWire(settings) {
     chat_interface: settings.chatInterface,
     max_output_tokens: settings.maxOutputTokens,
     role_prompt: settings.rolePrompt,
+    gcp_project_id: settings.gcpProjectId,
     updated_at: settings.updatedAt ? settings.updatedAt.toISOString() : null,
     updated_by_user_id: settings.updatedByUserId
   };
@@ -1726,11 +1865,28 @@ function createAdminSettingsRoutes(ctx) {
         return jsonResponse({ error: "invalid_role_prompt" }, 400);
       }
     }
-    if (patch.toolProvider === void 0 && patch.gcpLocation === void 0 && patch.chatInterface === void 0 && patch.maxOutputTokens === void 0 && !("rolePrompt" in patch)) {
+    if ("gcp_project_id" in body) {
+      const v = body.gcp_project_id;
+      if (v === null) {
+        patch.gcpProjectId = null;
+      } else if (typeof v === "string") {
+        const trimmed = v.trim();
+        if (trimmed === "") {
+          patch.gcpProjectId = null;
+        } else if (trimmed.length > 64 || !GCP_PROJECT_ID_REGEX.test(trimmed)) {
+          return jsonResponse({ error: "invalid_gcp_project_id" }, 400);
+        } else {
+          patch.gcpProjectId = trimmed;
+        }
+      } else {
+        return jsonResponse({ error: "invalid_gcp_project_id" }, 400);
+      }
+    }
+    if (patch.toolProvider === void 0 && patch.gcpLocation === void 0 && patch.chatInterface === void 0 && patch.maxOutputTokens === void 0 && !("rolePrompt" in patch) && !("gcpProjectId" in patch)) {
       return jsonResponse(
         {
           error: "empty_patch",
-          message: "Body must set at least one of tool_provider, gcp_location, chat_interface, max_output_tokens, role_prompt."
+          message: "Body must set at least one of tool_provider, gcp_location, chat_interface, max_output_tokens, role_prompt, gcp_project_id."
         },
         400
       );
@@ -1791,9 +1947,10 @@ function configureAiChat(opts) {
         `Unknown tool provider '${providerId ?? settings.toolProvider}'. Registered: ${toolProviders2.map((p) => p.id).join(", ")}.`
       );
     }
+    const effectiveProjectId = settings.gcpProjectId ?? opts.vertex.projectId;
     const provider = def.createProvider({
       auth: opts.vertex.auth,
-      projectId: opts.vertex.projectId,
+      projectId: effectiveProjectId,
       defaultLocation: opts.vertex.defaultLocation,
       modelIds: opts.vertex.modelIds,
       location: location ?? settings.gcpLocation