npm - @juspay/neurolink - Versions diffs - 9.63.1 → 9.64.0 - Mend

@juspay/neurolink 9.63.1 → 9.64.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (77) hide show

package/CHANGELOG.md +6 -0
package/dist/adapters/video/vertexVideoHandler.js +9 -2
package/dist/browser/neurolink.min.js +1014 -1018
package/dist/cli/factories/commandFactory.d.ts +14 -0
package/dist/cli/factories/commandFactory.js +50 -25
package/dist/cli/loop/optionsSchema.d.ts +1 -1
package/dist/cli/loop/optionsSchema.js +12 -0
package/dist/core/baseProvider.d.ts +1 -1
package/dist/core/modules/MessageBuilder.js +20 -0
package/dist/factories/providerRegistry.js +5 -1
package/dist/lib/adapters/video/vertexVideoHandler.js +9 -2
package/dist/lib/core/baseProvider.d.ts +1 -1
package/dist/lib/core/modules/MessageBuilder.js +20 -0
package/dist/lib/factories/providerRegistry.js +5 -1
package/dist/lib/memory/hippocampusInitializer.d.ts +2 -2
package/dist/lib/memory/hippocampusInitializer.js +32 -2
package/dist/lib/middleware/builtin/lifecycle.js +19 -48
package/dist/lib/neurolink.js +49 -2
package/dist/lib/providers/googleAiStudio.d.ts +11 -3
package/dist/lib/providers/googleAiStudio.js +292 -339
package/dist/lib/providers/googleNativeGemini3.d.ts +83 -1
package/dist/lib/providers/googleNativeGemini3.js +208 -4
package/dist/lib/providers/googleVertex.d.ts +116 -129
package/dist/lib/providers/googleVertex.js +2826 -1968
package/dist/lib/providers/openRouter.js +7 -3
package/dist/lib/types/aliases.d.ts +14 -0
package/dist/lib/types/common.d.ts +0 -3
package/dist/lib/types/conversation.d.ts +10 -3
package/dist/lib/types/generate.d.ts +14 -0
package/dist/lib/types/index.d.ts +1 -0
package/dist/lib/types/index.js +1 -0
package/dist/lib/types/memory.d.ts +96 -0
package/dist/lib/types/memory.js +23 -0
package/dist/lib/types/providers.d.ts +140 -2
package/dist/lib/types/stream.d.ts +6 -0
package/dist/lib/utils/lifecycleCallbacks.d.ts +13 -0
package/dist/lib/utils/lifecycleCallbacks.js +44 -0
package/dist/lib/utils/messageBuilder.d.ts +10 -0
package/dist/lib/utils/messageBuilder.js +40 -5
package/dist/lib/utils/modelDetection.d.ts +11 -0
package/dist/lib/utils/modelDetection.js +27 -0
package/dist/lib/utils/providerHealth.js +7 -7
package/dist/lib/utils/schemaConversion.d.ts +1 -1
package/dist/lib/utils/schemaConversion.js +59 -4
package/dist/lib/utils/tokenLimits.js +23 -32
package/dist/memory/hippocampusInitializer.d.ts +2 -2
package/dist/memory/hippocampusInitializer.js +32 -2
package/dist/middleware/builtin/lifecycle.js +19 -48
package/dist/neurolink.js +49 -2
package/dist/providers/googleAiStudio.d.ts +11 -3
package/dist/providers/googleAiStudio.js +291 -339
package/dist/providers/googleNativeGemini3.d.ts +83 -1
package/dist/providers/googleNativeGemini3.js +208 -4
package/dist/providers/googleVertex.d.ts +116 -129
package/dist/providers/googleVertex.js +2824 -1967
package/dist/providers/openRouter.js +7 -3
package/dist/types/aliases.d.ts +14 -0
package/dist/types/common.d.ts +0 -3
package/dist/types/conversation.d.ts +10 -3
package/dist/types/generate.d.ts +14 -0
package/dist/types/index.d.ts +1 -0
package/dist/types/index.js +1 -0
package/dist/types/memory.d.ts +96 -0
package/dist/types/memory.js +22 -0
package/dist/types/providers.d.ts +140 -2
package/dist/types/stream.d.ts +6 -0
package/dist/utils/lifecycleCallbacks.d.ts +13 -0
package/dist/utils/lifecycleCallbacks.js +43 -0
package/dist/utils/messageBuilder.d.ts +10 -0
package/dist/utils/messageBuilder.js +40 -5
package/dist/utils/modelDetection.d.ts +11 -0
package/dist/utils/modelDetection.js +27 -0
package/dist/utils/providerHealth.js +7 -7
package/dist/utils/schemaConversion.d.ts +1 -1
package/dist/utils/schemaConversion.js +59 -4
package/dist/utils/tokenLimits.js +23 -32
package/package.json +11 -4

package/dist/lib/providers/googleNativeGemini3.d.ts CHANGED Viewed

@@ -9,7 +9,7 @@
  * providers so they can share a single implementation.
  */
 import { type Tool } from "ai";
-import type { ThinkingConfig, CollectedChunkResult, NativeFunctionCall, NativeFunctionResponse, NativeToolDeclarationsResult, NativeToolsConfig, TextChannel } from "../types/index.js";
+import type { ThinkingConfig, CollectedChunkResult, NativeFunctionCall, NativeFunctionResponse, NativeToolDeclarationsResult, NativeToolsConfig, TextChannel, VertexNativePart, GeminiMultimodalInput } from "../types/index.js";
 /**
  * Sanitize a JSON Schema for Gemini's proto-based API.
  *
@@ -48,12 +48,30 @@ export declare function normalizeToolsForJsonSchemaProvider(tools: Record<string
 export declare function buildNativeToolDeclarations(tools: Record<string, Tool>): NativeToolDeclarationsResult;
 /**
  * Build the native @google/genai config object shared by stream and generate.
+ *
+ * Caller is responsible for the tools-vs-JSON conflict resolution: Gemini's
+ * function calling cannot be combined with `responseMimeType:
+ * "application/json"`, and `responseSchema` requires that mime type. So
+ * when tools are active, callers must NOT pass `wantsJsonOutput`/
+ * `responseSchema` here; when JSON/schema output is requested, callers
+ * must omit `toolsConfig`. The AI Studio path enforces this by forcing
+ * `disableTools: true` whenever JSON/schema output is requested. If both are supplied anyway, the JSON/schema options are not applied: the implementation only writes `responseMimeType` / `responseSchema` when `toolsConfig` is falsy.
  */
 export declare function buildNativeConfig(options: {
     temperature?: number;
     maxTokens?: number;
     systemPrompt?: string;
     thinkingConfig?: ThinkingConfig;
+    /**
+     * When true (and `toolsConfig` is undefined), set
+     * `responseMimeType: "application/json"` to enforce native JSON output.
+     */
+    wantsJsonOutput?: boolean;
+    /**
+     * Pre-converted JSON Schema for native `responseSchema`. Implies
+     * `wantsJsonOutput`. Ignored if `toolsConfig` is present.
+     */
+    responseSchema?: Record<string, unknown>;
 }, toolsConfig?: NativeToolsConfig): Record<string, unknown>; // toolsConfig: when provided, the two JSON/schema options above have no effect
 /**
  * Compute a safe, clamped maxSteps value.
@@ -142,3 +160,67 @@ export declare function pushModelResponseToHistory(currentContents: Array<{
     role: string;
     parts: unknown[];
 }>, rawResponseParts: unknown[], stepFunctionCalls: NativeFunctionCall[]): void;
+/**
+ * Convert a Zod schema (or AI SDK `jsonSchema()` wrapper) into the shape
+ * `@google/genai` accepts as `responseSchema`. Mirrors the inline pipeline
+ * the Vertex Gemini paths already use:
+ *
+ *   convertZodToJsonSchema → inlineJsonSchema → strip `$schema` → ensure
+ *   every nested schema has a `type` (Vertex/Gemini reject schemas missing
+ *   that field, even on nested objects).
+ *
+ * Lives here so the AI Studio and Vertex paths can share the same
+ * sanitization without duplicating the schema-conversion churn. The conversion step requests the `"openApi3"` target, and the returned object is whatever `ensureNestedSchemaTypes` yields for the inlined schema.
+ */
+export declare function buildGeminiResponseSchema(schema: unknown): Record<string, unknown>;
+/**
+ * Map NeuroLink ChatMessage[] history into the @google/genai content format
+ * and push the entries onto a contents array. Despite the "prepend" name, entries are appended to the end of `contents`, which is mutated in place; nothing is returned.
+ *
+ * Used by the native Vertex Gemini and Google AI Studio paths to honor
+ * `options.conversationMessages` so multi-turn conversations (memory, loop
+ * REPL, agent flows) actually carry prior turns into the request.
+ *
+ * Behavior notes:
+ *  - Only `user` and `assistant` roles are forwarded; system messages are
+ *    expected to be wired via `systemInstruction`, and tool-call /
+ *    tool-result roles only appear inside intra-call tool loops which build
+ *    their own model/function entries. `assistant` entries are emitted with role `model`.
+ *  - String content is wrapped as a single `{ text }` part. Empty strings
+ *    are skipped to avoid sending empty parts that some Gemini regions
+ *    reject. Content that is not a string at runtime is treated like an empty string and skipped too.
+ *  - The current user input should be appended AFTER calling this helper
+ *    so the prior turns appear first in chronological order.
+ */
+export declare function prependConversationMessages(contents: Array<{
+    role: string;
+    parts: unknown[];
+}>, conversationMessages?: Array<{ // optional: an undefined or empty history is a no-op
+    role: string;
+    content: string;
+}>): void;
+/**
+ * Build the `parts` array for the current user turn of a Gemini native
+ * `generateContent` request, including inline image + PDF blobs. The resolved array always starts with the text part (`textOverride` when it is a string, otherwise `input.text`, otherwise an empty string), followed by one `inlineData` part per PDF and then one per image that could be loaded. `logPrefix` is prepended to the log messages.
+ *
+ * Both providers that hit the native `@google/genai` SDK — `GoogleVertex`
+ * and `GoogleAIStudio` — need this. The previous AI Studio code only
+ * pushed a single `{ text }` part, which silently dropped `input.images`
+ * and `input.pdfFiles` on the floor: the model received text only and
+ * legitimately reported "no image attached". Extracting this from the
+ * Vertex copy keeps both providers on one definition.
+ *
+ * Accepted shapes per element (mirroring the runtime behaviour the Vertex
+ * code already supported). The full list applies to `input.images`; `input.pdfFiles` entries only take the `Buffer`, existing-path and raw-base64 routes and are always tagged `application/pdf`. An image entry may also be a non-Buffer object, in which case its `data` property is used:
+ *   - `Buffer` → used as-is
+ *   - local file path → read via `readFileSync`, MIME guessed from extension (checked first, via `existsSync`)
+ *   - `data:<mime>;base64,...` URL → mime parsed, data base64-decoded (images only)
+ *   - `http(s)://...` URL → fetched, mime from `content-type` when it starts with `image/` (images only)
+ *   - any other string → assumed to be a base64-encoded payload
+ *
+ * Image MIME guessing is conservative — only known extensions override the
+ * default `image/jpeg`. Fetch failures are logged and the offending entry
+ * is skipped rather than aborting the entire request, matching prior
+ * Vertex behaviour. A `data:` string that does not match the expected pattern is skipped without a log entry, and `readFileSync` errors are not caught by this helper.
+ */
+export declare function buildUserPartsWithMultimodal(input: GeminiMultimodalInput | undefined, textOverride?: string, logPrefix?: string): Promise<VertexNativePart[]>;

package/dist/lib/providers/googleNativeGemini3.js CHANGED Viewed

@@ -9,10 +9,12 @@
  * providers so they can share a single implementation.
  */
 import { randomUUID } from "node:crypto";
+import { existsSync, readFileSync } from "node:fs";
+import { extname } from "node:path";
 import { jsonSchema as aiJsonSchema, tool as createAISDKTool, } from "ai";
 import { DEFAULT_MAX_STEPS, DEFAULT_TOOL_MAX_RETRIES, } from "../core/constants.js";
 import { logger } from "../utils/logger.js";
-import { convertZodToJsonSchema, inlineJsonSchema, isZodSchema, normalizeJsonSchemaObject, } from "../utils/schemaConversion.js";
+import { convertZodToJsonSchema, ensureNestedSchemaTypes, inlineJsonSchema, isZodSchema, normalizeJsonSchemaObject, } from "../utils/schemaConversion.js";
 import { createNativeThinkingConfig } from "../utils/thinkingConfig.js";
 // ── Functions ──
 /**
@@ -125,7 +127,7 @@ export function sanitizeToolsForGemini(tools) {
                 typeof params === "object" &&
                 "_def" in params &&
                 typeof params.parse === "function") {
-                const rawJsonSchema = convertZodToJsonSchema(params);
+                const rawJsonSchema = convertZodToJsonSchema(params, "openApi3");
                 const inlined = inlineJsonSchema(rawJsonSchema);
                 // Gemini sanitization strips Zod-only features not supported by the Gemini API:
                 // union types (anyOf/oneOf) are collapsed to string, default values and
@@ -171,7 +173,7 @@ export function normalizeToolsForJsonSchemaProvider(tools) {
         const toolParams = legacyTool.parameters || tool.inputSchema;
         let rawSchema;
         if (isZodSchema(toolParams)) {
-            rawSchema = convertZodToJsonSchema(toolParams);
+            rawSchema = convertZodToJsonSchema(toolParams, "openApi3");
         }
         else if (toolParams && typeof toolParams === "object") {
             rawSchema = toolParams;
@@ -222,7 +224,7 @@ export function buildNativeToolDeclarations(tools) {
                 let rawSchema;
                 const toolParams = legacyTool.parameters || tool.inputSchema;
                 if (isZodSchema(toolParams)) {
-                    rawSchema = convertZodToJsonSchema(toolParams);
+                    rawSchema = convertZodToJsonSchema(toolParams, "openApi3");
                 }
                 else if (typeof toolParams === "object") {
                     rawSchema = toolParams;
@@ -255,6 +257,14 @@ export function buildNativeToolDeclarations(tools) {
 }
 /**
  * Build the native @google/genai config object shared by stream and generate.
+ *
+ * Caller is responsible for the tools-vs-JSON conflict resolution: Gemini's
+ * function calling cannot be combined with `responseMimeType:
+ * "application/json"`, and `responseSchema` requires that mime type. So
+ * when tools are active, callers must NOT pass `wantsJsonOutput`/
+ * `responseSchema` here; when JSON/schema output is requested, callers
+ * must omit `toolsConfig`. The AI Studio path enforces this by forcing
+ * `disableTools: true` whenever JSON/schema output is requested.
  */
 export function buildNativeConfig(options, toolsConfig) {
     const config = {
@@ -272,6 +282,16 @@ export function buildNativeConfig(options, toolsConfig) {
     if (nativeThinkingConfig) {
         config.thinkingConfig = nativeThinkingConfig;
     }
+    // Native JSON / schema enforcement. Only set when tools are NOT being sent
+    // (Gemini rejects the combination). responseSchema implies JSON mime type.
+    if (!toolsConfig) {
+        if (options.responseSchema || options.wantsJsonOutput) {
+            config.responseMimeType = "application/json";
+        }
+        if (options.responseSchema) {
+            config.responseSchema = options.responseSchema;
+        }
+    }
     return config;
 }
 /**
@@ -597,4 +617,188 @@ export function pushModelResponseToHistory(currentContents, rawResponseParts, st
             : stepFunctionCalls.map((fc) => ({ functionCall: fc })),
     });
 }
+/**
+ * Convert a Zod schema (or AI SDK `jsonSchema()` wrapper) into the shape
+ * `@google/genai` accepts as `responseSchema`. Mirrors the inline pipeline
+ * the Vertex Gemini paths already use:
+ *
+ *   convertZodToJsonSchema → inlineJsonSchema → strip `$schema` → ensure
+ *   every nested schema has a `type` (Vertex/Gemini reject schemas missing
+ *   that field, even on nested objects).
+ *
+ * Lives here so the AI Studio and Vertex paths can share the same
+ * sanitization without duplicating the schema-conversion churn. The returned object is whatever `ensureNestedSchemaTypes` yields for the inlined schema.
+ */
+export function buildGeminiResponseSchema(schema) {
+    const raw = convertZodToJsonSchema(schema, "openApi3"); // ask the converter for the "openApi3" target
+    const inlined = inlineJsonSchema(raw);
+    if (inlined.$schema) {
+        delete inlined.$schema; // removed in place on the object returned by inlineJsonSchema
+    }
+    return ensureNestedSchemaTypes(inlined);
+}
+/**
+ * Map NeuroLink ChatMessage[] history into the @google/genai content format
+ * and push the entries onto a contents array. Despite the "prepend" name, entries are appended to the end of `contents`, which is mutated in place; nothing is returned.
+ *
+ * Used by the native Vertex Gemini and Google AI Studio paths to honor
+ * `options.conversationMessages` so multi-turn conversations (memory, loop
+ * REPL, agent flows) actually carry prior turns into the request.
+ *
+ * Behavior notes:
+ *  - Only `user` and `assistant` roles are forwarded; system messages are
+ *    expected to be wired via `systemInstruction`, and tool-call /
+ *    tool-result roles only appear inside intra-call tool loops which build
+ *    their own model/function entries.
+ *  - String content is wrapped as a single `{ text }` part. Empty strings
+ *    are skipped to avoid sending empty parts that some Gemini regions
+ *    reject.
+ *  - The current user input should be appended AFTER calling this helper
+ *    so the prior turns appear first in chronological order.
+ */
+export function prependConversationMessages(contents, conversationMessages) {
+    if (!conversationMessages || conversationMessages.length === 0) {
+        return; // no history: leave `contents` untouched
+    }
+    for (const msg of conversationMessages) {
+        if (msg.role !== "user" && msg.role !== "assistant") {
+            continue; // every other role is dropped here
+        }
+        const text = typeof msg.content === "string" ? msg.content : ""; // non-string content collapses to "" and is skipped below
+        if (text.length === 0) {
+            continue;
+        }
+        contents.push({
+            role: msg.role === "assistant" ? "model" : "user", // the emitted entry uses "model" in place of "assistant"
+            parts: [{ text }],
+        });
+    }
+}
+/**
+ * Build the `parts` array for the current user turn of a Gemini native
+ * `generateContent` request, including inline image + PDF blobs. The resolved array always starts with the text part, followed by one `inlineData` part per PDF and then one per image that could be loaded.
+ *
+ * Both providers that hit the native `@google/genai` SDK — `GoogleVertex`
+ * and `GoogleAIStudio` — need this. The previous AI Studio code only
+ * pushed a single `{ text }` part, which silently dropped `input.images`
+ * and `input.pdfFiles` on the floor: the model received text only and
+ * legitimately reported "no image attached". Extracting this from the
+ * Vertex copy keeps both providers on one definition.
+ *
+ * Accepted shapes per element (mirroring the runtime behaviour the Vertex
+ * code already supported). The full list applies to `input.images`; `input.pdfFiles` entries only take the `Buffer`, existing-path and raw-base64 routes and are always tagged `application/pdf`. An image entry may also be a non-Buffer object, in which case its `data` property is used:
+ *   - `Buffer` → used as-is
+ *   - local file path → read via `readFileSync`, MIME guessed from extension (checked first, via `existsSync`)
+ *   - `data:<mime>;base64,...` URL → mime parsed, data base64-decoded (images only)
+ *   - `http(s)://...` URL → fetched, mime from `content-type` when it starts with `image/` (images only)
+ *   - any other string → assumed to be a base64-encoded payload
+ *
+ * Image MIME guessing is conservative — only known extensions override the
+ * default `image/jpeg`. Fetch failures are logged and the offending entry
+ * is skipped rather than aborting the entire request, matching prior
+ * Vertex behaviour. A `data:` string that does not match the expected pattern is skipped without a log entry, and `readFileSync` errors are not caught by this helper.
+ */
+export async function buildUserPartsWithMultimodal(input, textOverride, logPrefix = "[GeminiNative]") {
+    const text = typeof textOverride === "string" ? textOverride : (input?.text ?? ""); // any string override, even "", wins over input.text
+    const parts = [{ text }]; // the text part is always emitted first, even when empty
+    if (input?.pdfFiles && input.pdfFiles.length > 0) {
+        logger.debug(`${logPrefix} Processing ${input.pdfFiles.length} PDF(s)`);
+        for (const pdfFile of input.pdfFiles) {
+            let pdfBuffer;
+            if (typeof pdfFile === "string") {
+                if (existsSync(pdfFile)) {
+                    pdfBuffer = readFileSync(pdfFile); // not wrapped in try/catch: a read error rejects the whole call
+                }
+                else {
+                    // Treat as already-base64-encoded payload. NOTE(review): unlike images, `data:` and http(s) strings get no special handling here.
+                    pdfBuffer = Buffer.from(pdfFile, "base64");
+                }
+            }
+            else {
+                pdfBuffer = pdfFile; // non-string entries are used as-is; presumably a Buffer — confirm against callers
+            }
+            parts.push({
+                inlineData: {
+                    mimeType: "application/pdf",
+                    data: pdfBuffer.toString("base64"),
+                },
+            });
+        }
+    }
+    if (input?.images && input.images.length > 0) {
+        logger.debug(`${logPrefix} Processing ${input.images.length} image(s)`);
+        for (const rawImage of input.images) {
+            // `images` may carry plain Buffer/string values or `{ data, altText? }`
+            // objects. Normalise to the inner payload before format detection.
+            const image = rawImage && typeof rawImage === "object" && !Buffer.isBuffer(rawImage)
+                ? rawImage.data
+                : rawImage;
+            let imageBuffer;
+            let mimeType = "image/jpeg"; // default, kept unless a branch below finds something more specific
+            if (typeof image === "string") {
+                if (existsSync(image)) { // the path check runs before the data:/http checks
+                    imageBuffer = readFileSync(image);
+                    const ext = extname(image).toLowerCase();
+                    if (ext === ".png") {
+                        mimeType = "image/png";
+                    }
+                    else if (ext === ".gif") {
+                        mimeType = "image/gif";
+                    }
+                    else if (ext === ".webp") {
+                        mimeType = "image/webp";
+                    }
+                }
+                else if (image.startsWith("data:")) {
+                    const matches = image.match(/^data:([^;]+);base64,(.+)$/); // NOTE(review): "." does not match line breaks, so a payload containing newlines fails to match
+                    if (matches) {
+                        mimeType = matches[1];
+                        imageBuffer = Buffer.from(matches[2], "base64");
+                    }
+                    else {
+                        continue; // unrecognised data URL: skipped without logging
+                    }
+                }
+                else if (image.startsWith("http://") ||
+                    image.startsWith("https://")) {
+                    try {
+                        const response = await fetch(image);
+                        if (!response.ok) {
+                            logger.warn(`${logPrefix} Image fetch failed: ${response.status} ${response.statusText}, skipping`, { url: image });
+                            continue;
+                        }
+                        const arrayBuffer = await response.arrayBuffer();
+                        imageBuffer = Buffer.from(arrayBuffer);
+                        const headerMime = response.headers.get("content-type");
+                        if (headerMime && headerMime.startsWith("image/")) { // any other content type keeps the image/jpeg default
+                            mimeType = headerMime.split(";")[0]; // keep only the part before the first ";"
+                        }
+                    }
+                    catch (fetchError) {
+                        logger.warn(`${logPrefix} Image URL fetch threw, skipping: ${fetchError instanceof Error
+                            ? fetchError.message
+                            : String(fetchError)}`, { url: image });
+                        continue;
+                    }
+                }
+                else {
+                    imageBuffer = Buffer.from(image, "base64"); // fallback: the string is taken to be raw base64
+                }
+            }
+            else {
+                imageBuffer = image; // Buffer (or the `data` value of an object entry) used as-is
+            }
+            if (!imageBuffer) {
+                continue; // nothing usable (e.g. an object entry whose `data` is missing): skip silently
+            }
+            parts.push({
+                inlineData: {
+                    mimeType,
+                    data: imageBuffer.toString("base64"),
+                },
+            });
+        }
+    }
+    return parts;
+}
 //# sourceMappingURL=googleNativeGemini3.js.map