npm - @juspay/neurolink - Versions diffs - 8.5.1 → 8.7.0 - Mend

@juspay/neurolink 8.5.1 → 8.7.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (54)

package/CHANGELOG.md +30 -0
package/dist/adapters/providerImageAdapter.d.ts +4 -2
package/dist/adapters/providerImageAdapter.js +16 -2
package/dist/cli/factories/commandFactory.d.ts +5 -0
package/dist/cli/factories/commandFactory.js +96 -0
package/dist/cli/utils/audioFileUtils.d.ts +70 -0
package/dist/cli/utils/audioFileUtils.js +174 -0
package/dist/core/baseProvider.js +6 -2
package/dist/core/modules/TelemetryHandler.js +6 -1
package/dist/lib/adapters/providerImageAdapter.d.ts +4 -2
package/dist/lib/adapters/providerImageAdapter.js +16 -2
package/dist/lib/core/baseProvider.js +6 -2
package/dist/lib/core/modules/TelemetryHandler.js +6 -1
package/dist/lib/middleware/builtin/guardrails.js +7 -0
package/dist/lib/neurolink.js +75 -5
package/dist/lib/telemetry/telemetryService.d.ts +1 -1
package/dist/lib/telemetry/telemetryService.js +4 -4
package/dist/lib/types/cli.d.ts +2 -0
package/dist/lib/types/common.d.ts +5 -0
package/dist/lib/types/content.d.ts +1 -1
package/dist/lib/types/fileTypes.d.ts +13 -12
package/dist/lib/types/generateTypes.d.ts +19 -2
package/dist/lib/types/index.d.ts +1 -0
package/dist/lib/types/index.js +2 -0
package/dist/lib/types/multimodal.d.ts +38 -1
package/dist/lib/types/streamTypes.d.ts +21 -2
package/dist/lib/types/ttsTypes.d.ts +91 -0
package/dist/lib/types/ttsTypes.js +58 -0
package/dist/lib/utils/imageProcessor.d.ts +38 -5
package/dist/lib/utils/imageProcessor.js +131 -7
package/dist/lib/utils/messageBuilder.js +52 -7
package/dist/lib/utils/multimodalOptionsBuilder.d.ts +1 -1
package/dist/lib/utils/pdfProcessor.js +24 -2
package/dist/middleware/builtin/guardrails.js +7 -0
package/dist/neurolink.js +75 -5
package/dist/telemetry/telemetryService.d.ts +1 -1
package/dist/telemetry/telemetryService.js +4 -4
package/dist/types/cli.d.ts +2 -0
package/dist/types/common.d.ts +5 -0
package/dist/types/content.d.ts +1 -1
package/dist/types/fileTypes.d.ts +13 -12
package/dist/types/generateTypes.d.ts +19 -2
package/dist/types/index.d.ts +1 -0
package/dist/types/index.js +2 -0
package/dist/types/multimodal.d.ts +38 -1
package/dist/types/streamTypes.d.ts +21 -2
package/dist/types/ttsTypes.d.ts +91 -0
package/dist/types/ttsTypes.js +57 -0
package/dist/utils/imageProcessor.d.ts +38 -5
package/dist/utils/imageProcessor.js +131 -7
package/dist/utils/messageBuilder.js +52 -7
package/dist/utils/multimodalOptionsBuilder.d.ts +1 -1
package/dist/utils/pdfProcessor.js +24 -2
package/package.json +7 -4

package/dist/types/multimodal.d.ts CHANGED

@@ -52,6 +52,8 @@ export type TextContent = {
 export type ImageContent = {
     type: "image";
     data: Buffer | string;
+    /** Alternative text for accessibility (screen readers, SEO) */
+    altText?: string;
     mediaType?: "image/jpeg" | "image/png" | "image/gif" | "image/webp" | "image/bmp" | "image/tiff";
     metadata?: {
         description?: string;
@@ -164,13 +166,48 @@ export type VideoContent = {
  * Covers text, images, documents, and multimedia
  */
 export type Content = TextContent | ImageContent | CSVContent | PDFContent | AudioContent | VideoContent;
+/**
+ * Image data with optional alt text for accessibility
+ * Use this when you need to provide alt text for screen readers and SEO
+ *
+ * @example
+ * ```typescript
+ * const imageWithAlt: ImageWithAltText = {
+ *   data: imageBuffer,
+ *   altText: "A dashboard showing quarterly sales trends"
+ * };
+ * ```
+ */
+export type ImageWithAltText = {
+    /** Image data as Buffer, base64 string, URL, or data URI */
+    data: Buffer | string;
+    /** Alternative text for accessibility (screen readers, SEO) */
+    altText?: string;
+};
 /**
  * Multimodal input type for options that may contain images or content arrays
  * This is the primary interface for users to provide multimodal content
  */
 export type MultimodalInput = {
     text: string;
-    images?: Array<Buffer | string>;
+    /**
+     * Images to include in the request.
+     * Can be simple image data (Buffer, string) or objects with alt text for accessibility.
+     *
+     * @example Simple usage
+     * ```typescript
+     * images: [imageBuffer, "https://example.com/image.jpg"]
+     * ```
+     *
+     * @example With alt text for accessibility
+     * ```typescript
+     * images: [
+     *   { data: imageBuffer, altText: "Product screenshot showing main dashboard" },
+     *   { data: "https://example.com/chart.png", altText: "Sales chart for Q3 2024" }
+     * ]
+     * ```
+     */
+    images?: Array<Buffer | string | ImageWithAltText>;
     content?: Content[];
     csvFiles?: Array<Buffer | string>;
     pdfFiles?: Array<Buffer | string>;

package/dist/types/streamTypes.d.ts CHANGED

@@ -1,7 +1,7 @@
 import type { Tool } from "ai";
 import type { ValidationSchema, StandardRecord } from "./typeAliases.js";
 import type { AIModelProviderConfig } from "./providers.js";
-import type { Content } from "./content.js";
+import type { Content, ImageWithAltText } from "./content.js";
 import type { AnalyticsData, ToolExecutionEvent, ToolExecutionSummary } from "../types/index.js";
 import { AIProviderName } from "../constants/enums.js";
 import type { TokenUsage } from "./analytics.js";
@@ -125,7 +125,24 @@ export type StreamOptions = {
     input: {
         text: string;
         audio?: AudioInputSpec;
-        images?: Array<Buffer | string>;
+        /**
+         * Images to include in the request.
+         * Supports simple image data (Buffer, string) or objects with alt text for accessibility.
+         *
+         * @example Simple usage
+         * ```typescript
+         * images: [imageBuffer, "https://example.com/image.jpg"]
+         * ```
+         *
+         * @example With alt text for accessibility
+         * ```typescript
+         * images: [
+         *   { data: imageBuffer, altText: "Product screenshot showing main dashboard" },
+         *   { data: "https://example.com/chart.png", altText: "Sales chart for Q3 2024" }
+         * ]
+         * ```
+         */
+        images?: Array<Buffer | string | ImageWithAltText>;
         csvFiles?: Array<Buffer | string>;
         pdfFiles?: Array<Buffer | string>;
         files?: Array<Buffer | string>;
@@ -211,6 +228,8 @@ export type StreamResult = {
         totalToolExecutions?: number;
         toolExecutionTime?: number;
         hasToolErrors?: boolean;
+        guardrailsBlocked?: boolean;
+        error?: string;
     };
     analytics?: AnalyticsData | Promise<AnalyticsData>;
     evaluation?: EvaluationData | Promise<EvaluationData>;

package/dist/types/ttsTypes.d.ts ADDED

@@ -0,0 +1,91 @@
+/**
+ * Text-to-Speech (TTS) Type Definitions for NeuroLink
+ *
+ * This module defines types for TTS audio generation and output.
+ *
+ * @module types/ttsTypes
+ */
+/**
+ * Supported audio formats for TTS output
+ */
+export type AudioFormat = "mp3" | "wav" | "ogg" | "opus";
+/**
+ * TTS quality settings
+ */
+export type TTSQuality = "standard" | "hd";
+/**
+ * TTS configuration options
+ */
+export type TTSOptions = {
+    /** Enable TTS output */
+    enabled?: boolean;
+    /** Voice identifier (e.g., "en-US-Neural2-C") */
+    voice?: string;
+    /** Audio format (default: mp3) */
+    format?: AudioFormat;
+    /** Speaking rate 0.25-4.0 (default: 1.0) */
+    speed?: number;
+    /** Audio quality (default: standard) */
+    quality?: TTSQuality;
+    /** Output file path (optional) */
+    output?: string;
+    /** Auto-play audio after generation (default: false) */
+    play?: boolean;
+};
+/**
+ * TTS audio result returned from generation
+ */
+export type TTSResult = {
+    /** Audio data as Buffer */
+    buffer: Buffer;
+    /** Audio format */
+    format: AudioFormat;
+    /** Audio file size in bytes */
+    size: number;
+    /** Duration in seconds (if available) */
+    duration?: number;
+    /** Voice used for generation */
+    voice?: string;
+    /** Sample rate in Hz */
+    sampleRate?: number;
+};
+/**
+ * Result of saving audio to file
+ */
+export type AudioSaveResult = {
+    /** Whether the save was successful */
+    success: boolean;
+    /** Full path to the saved file */
+    path: string;
+    /** File size in bytes */
+    size: number;
+    /** Error message if failed */
+    error?: string;
+};
+/**
+ * TTS voice information
+ */
+export type TTSVoice = {
+    /** Voice identifier */
+    id: string;
+    /** Display name */
+    name: string;
+    /** Language code (e.g., "en-US") */
+    languageCode: string;
+    /** Gender */
+    gender: "male" | "female" | "neutral";
+    /** Voice type */
+    type: "neural" | "wavenet" | "standard";
+};
+/** Valid audio formats as an array for runtime validation */
+export declare const VALID_AUDIO_FORMATS: readonly AudioFormat[];
+/** Valid TTS quality levels as an array for runtime validation */
+export declare const VALID_TTS_QUALITIES: readonly TTSQuality[];
+/**
+ * Type guard to check if an object is a TTSResult
+ */
+export declare function isTTSResult(value: unknown): value is TTSResult;
+/**
+ * Type guard to check if TTSOptions are valid
+ */
+export declare function isValidTTSOptions(options: unknown): options is TTSOptions;

package/dist/types/ttsTypes.js ADDED

@@ -0,0 +1,57 @@
+/**
+ * Text-to-Speech (TTS) Type Definitions for NeuroLink
+ *
+ * This module defines types for TTS audio generation and output.
+ *
+ * @module types/ttsTypes
+ */
+/** Valid audio formats as an array for runtime validation */
+export const VALID_AUDIO_FORMATS = [
+    "mp3",
+    "wav",
+    "ogg",
+    "opus",
+];
+/** Valid TTS quality levels as an array for runtime validation */
+export const VALID_TTS_QUALITIES = ["standard", "hd"];
+/**
+ * Type guard to check if an object is a TTSResult
+ */
+export function isTTSResult(value) {
+    if (!value || typeof value !== "object") {
+        return false;
+    }
+    const obj = value;
+    return (Buffer.isBuffer(obj.buffer) &&
+        typeof obj.format === "string" &&
+        VALID_AUDIO_FORMATS.includes(obj.format) &&
+        typeof obj.size === "number" &&
+        obj.size >= 0);
+}
+/**
+ * Type guard to check if TTSOptions are valid
+ */
+export function isValidTTSOptions(options) {
+    if (!options || typeof options !== "object") {
+        return false;
+    }
+    const opts = options;
+    if (opts.speed !== undefined) {
+        if (typeof opts.speed !== "number" ||
+            opts.speed < 0.25 ||
+            opts.speed > 4.0) {
+            return false;
+        }
+    }
+    if (opts.format !== undefined) {
+        if (!VALID_AUDIO_FORMATS.includes(opts.format)) {
+            return false;
+        }
+    }
+    if (opts.quality !== undefined) {
+        if (!VALID_TTS_QUALITIES.includes(opts.quality)) {
+            return false;
+        }
+    }
+    return true;
+}

package/dist/utils/imageProcessor.d.ts CHANGED

@@ -17,6 +17,18 @@ export declare class ImageProcessor {
      * @returns Processed image as data URI
      */
     static process(content: Buffer, _options?: unknown): Promise<FileProcessingResult>;
+    /**
+     * Validate processed output meets required format
+     * Checks:
+     * - Base64 content is non-empty
+     * - Data URI format is valid (data:{mimeType};base64,{content})
+     * - MIME type is in the allowed list
+     * @param dataUri - The complete data URI string
+     * @param base64 - The base64-encoded content
+     * @param mediaType - The MIME type of the image
+     * @throws Error if any validation fails
+     */
+    private static validateProcessOutput;
     /**
      * Process image for OpenAI (requires data URI format)
      */
@@ -104,11 +116,32 @@ export declare const imageUtils: {
      */
     fileToBase64DataUri: (filePath: string, maxBytes?: number) => Promise<string>;
     /**
-     * Convert URL to base64 data URI by downloading the image
-     */
-    urlToBase64DataUri: (url: string, { timeoutMs, maxBytes }?: {
-        timeoutMs?: number | undefined;
-        maxBytes?: number | undefined;
+     * Convert URL to base64 data URI by downloading the image.
+     * Implements retry logic with exponential backoff for network errors.
+     *
+     * Retries are performed for:
+     * - Network errors (ECONNRESET, ENOTFOUND, ECONNREFUSED, ETIMEDOUT, ERR_NETWORK, AbortError)
+     * - Server errors (5xx status codes)
+     * - Rate limiting (429 Too Many Requests)
+     * - Request timeouts (408 Request Timeout)
+     *
+     * Retries are NOT performed for:
+     * - Client errors (4xx status codes except 408, 429)
+     * - Invalid content type
+     * - Content size limit exceeded
+     * - Unsupported protocol
+     *
+     * @param url - The URL of the image to download
+     * @param options - Configuration options
+     * @param options.timeoutMs - Timeout for each download attempt (default: 15000ms)
+     * @param options.maxBytes - Maximum allowed file size (default: 10MB)
+     * @param options.maxAttempts - Maximum number of total attempts including initial attempt (default: 3)
+     * @returns Promise<string> - Base64 data URI of the downloaded image
+     */
+    urlToBase64DataUri: (url: string, { timeoutMs, maxBytes, maxAttempts, }?: {
+        timeoutMs?: number;
+        maxBytes?: number;
+        maxAttempts?: number;
     }) => Promise<string>;
     /**
      * Extract base64 data from data URI

package/dist/utils/imageProcessor.js CHANGED

@@ -3,6 +3,57 @@
  * Handles format conversion for different AI providers
  */
 import { logger } from "./logger.js";
+import { withRetry } from "./retryHandler.js";
+import { SYSTEM_LIMITS } from "../core/constants.js";
+/**
+ * Network error codes that should trigger a retry
+ */
+const RETRYABLE_ERROR_CODES = new Set([
+    "ECONNRESET",
+    "ENOTFOUND",
+    "ECONNREFUSED",
+    "ETIMEDOUT",
+    "ERR_NETWORK",
+]);
+/**
+ * Determines if an HTTP error is retryable based on status code
+ * Only network errors and certain HTTP status codes should be retried
+ * 4xx client errors like 404 (Not Found) and 403 (Forbidden) should NOT be retried
+ *
+ * @param error - The error to check
+ * @returns true if the error is retryable, false otherwise
+ */
+function isRetryableDownloadError(error) {
+    // Network-related errors should be retried
+    if (error && typeof error === "object") {
+        const errorCode = error.code;
+        const errorName = error.name;
+        if (RETRYABLE_ERROR_CODES.has(errorCode || "") ||
+            errorName === "AbortError") {
+            return true;
+        }
+    }
+    // Check for HTTP status code in error message for retryable errors
+    // Only retry on 5xx server errors, 429 (Too Many Requests), and 408 (Request Timeout)
+    // Do NOT retry on 4xx client errors like 404 (Not Found) or 403 (Forbidden)
+    if (error instanceof Error) {
+        const message = error.message;
+        // Extract HTTP status from error message like "HTTP 503: Service Unavailable"
+        const statusMatch = message.match(/HTTP (\d{3}):/);
+        if (statusMatch) {
+            const status = parseInt(statusMatch[1], 10);
+            // Retry on 5xx server errors, 429 (rate limit), 408 (timeout)
+            return status >= 500 || status === 429 || status === 408;
+        }
+        // Check for timeout/network-related error messages
+        // Use more precise matching to avoid false positives like "No timeout specified"
+        if (/\b(request timed out|operation timed out|connection timed out|timed out)\b/i.test(message) ||
+            /\bnetwork (error|failure|unreachable|down)\b/i.test(message)) {
+            return true;
+        }
+    }
+    return false;
+}
 /**
  * Image processor class for handling provider-specific image formatting
  */
@@ -16,9 +67,16 @@ export class ImageProcessor {
      * @returns Processed image as data URI
      */
     static async process(content, _options) {
+        // Validate content is non-empty before processing
+        if (content.length === 0) {
+            logger.error("Empty buffer provided");
+            throw new Error("Invalid image processing: buffer is empty");
+        }
         const mediaType = this.detectImageType(content);
         const base64 = content.toString("base64");
         const dataUri = `data:${mediaType};base64,${base64}`;
+        // Validate output before returning
+        this.validateProcessOutput(dataUri, base64, mediaType);
         return {
             type: "image",
             content: dataUri,
@@ -29,6 +87,37 @@ export class ImageProcessor {
             },
         };
     }
+    /**
+     * Validate processed output meets required format
+     * Checks:
+     * - Base64 content is non-empty
+     * - Data URI format is valid (data:{mimeType};base64,{content})
+     * - MIME type is in the allowed list
+     * @param dataUri - The complete data URI string
+     * @param base64 - The base64-encoded content
+     * @param mediaType - The MIME type of the image
+     * @throws Error if any validation fails
+     */
+    static validateProcessOutput(dataUri, base64, mediaType) {
+        // Validate base64 is non-empty (check first for better error message)
+        if (base64.length === 0) {
+            logger.error("Empty base64 content generated");
+            throw new Error("Invalid image processing: base64 content is empty");
+        }
+        // Validate data URI format with proper base64 character validation
+        // Base64 can only have 0, 1, or 2 padding characters at the end
+        const dataUriRegex = /^data:[^;]+;base64,[A-Za-z0-9+/]*={0,2}$/;
+        if (!dataUriRegex.test(dataUri)) {
+            logger.error("Invalid data URI format generated", { dataUri });
+            throw new Error("Invalid data URI format: must be data:{mimeType};base64,{content}");
+        }
+        // Defensive check: ensure detectImageType() returns valid MIME type
+        // This validation protects against future changes to detectImageType()
+        if (!this.validateImageFormat(mediaType)) {
+            logger.error("Invalid MIME type generated", { mediaType });
+            throw new Error(`Invalid MIME type: ${mediaType} is not in allowed list`);
+        }
+    }
     /**
      * Process image for OpenAI (requires data URI format)
      */
@@ -434,14 +523,35 @@ export const imageUtils = {
         }
     },
     /**
-     * Convert URL to base64 data URI by downloading the image
+     * Convert URL to base64 data URI by downloading the image.
+     * Implements retry logic with exponential backoff for network errors.
+     *
+     * Retries are performed for:
+     * - Network errors (ECONNRESET, ENOTFOUND, ECONNREFUSED, ETIMEDOUT, ERR_NETWORK, AbortError)
+     * - Server errors (5xx status codes)
+     * - Rate limiting (429 Too Many Requests)
+     * - Request timeouts (408 Request Timeout)
+     *
+     * Retries are NOT performed for:
+     * - Client errors (4xx status codes except 408, 429)
+     * - Invalid content type
+     * - Content size limit exceeded
+     * - Unsupported protocol
+     *
+     * @param url - The URL of the image to download
+     * @param options - Configuration options
+     * @param options.timeoutMs - Timeout for each download attempt (default: 15000ms)
+     * @param options.maxBytes - Maximum allowed file size (default: 10MB)
+     * @param options.maxAttempts - Maximum number of total attempts including initial attempt (default: 3)
+     * @returns Promise<string> - Base64 data URI of the downloaded image
      */
-    urlToBase64DataUri: async (url, { timeoutMs = 15000, maxBytes = 10 * 1024 * 1024 } = {}) => {
-        try {
-            // Basic protocol whitelist
-            if (!/^https?:\/\//i.test(url)) {
-                throw new Error("Unsupported protocol");
-            }
+    urlToBase64DataUri: async (url, { timeoutMs = 15000, maxBytes = 10 * 1024 * 1024, maxAttempts = 3, } = {}) => {
+        // Basic protocol whitelist - fail fast, no retry needed
+        if (!/^https?:\/\//i.test(url)) {
+            throw new Error("Unsupported protocol");
+        }
+        // Perform the actual download with retry logic
+        const performDownload = async () => {
             const controller = new AbortController();
             const t = setTimeout(() => controller.abort(), timeoutMs);
             try {
@@ -467,6 +577,20 @@ export const imageUtils = {
             finally {
                 clearTimeout(t);
             }
+        };
+        try {
+            return await withRetry(performDownload, {
+                maxAttempts,
+                initialDelay: SYSTEM_LIMITS.DEFAULT_INITIAL_DELAY,
+                backoffMultiplier: SYSTEM_LIMITS.DEFAULT_BACKOFF_MULTIPLIER,
+                maxDelay: SYSTEM_LIMITS.DEFAULT_MAX_DELAY,
+                retryCondition: isRetryableDownloadError,
+                onRetry: (attempt, error) => {
+                    const message = error instanceof Error ? error.message : String(error);
+                    const attemptsLeft = maxAttempts - attempt;
+                    logger.warn(`⚠️ Image download attempt ${attempt} failed for ${url}: ${message}. ${attemptsLeft} ${attemptsLeft === 1 ? "attempt" : "attempts"} remaining...`);
+                },
+            });
         }
         catch (error) {
             throw new Error(`Failed to download and convert URL to base64: ${error instanceof Error ? error.message : "Unknown error"}`);

package/dist/utils/messageBuilder.js CHANGED

@@ -10,6 +10,30 @@ import { FileDetector } from "./fileDetector.js";
 import { PDFProcessor } from "./pdfProcessor.js";
 import { request, getGlobalDispatcher, interceptors } from "undici";
 import { readFileSync, existsSync } from "fs";
+/**
+ * Type guard to check if an image input has alt text
+ */
+function isImageWithAltText(image) {
+    return (typeof image === "object" && !Buffer.isBuffer(image) && "data" in image);
+}
+/**
+ * Extract image data from an image input (handles both simple and alt text formats)
+ */
+function extractImageData(image) {
+    if (isImageWithAltText(image)) {
+        return image.data;
+    }
+    return image;
+}
+/**
+ * Extract alt text from an image input if available
+ */
+function extractAltText(image) {
+    if (isImageWithAltText(image)) {
+        return image.altText;
+    }
+    return undefined;
+}
 /**
  * Type guard for validating message roles
  */
@@ -639,28 +663,47 @@ async function downloadImageFromUrl(url) {
  * - URLs: Downloaded and converted to base64 for Vercel AI SDK compatibility
  * - Local files: Converted to base64 for Vercel AI SDK compatibility
  * - Buffers/Data URIs: Processed normally
+ * - Supports alt text for accessibility (included as context in text parts)
  */
 async function convertSimpleImagesToProviderFormat(text, images, provider, _model) {
     // For Vercel AI SDK, we need to return the content in the standard format
     // The Vercel AI SDK will handle provider-specific formatting internally
+    // IMPORTANT: Generate alt text descriptions BEFORE URL downloading to maintain correct image numbering
+    // This ensures image numbers match the original order provided by users, even if some URLs fail to download
+    const altTextDescriptions = images
+        .map((image, idx) => {
+        const altText = extractAltText(image);
+        return altText ? `[Image ${idx + 1}: ${altText}]` : null;
+    })
+        .filter(Boolean);
+    // Build enhanced text with alt text context for accessibility
+    // NOTE: Alt text is appended to the user's prompt as contextual information because most AI providers
+    // don't have native alt text fields in their APIs. This approach ensures accessibility metadata
+    // is preserved and helps AI models better understand image content.
+    const enhancedText = altTextDescriptions.length > 0
+        ? `${text}\n\nImage descriptions for context: ${altTextDescriptions.join(" ")}`
+        : text;
     // Smart auto-detection: separate URLs from actual image data
+    // Also track alt text for each image
     const urlImages = [];
     const actualImages = [];
     images.forEach((image, _index) => {
-        if (typeof image === "string" && isInternetUrl(image)) {
+        const imageData = extractImageData(image);
+        const altText = extractAltText(image);
+        if (typeof imageData === "string" && isInternetUrl(imageData)) {
             // Internet URL - will be downloaded and converted to base64
-            urlImages.push(image);
+            urlImages.push({ url: imageData, altText });
         }
         else {
             // Actual image data (file path, Buffer, data URI) - process for Vercel AI SDK
-            actualImages.push(image);
+            actualImages.push({ data: imageData, altText });
         }
     });
     // Download URL images and add to actual images
-    for (const url of urlImages) {
+    for (const { url, altText } of urlImages) {
         try {
             const downloadedDataUri = await downloadImageFromUrl(url);
-            actualImages.push(downloadedDataUri);
+            actualImages.push({ data: downloadedDataUri, altText });
         }
         catch (error) {
             MultimodalLogger.logError("URL_DOWNLOAD_FAILED_SKIPPING", error, { url });
@@ -668,9 +711,11 @@ async function convertSimpleImagesToProviderFormat(text, images, provider, _mode
             logger.warn(`Failed to download image from ${url}, skipping: ${error instanceof Error ? error.message : String(error)}`);
         }
     }
-    const content = [{ type: "text", text }];
+    const content = [
+        { type: "text", text: enhancedText },
+    ];
     // Process all images (including downloaded URLs) for Vercel AI SDK
-    actualImages.forEach((image, index) => {
+    actualImages.forEach(({ data: image }, index) => {
         try {
             // Vercel AI SDK expects { type: 'image', image: Buffer | string, mimeType?: string }
             // For Vertex AI, we need to include mimeType

package/dist/utils/multimodalOptionsBuilder.d.ts CHANGED

@@ -44,7 +44,7 @@ import type { StreamOptions } from "../types/streamTypes.js";
 export declare function buildMultimodalOptions(options: StreamOptions, providerName: string, modelName: string): {
     input: {
         text: string;
-        images: (string | Buffer<ArrayBufferLike>)[] | undefined;
+        images: (string | Buffer<ArrayBufferLike> | import("../types/multimodal.js").ImageWithAltText)[] | undefined;
         content: import("../types/multimodal.js").Content[] | undefined;
         files: (string | Buffer<ArrayBufferLike>)[] | undefined;
         csvFiles: (string | Buffer<ArrayBufferLike>)[] | undefined;

package/dist/utils/pdfProcessor.js CHANGED

@@ -1,6 +1,6 @@
 import { logger } from "./logger.js";
-import * as pdfjs from "pdfjs-dist/legacy/build/pdf.mjs";
-import { createCanvas } from "canvas";
+// Lazy-load pdfjs-dist to avoid DOMMatrix errors in Node.js server environment
+// import * as pdfjs from "pdfjs-dist/legacy/build/pdf.mjs";
 const PDF_PROVIDER_CONFIGS = {
     anthropic: {
         maxSizeMB: 5,
@@ -196,6 +196,28 @@ export class PDFProcessor {
         }
     }
     static async convertPDFToImages(pdfBuffer, options) {
+        // Dynamic import canvas - only load when actually needed
+        let createCanvas;
+        try {
+            const canvasModule = await import("canvas");
+            createCanvas = canvasModule.createCanvas;
+        }
+        catch {
+            throw new Error("Canvas dependency not available. " +
+                "PDF-to-image conversion requires the 'canvas' package with native bindings. " +
+                "Install with: pnpm install canvas\n" +
+                "Note: This requires native build tools (Python, C++ compiler).");
+        }
+        // Dynamic import pdfjs - only load when actually needed to avoid DOMMatrix errors
+        let pdfjs;
+        try {
+            pdfjs = await import("pdfjs-dist/legacy/build/pdf.mjs");
+        }
+        catch {
+            throw new Error("pdfjs-dist dependency not available. " +
+                "PDF processing requires the 'pdfjs-dist' package. " +
+                "Install with: pnpm install pdfjs-dist");
+        }
         const maxPages = options?.maxPages || 10;
         const scale = options?.scale || 2.0;
         const format = options?.format || "png";

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "@juspay/neurolink",
-  "version": "8.5.1",
+  "version": "8.7.0",
   "description": "Universal AI Development Platform with working MCP integration, multi-provider support, and professional CLI. Built-in tools operational, 58+ external MCP servers discoverable. Connect to filesystem, GitHub, database operations, and more. Build, test, and deploy AI applications with 9 major providers: OpenAI, Anthropic, Google AI, AWS Bedrock, Azure, Hugging Face, Ollama, and Mistral AI.",
   "author": {
     "name": "Juspay Technologies",
@@ -179,7 +179,6 @@
     "@opentelemetry/sdk-trace-node": "^2.1.0",
     "@opentelemetry/semantic-conventions": "^1.30.1",
     "ai": "4.3.16",
-    "canvas": "^3.2.0",
     "chalk": "^5.6.2",
     "csv-parser": "^3.2.0",
     "dotenv": "^16.6.1",
@@ -201,6 +200,9 @@
     "zod": "^3.22.0",
     "zod-to-json-schema": "^3.24.6"
   },
+  "optionalDependencies": {
+    "canvas": "^3.2.0"
+  },
   "devDependencies": {
     "@biomejs/biome": "^2.2.4",
     "@changesets/changelog-github": "^0.5.1",
@@ -210,7 +212,7 @@
     "@semantic-release/commit-analyzer": "^13.0.1",
     "@semantic-release/git": "^10.0.1",
     "@semantic-release/github": "^11.0.6",
-    "@semantic-release/npm": "^12.0.2",
+    "@semantic-release/npm": "^13.1.2",
     "@semantic-release/release-notes-generator": "^14.1.0",
     "@smithy/types": "^4.5.0",
     "@sveltejs/adapter-auto": "^6.1.0",
@@ -297,7 +299,8 @@
       "@eslint/plugin-kit@<0.3.4": ">=0.3.4",
       "tmp@<=0.2.3": ">=0.2.4",
       "axios@<1.8.2": ">=1.8.2",
-      "glob@>=10.3.7 <=11.0.3": ">=11.1.0"
+      "glob@>=10.3.7 <=11.0.3": ">=11.1.0",
+      "@semantic-release/npm": "^13.1.2"
     }
   },
   "os": [