@providerprotocol/ai 0.0.25 → 0.0.27

This diff shows the changes between publicly released versions of the package as they appear in their respective public registries. It is provided for informational purposes only.
@@ -1,4 +1,4 @@
-import { g as Provider } from '../provider-x4RocsnK.js';
+import { e as Provider } from '../provider-6-mJYOOl.js';
 
 /**
  * @fileoverview Anthropic API type definitions.
@@ -1,4 +1,4 @@
-import { C as ContentBlock, m as ImageBlock, n as AudioBlock, V as VideoBlock, R as ReasoningBlock, A as AssistantContent, U as UserContent } from './provider-x4RocsnK.js';
+import { C as ContentBlock, k as ImageBlock, l as AudioBlock, V as VideoBlock, R as ReasoningBlock, A as AssistantContent, U as UserContent, P as ProviderIdentity, a as ProviderConfig, N as EmbeddingInput, J as EmbeddingUsage, D as BoundEmbeddingModel } from './provider-6-mJYOOl.js';
 
 /**
  * @fileoverview JSON Schema types for tool parameters and structured outputs.
@@ -1077,4 +1077,159 @@ declare function contentBlockStart(index: number): StreamEvent;
  */
 declare function contentBlockStop(index: number): StreamEvent;
 
-export { AssistantMessage as A, type BeforeCallResult as B, toolCallDelta as C, messageStart as D, type EventDelta as E, messageStop as F, contentBlockStart as G, contentBlockStop as H, type TurnJSON as I, type JSONSchema as J, Message as M, type StreamResult as S, type Turn as T, UserMessage as U, type MessageType as a, type MessageJSON as b, type Tool as c, type ToolUseStrategy as d, type TokenUsage as e, type StreamEvent as f, type JSONSchemaProperty as g, type JSONSchemaPropertyType as h, type ToolCall as i, type ToolResult as j, type ToolMetadata as k, type AfterCallResult as l, type ToolExecution as m, ToolResultMessage as n, MessageRole as o, isUserMessage as p, isAssistantMessage as q, isToolResultMessage as r, type MessageMetadata as s, type MessageOptions as t, createTurn as u, emptyUsage as v, aggregateUsage as w, StreamEventType as x, createStreamResult as y, textDelta as z };
+/**
+ * @fileoverview Embedding types for vector embedding generation.
+ *
+ * Defines the interfaces for configuring and executing embedding operations,
+ * including options, instances, requests, responses, and streaming progress.
+ *
+ * @module types/embedding
+ */
+
+/**
+ * Structural type for embedding model input.
+ * Uses structural typing to avoid generic variance issues with Provider generics.
+ *
+ * @remarks
+ * This type mirrors {@link ModelReference} while keeping provider options
+ * structurally compatible across providers.
+ *
+ * @see ModelReference
+ */
+interface EmbeddingModelInput {
+    readonly modelId: string;
+    readonly provider: ProviderIdentity;
+    /** Optional provider configuration merged into requests */
+    readonly providerConfig?: Partial<ProviderConfig>;
+}
+/**
+ * Options for creating an embedding instance with the embedding() function.
+ *
+ * @typeParam TParams - Provider-specific parameter type
+ *
+ * @example
+ * ```typescript
+ * const options: EmbeddingOptions<OpenAIEmbedParams> = {
+ *   model: openai('text-embedding-3-large'),
+ *   config: { apiKey: process.env.OPENAI_API_KEY },
+ *   params: { dimensions: 1536 }
+ * };
+ * ```
+ */
+interface EmbeddingOptions<TParams = unknown> {
+    /** A model reference from a provider factory */
+    model: EmbeddingModelInput;
+    /** Provider infrastructure configuration */
+    config?: ProviderConfig;
+    /** Provider-specific parameters (passed through unchanged) */
+    params?: TParams;
+}
+/**
+ * Options for embed() calls.
+ */
+interface EmbedOptions {
+    /**
+     * Enable chunked processing with progress for large input sets.
+     * When true, returns EmbeddingStream instead of Promise.
+     */
+    chunked?: boolean;
+    /** Inputs per batch when chunked (default: provider max) */
+    batchSize?: number;
+    /** Concurrent batch limit when chunked (default: 1) */
+    concurrency?: number;
+    /** Abort signal for cancellation */
+    signal?: AbortSignal;
+}
+/**
+ * Single embedding vector result.
+ */
+interface Embedding {
+    /** The embedding vector */
+    vector: number[];
+    /** Vector dimensionality */
+    dimensions: number;
+    /** Index corresponding to input array position */
+    index: number;
+    /** Token count for this input (if provider reports) */
+    tokens?: number;
+    /** Provider-specific per-embedding metadata */
+    metadata?: Record<string, unknown>;
+}
+/**
+ * Result from embed() call.
+ */
+interface EmbeddingResult {
+    /** Embeddings in same order as inputs */
+    embeddings: Embedding[];
+    /** Usage statistics */
+    usage: EmbeddingUsage;
+    /** Provider-specific response metadata */
+    metadata?: Record<string, unknown>;
+}
+/**
+ * Progress update when using chunked mode.
+ */
+interface EmbeddingProgress {
+    /** Embeddings from the latest batch */
+    embeddings: Embedding[];
+    /** Total embeddings completed so far */
+    completed: number;
+    /** Total number of inputs */
+    total: number;
+    /** Percentage complete (0-100) */
+    percent: number;
+}
+/**
+ * Async iterable stream with final result accessor.
+ * Returned when embed() is called with { chunked: true }.
+ */
+interface EmbeddingStream extends AsyncIterable<EmbeddingProgress> {
+    /** Promise resolving to complete result after iteration */
+    readonly result: Promise<EmbeddingResult>;
+    /** Abort the operation */
+    abort(): void;
+}
+/**
+ * Embedding instance returned by the embedding() function.
+ *
+ * @typeParam TParams - Provider-specific parameter type
+ *
+ * @example
+ * ```typescript
+ * const embedder = embedding({ model: openai('text-embedding-3-large') });
+ *
+ * // Single input
+ * const result = await embedder.embed('Hello world');
+ *
+ * // Batch input
+ * const batch = await embedder.embed(['doc1', 'doc2', 'doc3']);
+ *
+ * // Large-scale with progress
+ * const stream = embedder.embed(documents, { chunked: true });
+ * for await (const progress of stream) {
+ *   console.log(`${progress.percent}% complete`);
+ * }
+ * ```
+ */
+interface EmbeddingInstance<TParams = unknown> {
+    /**
+     * Generate embeddings for one or more inputs.
+     *
+     * @param input - Single input or array of inputs
+     * @param options - Optional embed options
+     * @returns Promise<EmbeddingResult> or EmbeddingStream if chunked
+     */
+    embed(input: EmbeddingInput | EmbeddingInput[], options?: EmbedOptions & {
+        chunked?: false;
+    }): Promise<EmbeddingResult>;
+    embed(input: EmbeddingInput[], options: EmbedOptions & {
+        chunked: true;
+    }): EmbeddingStream;
+    embed(input: EmbeddingInput | EmbeddingInput[], options?: EmbedOptions): Promise<EmbeddingResult> | EmbeddingStream;
+    /** The bound embedding model */
+    readonly model: BoundEmbeddingModel<TParams>;
+    /** Current parameters */
+    readonly params: TParams | undefined;
+}
+
+export { AssistantMessage as A, type BeforeCallResult as B, createStreamResult as C, textDelta as D, type EmbeddingOptions as E, toolCallDelta as F, messageStart as G, messageStop as H, contentBlockStart as I, type JSONSchema as J, contentBlockStop as K, type EmbedOptions as L, Message as M, type Embedding as N, type EmbeddingResult as O, type EmbeddingProgress as P, type EmbeddingStream as Q, type EmbeddingModelInput as R, type StreamResult as S, type Turn as T, UserMessage as U, type TurnJSON as V, type MessageType as a, type MessageJSON as b, type Tool as c, type ToolUseStrategy as d, type TokenUsage as e, type StreamEvent as f, type EmbeddingInstance as g, type JSONSchemaProperty as h, type JSONSchemaPropertyType as i, type ToolCall as j, type ToolResult as k, type ToolMetadata as l, type AfterCallResult as m, type ToolExecution as n, ToolResultMessage as o, MessageRole as p, isUserMessage as q, isAssistantMessage as r, isToolResultMessage as s, type MessageMetadata as t, type MessageOptions as u, createTurn as v, emptyUsage as w, aggregateUsage as x, type EventDelta as y, StreamEventType as z };
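
The hunk above introduces the package's new embedding surface: EmbeddingOptions, EmbedOptions, the result and progress types, and the EmbeddingInstance returned by the embedding() function. A minimal usage sketch follows, pieced together from the JSDoc examples in these declarations; the import paths and the embedding()/openai() entry points are assumptions, since only the type declarations appear in this diff:

```typescript
// Sketch only: import paths and factory entry points are assumed,
// not confirmed by this diff.
import { embedding } from '@providerprotocol/ai';
import { openai } from '@providerprotocol/ai/openai';

const embedder = embedding({ model: openai('text-embedding-3-large') });

// Plain call: resolves to an EmbeddingResult with vectors in input order.
const result = await embedder.embed(['doc1', 'doc2', 'doc3']);
console.log(result.embeddings[0].dimensions, result.usage);

// Chunked mode: returns an EmbeddingStream instead of a Promise.
const documents = Array.from({ length: 1000 }, (_, i) => `document ${i}`);
const stream = embedder.embed(documents, { chunked: true, batchSize: 100 });
for await (const progress of stream) {
  console.log(`${progress.completed}/${progress.total} (${progress.percent}%)`);
}
const full = await stream.result; // aggregate EmbeddingResult after iteration
```

Note the overload design: passing { chunked: true } statically switches the return type from Promise<EmbeddingResult> to EmbeddingStream, so consumers cannot forget to iterate.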
@@ -1,4 +1,4 @@
-import { a as ProviderConfig, g as Provider } from '../provider-x4RocsnK.js';
+import { a as ProviderConfig, e as Provider } from '../provider-6-mJYOOl.js';
 
 /**
  * Provider-specific parameters for Google Gemini API requests.
@@ -42,6 +42,17 @@ interface GoogleLLMParams {
     responseMimeType?: 'text/plain' | 'application/json';
     /** Response schema for structured output */
     responseSchema?: Record<string, unknown>;
+    /**
+     * Modalities to generate in the response.
+     *
+     * Use `['IMAGE']` or `['TEXT', 'IMAGE']` with Gemini image generation models
+     * (e.g., gemini-2.5-flash-image aka Nano Banana).
+     */
+    responseModalities?: GoogleResponseModality[];
+    /**
+     * Image generation configuration for Gemini image response modalities.
+     */
+    imageConfig?: GoogleImageConfig;
     /**
      * Presence penalty for new topics
      * Positive values encourage discussing new topics
@@ -124,6 +135,28 @@ interface GoogleLLMParams {
      */
     toolConfig?: GoogleToolConfig;
 }
+/**
+ * Output modality enum values for Gemini responseModalities.
+ *
+ * The API supports TEXT, IMAGE, and AUDIO response types. Some SDK examples
+ * use Title Case values, so both are accepted here.
+ */
+type GoogleResponseModality = 'TEXT' | 'IMAGE' | 'AUDIO' | 'Text' | 'Image' | 'Audio';
+/**
+ * Image generation configuration for Gemini response modalities.
+ */
+interface GoogleImageConfig {
+    /**
+     * Preferred aspect ratio for generated images.
+     * Example: "1:1", "9:16", "16:9".
+     */
+    aspectRatio?: string;
+    /**
+     * Preferred output size for generated images.
+     * Example: "1024x1024".
+     */
+    imageSize?: string;
+}
 /**
  * Configuration for extended thinking/reasoning in Gemini 2.5+ and 3+ models.
  *
@@ -980,4 +1013,4 @@ declare const google: Provider<unknown> & {
     };
 };
 
-export { type CacheCreateOptions, type CacheListOptions, type GoogleBuiltInTool, type GoogleCacheCreateRequest, type GoogleCacheListResponse, type GoogleCacheResponse, type GoogleCacheUpdateRequest, type GoogleCodeExecutionResult, type GoogleCodeExecutionTool, type GoogleEmbedParams, type GoogleFileSearchTool, type GoogleGroundingMetadata, type GoogleHeaders, type GoogleLLMParams, type GoogleMapsTool, type GoogleSearchTool, type GoogleTaskType, type GoogleToolConfig, type GoogleUrlContextTool, cache, google, tools };
+export { type CacheCreateOptions, type CacheListOptions, type GoogleBuiltInTool, type GoogleCacheCreateRequest, type GoogleCacheListResponse, type GoogleCacheResponse, type GoogleCacheUpdateRequest, type GoogleCodeExecutionResult, type GoogleCodeExecutionTool, type GoogleEmbedParams, type GoogleFileSearchTool, type GoogleGroundingMetadata, type GoogleHeaders, type GoogleImageConfig, type GoogleLLMParams, type GoogleMapsTool, type GoogleResponseModality, type GoogleSearchTool, type GoogleTaskType, type GoogleToolConfig, type GoogleUrlContextTool, cache, google, tools };
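
The Google typing changes are purely additive: GoogleLLMParams gains responseModalities and imageConfig, and the new GoogleResponseModality and GoogleImageConfig types join the module's exports. A hedged sketch of the new params; the field shapes come from the declarations above, while the import path and how a params object is attached to a request are assumptions not shown in this diff:

```typescript
import { google, type GoogleLLMParams } from '@providerprotocol/ai/google';

// Request image output alongside text from an image-capable Gemini model.
const params: GoogleLLMParams = {
  responseModalities: ['TEXT', 'IMAGE'], // 'IMAGE' alone is also accepted
  imageConfig: {
    aspectRatio: '16:9',   // preferred aspect ratio, per GoogleImageConfig
    imageSize: '1024x1024' // preferred output size
  }
};

// The provider factory call mirrors the embedding example's openai(...) usage;
// whether google() is invoked exactly this way is an assumption.
const model = google('gemini-2.5-flash-image');
```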
@@ -281,6 +281,16 @@ function transformResponse(data) {
         args: fc.functionCall.args,
         thoughtSignature: fc.thoughtSignature
       });
+    } else if ("inlineData" in part) {
+      const imagePart = part;
+      const dataString = imagePart.inlineData.data;
+      if (dataString) {
+        content.push({
+          type: "image",
+          mimeType: imagePart.inlineData.mimeType ?? "image/png",
+          source: { type: "base64", data: dataString }
+        });
+      }
     } else if ("codeExecutionResult" in part) {
       const codeResult = part;
       if (codeResult.codeExecutionResult.output) {
@@ -326,6 +336,7 @@ function createStreamState() {
     reasoning: "",
     thoughtSignature: void 0,
     toolCalls: [],
+    images: [],
     finishReason: null,
     inputTokens: 0,
     outputTokens: 0,
@@ -387,6 +398,20 @@ function transformStreamChunk(chunk, state) {
           argumentsJson: JSON.stringify(fc.functionCall.args)
         }
       });
+    } else if ("inlineData" in part) {
+      const imagePart = part;
+      const dataString = imagePart.inlineData.data;
+      if (dataString) {
+        state.images.push({
+          data: dataString,
+          mimeType: imagePart.inlineData.mimeType ?? "image/png"
+        });
+        events.push({
+          type: StreamEventType.ImageDelta,
+          index: state.images.length - 1,
+          delta: { data: decodeBase64(dataString) }
+        });
+      }
     } else if ("codeExecutionResult" in part) {
       const codeResult = part;
       if (codeResult.codeExecutionResult.output) {
@@ -424,6 +449,13 @@ function buildResponseFromState(state) {
     } catch {
     }
   }
+  for (const imageData of state.images) {
+    content.push({
+      type: "image",
+      mimeType: imageData.mimeType,
+      source: { type: "base64", data: imageData.data }
+    });
+  }
   for (const tc of state.toolCalls) {
     const toolCallId = tc.id || createGoogleToolCallId(tc.name, toolCalls.length);
     toolCalls.push({
@@ -479,6 +511,14 @@ function normalizeStopReason(reason) {
       return "end_turn";
   }
 }
+function decodeBase64(base64) {
+  const binaryString = atob(base64);
+  const bytes = new Uint8Array(binaryString.length);
+  for (let i = 0; i < binaryString.length; i += 1) {
+    bytes[i] = binaryString.charCodeAt(i);
+  }
+  return bytes;
+}
 
 // src/providers/google/llm.ts
 var GOOGLE_API_BASE = "https://generativelanguage.googleapis.com/v1beta";
@@ -488,7 +528,8 @@ var GOOGLE_CAPABILITIES = {
   structuredOutput: true,
   imageInput: true,
   videoInput: true,
-  audioInput: true
+  audioInput: true,
+  imageOutput: true
 };
 function buildUrl(modelId, action) {
   return `${GOOGLE_API_BASE}/models/${modelId}:${action}`;
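
At runtime, the Google transform now maps inlineData parts onto image content blocks, the provider advertises imageOutput, and streaming emits ImageDelta events whose delta carries bytes decoded by the new decodeBase64 helper. A consumer sketch follows; the AsyncIterable stream shape and the exact StreamEvent typing are assumptions, while the ImageDelta payload (a Uint8Array per event, with index identifying the image) matches transformStreamChunk above:

```typescript
import { StreamEventType } from '@providerprotocol/ai';

// Collect raw image bytes from a streamed Gemini response. Events with the
// same index belong to the same image; this sketch assumes a single image.
async function collectImageBytes(
  events: AsyncIterable<{ type: string; index?: number; delta?: { data?: Uint8Array } }>
): Promise<Uint8Array> {
  const chunks: Uint8Array[] = [];
  let total = 0;
  for await (const event of events) {
    if (event.type === StreamEventType.ImageDelta && event.delta?.data) {
      chunks.push(event.delta.data); // decodeBase64() output per chunk
      total += event.delta.data.length;
    }
  }
  // Concatenate the chunks into one buffer.
  const out = new Uint8Array(total);
  let offset = 0;
  for (const c of chunks) {
    out.set(c, offset);
    offset += c.length;
  }
  return out;
}
```

Non-streaming responses carry the same images as base64 content blocks of the form { type: 'image', mimeType, source: { type: 'base64', data } }, as transformResponse and buildResponseFromState show; only the streaming path decodes to bytes eagerly.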