npm - @providerprotocol/ai - Versions diffs - 0.0.7 → 0.0.9 - Mend

@providerprotocol/ai 0.0.7 → 0.0.9

This diff shows the differences between two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in their respective public registries.

Files changed (19) hide show

package/dist/anthropic/index.js +1 -1
package/dist/{chunk-QUUX4G7U.js → chunk-W4BB4BG2.js} +19 -1
package/dist/chunk-W4BB4BG2.js.map +1 -0
package/dist/google/index.js +1 -1
package/dist/index.d.ts +12 -0
package/dist/index.js +1 -1
package/dist/ollama/index.js +1 -1
package/dist/openai/index.d.ts +385 -14
package/dist/openai/index.js +110 -17
package/dist/openai/index.js.map +1 -1
package/dist/openrouter/index.js +1 -1
package/dist/xai/index.js +1 -1
package/package.json +1 -1
package/src/openai/index.ts +29 -1
package/src/providers/openai/index.ts +30 -0
package/src/providers/openai/transform.responses.ts +51 -19
package/src/providers/openai/types.ts +510 -16
package/src/types/messages.ts +24 -1
package/dist/chunk-QUUX4G7U.js.map +0 -1

package/src/providers/openai/transform.responses.ts CHANGED Viewed

@@ -3,7 +3,7 @@ import type { Message } from '../../types/messages.ts';
 import type { StreamEvent } from '../../types/stream.ts';
 import type { Tool, ToolCall } from '../../types/tool.ts';
 import type { TokenUsage } from '../../types/turn.ts';
-import type { ContentBlock, TextBlock, ImageBlock } from '../../types/content.ts';
+import type { ContentBlock, TextBlock, ImageBlock, AssistantContent } from '../../types/content.ts';
 import {
   AssistantMessage,
   isUserMessage,
@@ -16,11 +16,13 @@ import type {
   OpenAIResponsesInputItem,
   OpenAIResponsesContentPart,
   OpenAIResponsesTool,
+  OpenAIResponsesToolUnion,
   OpenAIResponsesResponse,
   OpenAIResponsesStreamEvent,
   OpenAIResponsesOutputItem,
   OpenAIResponsesMessageOutput,
   OpenAIResponsesFunctionCallOutput,
+  OpenAIResponsesImageGenerationOutput,
 } from './types.ts';
 /**
@@ -36,16 +38,23 @@ export function transformRequest(
 ): OpenAIResponsesRequest {
   const params = request.params ?? ({} as OpenAIResponsesParams);
+  // Extract built-in tools from params before spreading
+  const builtInTools = params.tools as OpenAIResponsesToolUnion[] | undefined;
+  const { tools: _paramsTools, ...restParams } = params;
   // Spread params to pass through all fields, then set required fields
   const openaiRequest: OpenAIResponsesRequest = {
-    ...params,
+    ...restParams,
     model: modelId,
     input: transformInputItems(request.messages, request.system),
   };
-  // Tools come from request, not params
-  if (request.tools && request.tools.length > 0) {
-    openaiRequest.tools = request.tools.map(transformTool);
+  // Merge tools: UPP function tools from request + built-in tools from params
+  const functionTools: OpenAIResponsesToolUnion[] = request.tools?.map(transformTool) ?? [];
+  const allTools: OpenAIResponsesToolUnion[] = [...functionTools, ...(builtInTools ?? [])];
+  if (allTools.length > 0) {
+    openaiRequest.tools = allTools;
   }
   // Structured output via text.format (overrides params.text if set)
@@ -276,8 +285,8 @@ function transformTool(tool: Tool): OpenAIResponsesTool {
  * Transform OpenAI Responses API response to UPP LLMResponse
  */
 export function transformResponse(data: OpenAIResponsesResponse): LLMResponse {
-  // Extract text content and tool calls from output items
-  const textContent: TextBlock[] = [];
+  // Extract content and tool calls from output items
+  const content: AssistantContent[] = [];
   const toolCalls: ToolCall[] = [];
   const functionCallItems: Array<{
     id: string;
@@ -291,20 +300,19 @@ export function transformResponse(data: OpenAIResponsesResponse): LLMResponse {
   for (const item of data.output) {
     if (item.type === 'message') {
       const messageItem = item as OpenAIResponsesMessageOutput;
-      for (const content of messageItem.content) {
-        if (content.type === 'output_text') {
-          textContent.push({ type: 'text', text: content.text });
+      for (const part of messageItem.content) {
+        if (part.type === 'output_text') {
+          content.push({ type: 'text', text: part.text });
           // Try to parse as JSON for structured output (native JSON mode)
-          // Only set data if text is valid JSON
           if (structuredData === undefined) {
             try {
-              structuredData = JSON.parse(content.text);
+              structuredData = JSON.parse(part.text);
             } catch {
               // Not valid JSON - that's fine, might not be structured output
             }
           }
-        } else if (content.type === 'refusal') {
-          textContent.push({ type: 'text', text: content.refusal });
+        } else if (part.type === 'refusal') {
+          content.push({ type: 'text', text: part.refusal });
           hadRefusal = true;
         }
       }
@@ -327,11 +335,20 @@ export function transformResponse(data: OpenAIResponsesResponse): LLMResponse {
         name: functionCall.name,
         arguments: functionCall.arguments,
       });
+    } else if (item.type === 'image_generation_call') {
+      const imageGen = item as OpenAIResponsesImageGenerationOutput;
+      if (imageGen.result) {
+        content.push({
+          type: 'image',
+          mimeType: 'image/png',
+          source: { type: 'base64', data: imageGen.result },
+        } as ImageBlock);
+      }
     }
   }
   const message = new AssistantMessage(
-    textContent,
+    content,
     toolCalls.length > 0 ? toolCalls : undefined,
     {
       id: data.id,
@@ -339,7 +356,6 @@ export function transformResponse(data: OpenAIResponsesResponse): LLMResponse {
         openai: {
           model: data.model,
           status: data.status,
-          // Store response_id for multi-turn tool calling
           response_id: data.id,
           functionCallItems:
             functionCallItems.length > 0 ? functionCallItems : undefined,
@@ -388,6 +404,7 @@ export interface ResponsesStreamState {
     number,
     { itemId?: string; callId?: string; name?: string; arguments: string }
   >;
+  images: string[]; // Base64 image data from image_generation_call outputs
   status: string;
   inputTokens: number;
   outputTokens: number;
@@ -403,6 +420,7 @@ export function createStreamState(): ResponsesStreamState {
     model: '',
     textByIndex: new Map(),
     toolCalls: new Map(),
+    images: [],
     status: 'in_progress',
     inputTokens: 0,
     outputTokens: 0,
@@ -479,6 +497,11 @@ export function transformStreamEvent(
           existing.arguments = functionCall.arguments;
         }
         state.toolCalls.set(event.output_index, existing);
+      } else if (event.item.type === 'image_generation_call') {
+        const imageGen = event.item as OpenAIResponsesImageGenerationOutput;
+        if (imageGen.result) {
+          state.images.push(imageGen.result);
+        }
       }
       events.push({
         type: 'content_block_stop',
@@ -579,13 +602,13 @@ export function transformStreamEvent(
  * Build LLMResponse from accumulated stream state
  */
 export function buildResponseFromState(state: ResponsesStreamState): LLMResponse {
-  const textContent: TextBlock[] = [];
+  const content: AssistantContent[] = [];
   let structuredData: unknown;
   // Combine all text content
   for (const [, text] of state.textByIndex) {
     if (text) {
-      textContent.push({ type: 'text', text });
+      content.push({ type: 'text', text });
       // Try to parse as JSON for structured output (native JSON mode)
       if (structuredData === undefined) {
         try {
@@ -597,6 +620,15 @@ export function buildResponseFromState(state: ResponsesStreamState): LLMResponse
     }
   }
+  // Add any generated images
+  for (const imageData of state.images) {
+    content.push({
+      type: 'image',
+      mimeType: 'image/png',
+      source: { type: 'base64', data: imageData },
+    } as ImageBlock);
+  }
   const toolCalls: ToolCall[] = [];
   const functionCallItems: Array<{
     id: string;
@@ -633,7 +665,7 @@ export function buildResponseFromState(state: ResponsesStreamState): LLMResponse
   }
   const message = new AssistantMessage(
-    textContent,
+    content,
     toolCalls.length > 0 ? toolCalls : undefined,
     {
       id: state.id,