npm - gsd-pi - Versions diffs - 2.23.0 → 2.25.0 - Mend

gsd-pi 2.23.0 → 2.25.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (212)

package/packages/pi-ai/src/providers/anthropic.ts — CHANGED

@@ -1,4 +1,6 @@
-import Anthropic from "@anthropic-ai/sdk";
+// Lazy-loaded: Anthropic SDK (~500ms) is imported on first use, not at startup.
+// This avoids penalizing users who don't use Anthropic models.
+import type Anthropic from "@anthropic-ai/sdk";
 import type {
 	ContentBlockParam,
 	MessageCreateParamsStreaming,
@@ -14,6 +16,7 @@ import type {
 	ImageContent,
 	Message,
 	Model,
+	ServerToolUseContent,
 	SimpleStreamOptions,
 	StopReason,
 	StreamFunction,
@@ -23,6 +26,7 @@ import type {
 	Tool,
 	ToolCall,
 	ToolResultMessage,
+	WebSearchResultContent,
 } from "../types.js";
 import { AssistantMessageEventStream } from "../utils/event-stream.js";
 import { parseStreamingJson } from "../utils/json-parse.js";
@@ -32,6 +36,15 @@ import { buildCopilotDynamicHeaders, hasCopilotVisionInput } from "./github-copi
 import { adjustMaxTokensForThinking, buildBaseOptions } from "./simple-options.js";
 import { transformMessages } from "./transform-messages.js";
+let _AnthropicClass: typeof Anthropic | undefined;
+async function getAnthropicClass(): Promise<typeof Anthropic> {
+	if (!_AnthropicClass) {
+		const mod = await import("@anthropic-ai/sdk");
+		_AnthropicClass = mod.default;
+	}
+	return _AnthropicClass;
+}
 /**
  * Resolve cache retention preference.
  * Defaults to "short" and uses PI_CACHE_RETENTION for backward compatibility.
@@ -265,7 +278,7 @@ export const streamAnthropic: StreamFunction<"anthropic-messages", AnthropicOpti
 				});
 			}
-			const { client, isOAuthToken } = createClient(
+			const { client, isOAuthToken } = await createClient(
 				model,
 				apiKey,
 				options?.interleavedThinking ?? true,
@@ -280,7 +293,7 @@ export const streamAnthropic: StreamFunction<"anthropic-messages", AnthropicOpti
 			const anthropicStream = client.messages.stream({ ...params, stream: true }, { signal: options?.signal });
 			stream.push({ type: "start", partial: output });
-			type Block = (ThinkingContent | TextContent | (ToolCall & { partialJson: string })) & { index: number };
+			type Block = (ThinkingContent | TextContent | (ToolCall & { partialJson: string }) | ServerToolUseContent | WebSearchResultContent) & { index: number };
 			const blocks = output.content as Block[];
 			for await (const event of anthropicStream) {
@@ -336,6 +349,27 @@ export const streamAnthropic: StreamFunction<"anthropic-messages", AnthropicOpti
 						};
 						output.content.push(block);
 						stream.push({ type: "toolcall_start", contentIndex: output.content.length - 1, partial: output });
+					} else if ((event.content_block as any).type === "server_tool_use") {
+						const serverBlock = event.content_block as any;
+						const block: Block = {
+							type: "serverToolUse",
+							id: serverBlock.id,
+							name: serverBlock.name,
+							input: serverBlock.input,
+							index: event.index,
+						};
+						output.content.push(block);
+						stream.push({ type: "server_tool_use", contentIndex: output.content.length - 1, partial: output });
+					} else if ((event.content_block as any).type === "web_search_tool_result") {
+						const resultBlock = event.content_block as any;
+						const block: Block = {
+							type: "webSearchResult",
+							toolUseId: resultBlock.tool_use_id,
+							content: resultBlock.content,
+							index: event.index,
+						};
+						output.content.push(block);
+						stream.push({ type: "web_search_result", contentIndex: output.content.length - 1, partial: output });
 					}
 				} else if (event.type === "content_block_delta") {
 					if (event.delta.type === "text_delta") {
@@ -412,6 +446,7 @@ export const streamAnthropic: StreamFunction<"anthropic-messages", AnthropicOpti
 								partial: output,
 							});
 						}
+						// serverToolUse and webSearchResult blocks just need index cleanup (already emitted on start)
 					}
 				} else if (event.type === "message_delta") {
 					if (event.delta.stop_reason) {
@@ -455,7 +490,8 @@ export const streamAnthropic: StreamFunction<"anthropic-messages", AnthropicOpti
 			if (model.provider === "alibaba-coding-plan") {
 				output.errorMessage = `[alibaba-coding-plan] ${output.errorMessage}`;
 			}
-			if (error instanceof Anthropic.APIError && error.headers) {
+			const AnthropicSdk = _AnthropicClass;
+			if (AnthropicSdk && error instanceof AnthropicSdk.APIError && error.headers) {
 				const retryAfterMs = extractRetryAfterMs(error.headers, error.message);
 				if (retryAfterMs !== undefined) {
 					output.retryAfterMs = retryAfterMs;
@@ -548,13 +584,14 @@ function isOAuthToken(apiKey: string): boolean {
 	return apiKey.includes("sk-ant-oat");
 }
-function createClient(
+async function createClient(
 	model: Model<"anthropic-messages">,
 	apiKey: string,
 	interleavedThinking: boolean,
 	optionsHeaders?: Record<string, string>,
 	dynamicHeaders?: Record<string, string>,
-): { client: Anthropic; isOAuthToken: boolean } {
+): Promise<{ client: Anthropic; isOAuthToken: boolean }> {
+	const AnthropicClass = await getAnthropicClass();
 	// Adaptive thinking models (Opus 4.6, Sonnet 4.6) have interleaved thinking built-in.
 	// The beta header is deprecated on Opus 4.6 and redundant on Sonnet 4.6, so skip it.
 	const needsInterleavedBeta = interleavedThinking && !supportsAdaptiveThinking(model.id);
@@ -566,7 +603,7 @@ function createClient(
 			betaFeatures.push("interleaved-thinking-2025-05-14");
 		}
-		const client = new Anthropic({
+		const client = new AnthropicClass({
 			apiKey: null,
 			authToken: apiKey,
 			baseURL: model.baseUrl,
@@ -595,7 +632,7 @@ function createClient(
 	// OAuth: Bearer auth, Claude Code identity headers
 	if (isOAuthToken(apiKey)) {
-		const client = new Anthropic({
+		const client = new AnthropicClass({
 			apiKey: null,
 			authToken: apiKey,
 			baseURL: model.baseUrl,
@@ -619,7 +656,7 @@ function createClient(
 	// API key auth
 	// Alibaba Coding Plan uses Bearer token auth instead of x-api-key
 	const isAlibabaProvider = model.provider === "alibaba-coding-plan";
-	const client = new Anthropic({
+	const client = new AnthropicClass({
 		apiKey: isAlibabaProvider ? null : apiKey,
 		authToken: isAlibabaProvider ? apiKey : undefined,
 		baseURL: model.baseUrl,
@@ -827,6 +864,19 @@ function convertMessages(
 						name: isOAuthToken ? toClaudeCodeName(block.name) : block.name,
 						input: block.arguments ?? {},
 					});
+				} else if (block.type === "serverToolUse") {
+					blocks.push({
+						type: "server_tool_use",
+						id: block.id,
+						name: block.name,
+						input: block.input ?? {},
+					} as any);
+				} else if (block.type === "webSearchResult") {
+					blocks.push({
+						type: "web_search_tool_result",
+						tool_use_id: block.toolUseId,
+						content: block.content,
+					} as any);
 				}
 			}
 			if (blocks.length === 0) continue;

package/packages/pi-ai/src/providers/azure-openai-responses.ts — CHANGED

@@ -1,4 +1,6 @@
-import { AzureOpenAI } from "openai";
+// Lazy-loaded: OpenAI SDK (AzureOpenAI) is imported on first use, not at startup.
+// This avoids penalizing users who don't use Azure OpenAI models.
+import type { AzureOpenAI } from "openai";
 import type { ResponseCreateParamsStreaming } from "openai/resources/responses/responses.js";
 import { getEnvApiKey } from "../env-api-keys.js";
 import { supportsXhigh } from "../models.js";
@@ -15,6 +17,15 @@ import { AssistantMessageEventStream } from "../utils/event-stream.js";
 import { convertResponsesMessages, convertResponsesTools, processResponsesStream } from "./openai-responses-shared.js";
 import { buildBaseOptions, clampReasoning } from "./simple-options.js";
+let _AzureOpenAIClass: typeof AzureOpenAI | undefined;
+async function getAzureOpenAIClass(): Promise<typeof AzureOpenAI> {
+	if (!_AzureOpenAIClass) {
+		const mod = await import("openai");
+		_AzureOpenAIClass = mod.AzureOpenAI;
+	}
+	return _AzureOpenAIClass;
+}
 /**
  * Clamp reasoning effort for models that don't support all levels.
  * gpt-5.x models don't support "minimal" — map to "low".
@@ -94,7 +105,7 @@ export const streamAzureOpenAIResponses: StreamFunction<"azure-openai-responses"
 		try {
 			// Create Azure OpenAI client
 			const apiKey = options?.apiKey || getEnvApiKey(model.provider) || "";
-			const client = createClient(model, apiKey, options);
+			const client = await createClient(model, apiKey, options);
 			let params = buildParams(model, context, options, deploymentName);
 			const nextParams = await options?.onPayload?.(params, model);
 			if (nextParams !== undefined) {
@@ -188,7 +199,7 @@ function resolveAzureConfig(
 	};
 }
-function createClient(model: Model<"azure-openai-responses">, apiKey: string, options?: AzureOpenAIResponsesOptions) {
+async function createClient(model: Model<"azure-openai-responses">, apiKey: string, options?: AzureOpenAIResponsesOptions) {
 	if (!apiKey) {
 		if (!process.env.AZURE_OPENAI_API_KEY) {
 			throw new Error(
@@ -205,8 +216,9 @@ function createClient(model: Model<"azure-openai-responses">, apiKey: string, op
 	}
 	const { baseUrl, apiVersion } = resolveAzureConfig(model, options);
+	const AzureOpenAIClass = await getAzureOpenAIClass();
-	return new AzureOpenAI({
+	return new AzureOpenAIClass({
 		apiKey,
 		apiVersion,
 		dangerouslyAllowBrowser: true,

package/packages/pi-ai/src/providers/google-vertex.ts — CHANGED

@@ -1,9 +1,10 @@
-import {
-	type GenerateContentConfig,
-	type GenerateContentParameters,
-	GoogleGenAI,
-	type ThinkingConfig,
-	ThinkingLevel,
+// Lazy-loaded: Google GenAI SDK is imported on first use, not at startup.
+// This avoids penalizing users who don't use Google Vertex models.
+import type { GoogleGenAI } from "@google/genai";
+import type {
+	GenerateContentConfig,
+	GenerateContentParameters,
+	ThinkingConfig,
 } from "@google/genai";
 import { calculateCost } from "../models.js";
 import type {
@@ -33,6 +34,15 @@ import {
 } from "./google-shared.js";
 import { buildBaseOptions, clampReasoning } from "./simple-options.js";
+let _GoogleVertexClass: typeof GoogleGenAI | undefined;
+async function getGoogleVertexClass(): Promise<typeof GoogleGenAI> {
+	if (!_GoogleVertexClass) {
+		const mod = await import("@google/genai");
+		_GoogleVertexClass = mod.GoogleGenAI;
+	}
+	return _GoogleVertexClass;
+}
 export interface GoogleVertexOptions extends StreamOptions {
 	toolChoice?: "auto" | "none" | "any";
 	thinking?: {
@@ -46,12 +56,14 @@ export interface GoogleVertexOptions extends StreamOptions {
 const API_VERSION = "v1";
-const THINKING_LEVEL_MAP: Record<GoogleThinkingLevel, ThinkingLevel> = {
-	THINKING_LEVEL_UNSPECIFIED: ThinkingLevel.THINKING_LEVEL_UNSPECIFIED,
-	MINIMAL: ThinkingLevel.MINIMAL,
-	LOW: ThinkingLevel.LOW,
-	MEDIUM: ThinkingLevel.MEDIUM,
-	HIGH: ThinkingLevel.HIGH,
+// ThinkingLevel is a string enum where each value equals its key name.
+// Using string literals avoids importing the SDK at module load time.
+const THINKING_LEVEL_MAP: Record<GoogleThinkingLevel, string> = {
+	THINKING_LEVEL_UNSPECIFIED: "THINKING_LEVEL_UNSPECIFIED",
+	MINIMAL: "MINIMAL",
+	LOW: "LOW",
+	MEDIUM: "MEDIUM",
+	HIGH: "HIGH",
 };
 // Counter for generating unique tool call IDs
@@ -86,7 +98,7 @@ export const streamGoogleVertex: StreamFunction<"google-vertex", GoogleVertexOpt
 		try {
 			const project = resolveProject(options);
 			const location = resolveLocation(options);
-			const client = createClient(model, project, location, options?.headers);
+			const client = await createClient(model, project, location, options?.headers);
 			let params = buildParams(model, context, options);
 			const nextParams = await options?.onPayload?.(params, model);
 			if (nextParams !== undefined) {
@@ -318,12 +330,12 @@ export const streamSimpleGoogleVertex: StreamFunction<"google-vertex", SimpleStr
 	} satisfies GoogleVertexOptions);
 };
-function createClient(
+async function createClient(
 	model: Model<"google-vertex">,
 	project: string,
 	location: string,
 	optionsHeaders?: Record<string, string>,
-): GoogleGenAI {
+): Promise<GoogleGenAI> {
 	const httpOptions: { headers?: Record<string, string> } = {};
 	if (model.headers || optionsHeaders) {
@@ -331,8 +343,9 @@ function createClient(
 	}
 	const hasHttpOptions = Object.values(httpOptions).some(Boolean);
+	const GoogleGenAIClass = await getGoogleVertexClass();
-	return new GoogleGenAI({
+	return new GoogleGenAIClass({
 		vertexai: true,
 		project,
 		location,
@@ -393,7 +406,9 @@ function buildParams(
 	if (options.thinking?.enabled && model.reasoning) {
 		const thinkingConfig: ThinkingConfig = { includeThoughts: true };
 		if (options.thinking.level !== undefined) {
-			thinkingConfig.thinkingLevel = THINKING_LEVEL_MAP[options.thinking.level];
+			// Cast safe: string values match ThinkingLevel enum values exactly
+			// eslint-disable-next-line @typescript-eslint/no-explicit-any
+			thinkingConfig.thinkingLevel = THINKING_LEVEL_MAP[options.thinking.level] as any;
 		} else if (options.thinking.budgetTokens !== undefined) {
 			thinkingConfig.thinkingBudget = options.thinking.budgetTokens;
 		}

package/packages/pi-ai/src/providers/mistral.ts — CHANGED

@@ -501,6 +501,9 @@ function toChatMessages(messages: Message[], supportsImages: boolean): ChatCompl
 					}
 					continue;
 				}
+				if (block.type !== "toolCall") {
+					continue;
+				}
 				toolCalls.push({
 					id: block.id,
 					type: "function",

package/packages/pi-ai/src/providers/openai-completions.ts — CHANGED

@@ -1,4 +1,6 @@
-import OpenAI from "openai";
+// Lazy-loaded: OpenAI SDK is imported on first use, not at startup.
+// This avoids penalizing users who don't use OpenAI models.
+import type OpenAI from "openai";
 import type {
 	ChatCompletionAssistantMessageParam,
 	ChatCompletionChunk,
@@ -33,6 +35,15 @@ import { buildCopilotDynamicHeaders, hasCopilotVisionInput } from "./github-copi
 import { buildBaseOptions, clampReasoning } from "./simple-options.js";
 import { transformMessages } from "./transform-messages.js";
+let _OpenAICompletionsClass: typeof OpenAI | undefined;
+async function getOpenAICompletionsClass(): Promise<typeof OpenAI> {
+	if (!_OpenAICompletionsClass) {
+		const mod = await import("openai");
+		_OpenAICompletionsClass = mod.default;
+	}
+	return _OpenAICompletionsClass;
+}
 /**
  * Check if conversation messages contain tool calls or tool results.
  * This is needed because Anthropic (via proxy) requires the tools param
@@ -85,7 +96,7 @@ export const streamOpenAICompletions: StreamFunction<"openai-completions", OpenA
 		try {
 			const apiKey = options?.apiKey || getEnvApiKey(model.provider) || "";
-			const client = createClient(model, context, apiKey, options?.headers);
+			const client = await createClient(model, context, apiKey, options?.headers);
 			let params = buildParams(model, context, options);
 			const nextParams = await options?.onPayload?.(params, model);
 			if (nextParams !== undefined) {
@@ -327,7 +338,7 @@ export const streamSimpleOpenAICompletions: StreamFunction<"openai-completions",
 	} satisfies OpenAICompletionsOptions);
 };
-function createClient(
+async function createClient(
 	model: Model<"openai-completions">,
 	context: Context,
 	apiKey?: string,
@@ -358,8 +369,9 @@ function createClient(
 	}
 	const isZai = model.provider === "zai" || model.baseUrl.includes("api.z.ai");
+	const OpenAIClass = await getOpenAICompletionsClass();
-	return new OpenAI({
+	return new OpenAIClass({
 		apiKey,
 		baseURL: model.baseUrl,
 		dangerouslyAllowBrowser: true,

package/packages/pi-ai/src/providers/openai-responses.ts — CHANGED

@@ -1,4 +1,6 @@
-import OpenAI from "openai";
+// Lazy-loaded: OpenAI SDK is imported on first use, not at startup.
+// This avoids penalizing users who don't use OpenAI models.
+import type OpenAI from "openai";
 import type { ResponseCreateParamsStreaming } from "openai/resources/responses/responses.js";
 import { getEnvApiKey } from "../env-api-keys.js";
 import { supportsXhigh } from "../models.js";
@@ -18,6 +20,15 @@ import { buildCopilotDynamicHeaders, hasCopilotVisionInput } from "./github-copi
 import { convertResponsesMessages, convertResponsesTools, processResponsesStream } from "./openai-responses-shared.js";
 import { buildBaseOptions, clampReasoning } from "./simple-options.js";
+let _OpenAIResponsesClass: typeof OpenAI | undefined;
+async function getOpenAIResponsesClass(): Promise<typeof OpenAI> {
+	if (!_OpenAIResponsesClass) {
+		const mod = await import("openai");
+		_OpenAIResponsesClass = mod.default;
+	}
+	return _OpenAIResponsesClass;
+}
 /**
  * Clamp reasoning effort for models that don't support all levels.
  * gpt-5.x models don't support "minimal" — map to "low".
@@ -98,7 +109,7 @@ export const streamOpenAIResponses: StreamFunction<"openai-responses", OpenAIRes
 		try {
 			// Create OpenAI client
 			const apiKey = options?.apiKey || getEnvApiKey(model.provider) || "";
-			const client = createClient(model, context, apiKey, options?.headers);
+			const client = await createClient(model, context, apiKey, options?.headers);
 			let params = buildParams(model, context, options);
 			const nextParams = await options?.onPayload?.(params, model);
 			if (nextParams !== undefined) {
@@ -156,7 +167,7 @@ export const streamSimpleOpenAIResponses: StreamFunction<"openai-responses", Sim
 	} satisfies OpenAIResponsesOptions);
 };
-function createClient(
+async function createClient(
 	model: Model<"openai-responses">,
 	context: Context,
 	apiKey?: string,
@@ -186,7 +197,8 @@ function createClient(
 		Object.assign(headers, optionsHeaders);
 	}
-	return new OpenAI({
+	const OpenAIClass = await getOpenAIResponsesClass();
+	return new OpenAIClass({
 		apiKey,
 		baseURL: model.baseUrl,
 		dangerouslyAllowBrowser: true,

package/packages/pi-ai/src/types.ts — CHANGED

@@ -159,6 +159,22 @@ export interface ToolCall {
 	thoughtSignature?: string; // Google-specific: opaque signature for reusing thought context
 }
+/** Server-side tool use (e.g., Anthropic native web search). Executed by the API, not the client. */
+export interface ServerToolUseContent {
+	type: "serverToolUse";
+	id: string;
+	name: string; // e.g., "web_search"
+	input: unknown;
+}
+/** Result of a server-side tool execution, paired with a ServerToolUseContent by toolUseId. */
+export interface WebSearchResultContent {
+	type: "webSearchResult";
+	toolUseId: string;
+	/** Search results or error from the server. Opaque — stored for API replay. */
+	content: unknown;
+}
 export interface Usage {
 	input: number;
 	output: number;
@@ -184,7 +200,7 @@ export interface UserMessage {
 export interface AssistantMessage {
 	role: "assistant";
-	content: (TextContent | ThinkingContent | ToolCall)[];
+	content: (TextContent | ThinkingContent | ToolCall | ServerToolUseContent | WebSearchResultContent)[];
 	api: Api;
 	provider: Provider;
 	model: string;
@@ -233,6 +249,8 @@ export type AssistantMessageEvent =
 	| { type: "toolcall_start"; contentIndex: number; partial: AssistantMessage }
 	| { type: "toolcall_delta"; contentIndex: number; delta: string; partial: AssistantMessage }
 	| { type: "toolcall_end"; contentIndex: number; toolCall: ToolCall; partial: AssistantMessage }
+	| { type: "server_tool_use"; contentIndex: number; partial: AssistantMessage }
+	| { type: "web_search_result"; contentIndex: number; partial: AssistantMessage }
 	| { type: "done"; reason: Extract<StopReason, "stop" | "length" | "toolUse">; message: AssistantMessage }
 	| { type: "error"; reason: Extract<StopReason, "aborted" | "error">; error: AssistantMessage };

package/packages/pi-coding-agent/dist/core/agent-session.js — CHANGED

@@ -2041,7 +2041,7 @@ export class AgentSession {
         if (message.retryAfterMs !== undefined) {
             const cap = settings.maxDelayMs > 0 ? settings.maxDelayMs : Infinity;
             if (message.retryAfterMs > cap) {
-                // Server wants us to wait longer than our max — give up immediately
+                // Server wants us to wait longer than maxDelayMs — give up to let auto-mode handle recovery
                 this._emit({
                     type: "auto_retry_end",
                     success: false,