npm - pi-sap-aicore - Versions diffs - 0.1.0 - Mend

pi-sap-aicore 0.1.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (17) hide show

package/LICENSE +21 -0
package/README.md +296 -0
package/index.ts +68 -0
package/package.json +40 -0
package/scripts/diagnose-streaming.mjs +99 -0
package/scripts/list-sap-models.mjs +92 -0
package/scripts/update-models.mjs +107 -0
package/src/auth.ts +104 -0
package/src/foundation-params.ts +55 -0
package/src/models-config.ts +93 -0
package/src/models-snapshot.json +527 -0
package/src/stream-foundation.ts +361 -0
package/src/stream.ts +1051 -0
package/src/to-pi-model.ts +21 -0
package/src/translate-foundation.ts +154 -0
package/src/translate.ts +218 -0
package/tsconfig.json +16 -0

package/src/to-pi-model.ts ADDED Viewed

@@ -0,0 +1,21 @@
+import type { Api } from "@earendil-works/pi-ai";
+import type { ProviderModelConfig } from "@earendil-works/pi-coding-agent";
+import type { SapModel } from "./models-config.ts";
+/**
+ * Builds a `ProviderModelConfig` from a SAP model entry.
+ *
+ * Only the "text" and "image" input modalities are carried over; any other
+ * modality listed on the SAP entry is left out of `input`.
+ *
+ * @param model - SAP model entry to convert.
+ * @param api - API identifier copied verbatim onto the result.
+ * @returns The converted model configuration.
+ */
+export function toPiModel(model: SapModel, api: Api): ProviderModelConfig {
+	const supportedInputs: ("text" | "image")[] = [];
+	for (const modality of model.modalities.input) {
+		if (modality === "text" || modality === "image") {
+			supportedInputs.push(modality);
+		}
+	}
+	const { id, name, reasoning, cost, limit, thinkingLevelMap } = model;
+	return {
+		id,
+		name,
+		api,
+		reasoning,
+		input: supportedInputs,
+		cost,
+		contextWindow: limit.context,
+		maxTokens: limit.output,
+		thinkingLevelMap,
+	};
+}

package/src/translate-foundation.ts ADDED Viewed

@@ -0,0 +1,154 @@
+import type {
+	AssistantMessage,
+	Context,
+	Message,
+	TextContent,
+	Tool,
+	ToolResultMessage,
+	UserMessage,
+} from "@earendil-works/pi-ai";
+import type {
+	AzureOpenAiChatCompletionRequestAssistantMessage,
+	AzureOpenAiChatCompletionRequestMessage,
+	AzureOpenAiChatCompletionRequestToolMessage,
+	AzureOpenAiChatCompletionRequestUserMessage,
+	AzureOpenAiChatCompletionTool,
+} from "@sap-ai-sdk/foundation-models";
+// pi `Context` → Azure OpenAI chat request. This is the orchestration
+// `translate.ts` minus the Anthropic `cache_control` tagging — that is an
+// Anthropic-via-orchestration concern and has no meaning on the direct
+// OpenAI endpoint, so the foundation path is strictly simpler. The Azure
+// message/content/tool shapes are the standard OpenAI ones (each carries an
+// `& Record<string, any>` escape hatch), so inline literals type-check
+// against the message-level types without importing the content-part types
+// (which the package doesn't re-export from its root).
+/**
+ * Translates a pi context into Azure OpenAI chat messages and tools.
+ *
+ * The system prompt, when non-empty, becomes the first message. Each pi
+ * message is translated in order. Synthetic user messages produced while
+ * translating a tool result (hoisted images) are held back and emitted after
+ * the last tool result of the same consecutive run.
+ *
+ * @param context - pi context holding the system prompt, messages and tools.
+ * @returns The translated `messages` and `tools` (empty array when the
+ *   context has no tools).
+ */
+export function piContextToAzureOpenAi(context: Context): {
+	messages: AzureOpenAiChatCompletionRequestMessage[];
+	tools: AzureOpenAiChatCompletionTool[];
+} {
+	const messages: AzureOpenAiChatCompletionRequestMessage[] = [];
+	if (context.systemPrompt) {
+		messages.push({ role: "system", content: context.systemPrompt });
+	}
+	// The Chat Completions API requires the `tool` replies to an assistant
+	// `tool_calls` message to follow it with no other role in between. With
+	// parallel tool calls, emitting a hoisted image message straight after
+	// the first tool result would split the run, so those messages wait here
+	// until the run of tool results is over.
+	let deferred: AzureOpenAiChatCompletionRequestMessage[] = [];
+	for (const msg of context.messages) {
+		const translated = piMessageToAzureOpenAi(msg);
+		if (msg.role === "toolResult") {
+			for (const out of translated) {
+				if (out.role === "tool") {
+					messages.push(out);
+				} else {
+					deferred.push(out);
+				}
+			}
+			continue;
+		}
+		// A non-tool-result message ends the run: flush what was held back.
+		if (deferred.length > 0) {
+			messages.push(...deferred);
+			deferred = [];
+		}
+		messages.push(...translated);
+	}
+	// The conversation may end on a tool result; nothing must be lost.
+	messages.push(...deferred);
+	const tools = (context.tools ?? []).map(piToolToAzureOpenAi);
+	return { messages, tools };
+}
+/**
+ * Dispatches one pi message to the translator for its role.
+ *
+ * @param msg - pi message to translate.
+ * @returns One message for "user" and "assistant"; whatever
+ *   `piToolResultToAzureOpenAi` returns for "toolResult".
+ * @throws Error when `msg.role` is none of the three handled roles.
+ */
+function piMessageToAzureOpenAi(
+	msg: Message,
+): AzureOpenAiChatCompletionRequestMessage[] {
+	switch (msg.role) {
+		case "user":
+			return [piUserToAzureOpenAi(msg)];
+		case "assistant":
+			return [piAssistantToAzureOpenAi(msg)];
+		case "toolResult":
+			return piToolResultToAzureOpenAi(msg);
+		default:
+			// Without this branch an unexpected role yields `undefined`, and the
+			// caller's spread fails with an unhelpful "not iterable" TypeError.
+			throw new Error(
+				`Unsupported pi message role: ${String((msg as { role?: unknown }).role)}`,
+			);
+	}
+}
+/**
+ * Translates a pi user message into an Azure OpenAI user message.
+ *
+ * String content is passed through unchanged. Array content is mapped item
+ * by item: text parts stay text, every other part becomes an `image_url`
+ * item carrying a base64 data URL built from `mimeType` and `data`.
+ *
+ * @param msg - pi user message.
+ * @returns The equivalent message with role "user".
+ */
+function piUserToAzureOpenAi(
+	msg: UserMessage,
+): AzureOpenAiChatCompletionRequestUserMessage {
+	const { content } = msg;
+	if (typeof content === "string") {
+		return { role: "user", content };
+	}
+	const parts = content.map((part) => {
+		if (part.type === "text") {
+			return { type: "text" as const, text: part.text };
+		}
+		const url = `data:${part.mimeType};base64,${part.data}`;
+		return { type: "image_url" as const, image_url: { url } };
+	});
+	return { role: "user", content: parts };
+}
+/**
+ * Translates a pi assistant message into an Azure OpenAI assistant message.
+ *
+ * Text blocks are concatenated in order; tool-call blocks become `function`
+ * tool calls whose arguments are JSON-serialised. Other block types are
+ * skipped.
+ *
+ * @param msg - pi assistant message.
+ * @returns The assistant message; `tool_calls` is set only when at least one
+ *   tool call was found.
+ */
+function piAssistantToAzureOpenAi(
+	msg: AssistantMessage,
+): AzureOpenAiChatCompletionRequestAssistantMessage {
+	let combinedText = "";
+	const calls: {
+		id: string;
+		type: "function";
+		function: { name: string; arguments: string };
+	}[] = [];
+	for (const block of msg.content) {
+		switch (block.type) {
+			case "text":
+				combinedText += block.text;
+				break;
+			case "toolCall":
+				calls.push({
+					id: block.id,
+					type: "function",
+					function: {
+						name: block.name,
+						arguments: JSON.stringify(block.arguments),
+					},
+				});
+				break;
+		}
+	}
+	// OpenAI rejects an assistant message that has neither content nor
+	// tool_calls. As on the orchestration path, a lone space stands in when
+	// both are missing so the conversation keeps its 1:1 alternation with
+	// pi's log.
+	let content: string;
+	if (combinedText) {
+		content = combinedText;
+	} else if (calls.length === 0) {
+		content = " ";
+	} else {
+		content = "";
+	}
+	const assistant: AzureOpenAiChatCompletionRequestAssistantMessage = {
+		role: "assistant",
+		content,
+	};
+	if (calls.length > 0) {
+		assistant.tool_calls = calls;
+	}
+	return assistant;
+}
+/**
+ * Translates a pi tool result into Azure OpenAI messages.
+ *
+ * The text parts are joined with newlines into a single `tool` message. The
+ * tool message schema is text-only, so image parts (e.g. from pi's `read`
+ * tool on an image) are returned in an additional synthetic user message
+ * placed after the tool message, letting vision-capable models see them.
+ *
+ * @param msg - pi tool result message.
+ * @returns `[toolMessage]`, or `[toolMessage, imageMessage]` when the result
+ *   contains at least one image.
+ */
+function piToolResultToAzureOpenAi(
+	msg: ToolResultMessage,
+): AzureOpenAiChatCompletionRequestMessage[] {
+	const textChunks: string[] = [];
+	const imageParts: { type: "image_url"; image_url: { url: string } }[] = [];
+	for (const part of msg.content) {
+		if (part.type === "text") {
+			textChunks.push(part.text);
+		} else if (part.type === "image") {
+			imageParts.push({
+				type: "image_url",
+				image_url: { url: `data:${part.mimeType};base64,${part.data}` },
+			});
+		}
+	}
+	const toolMessage: AzureOpenAiChatCompletionRequestToolMessage = {
+		role: "tool",
+		tool_call_id: msg.toolCallId,
+		content: textChunks.join("\n"),
+	};
+	if (imageParts.length === 0) {
+		return [toolMessage];
+	}
+	const imageMessage: AzureOpenAiChatCompletionRequestUserMessage = {
+		role: "user",
+		content: imageParts,
+	};
+	return [toolMessage, imageMessage];
+}
+/**
+ * Wraps a pi tool definition as an Azure OpenAI `function` tool.
+ *
+ * @param tool - pi tool whose name, description and parameters are copied.
+ * @returns The tool in Azure OpenAI shape.
+ */
+function piToolToAzureOpenAi(tool: Tool): AzureOpenAiChatCompletionTool {
+	const { name, description } = tool;
+	// The parameter schema is passed through untouched; only its static type
+	// is widened to the record type the SDK expects.
+	const parameters = tool.parameters as unknown as Record<string, unknown>;
+	return {
+		type: "function",
+		function: { name, description, parameters },
+	};
+}

package/src/translate.ts ADDED Viewed

@@ -0,0 +1,218 @@
+import type {
+	AssistantMessage,
+	Context,
+	Message,
+	TextContent,
+	Tool,
+	ToolResultMessage,
+	UserMessage,
+} from "@earendil-works/pi-ai";
+import type {
+	AssistantChatMessage,
+	ChatCompletionTool,
+	ChatMessage,
+	UserChatMessageContent,
+	UserChatMessageContentItem,
+} from "@sap-ai-sdk/orchestration";
+// Anthropic prompt caching via SAP orchestration is undocumented. SAP's
+// ChatMessage schemas are strictly typed (no Record<string,any> escape
+// hatch on content), `cache_control` appears nowhere in
+// @sap-ai-sdk/orchestration, and the orchestration server may reject
+// unknown fields with a 400. Opt-in via PI_SAP_AICORE_CACHE_CONTROL=1 so
+// users can probe their own tenant without forcing the risk on everyone
+// — if SAP accepts it, `cacheRead`/`cacheWrite` in the Usage block start
+// reporting non-zero numbers and pi's cost line drops ~10× on cached
+// turns. If SAP rejects it, the error chain will say so.
+/** True only when the PI_SAP_AICORE_CACHE_CONTROL environment variable is exactly "1". */
+const CACHE_CONTROL_ENABLED =
+	process.env["PI_SAP_AICORE_CACHE_CONTROL"] === "1";
+/** Shape of the cache marker attached to tagged content items. */
+type CacheControl = { type: "ephemeral" };
+/** The one marker value shared by every tagged content item. */
+const EPHEMERAL: CacheControl = { type: "ephemeral" };
+/**
+ * Translates a pi context into SAP orchestration chat messages and tools.
+ *
+ * The system prompt, when non-empty, becomes the first message. Each pi
+ * message is translated in order. Synthetic user messages produced while
+ * translating a tool result (hoisted images) are held back and emitted after
+ * the last tool result of the same consecutive run. When cache control is
+ * enabled, the system prompt and the last pi user message are tagged.
+ *
+ * @param context - pi context holding the system prompt, messages and tools.
+ * @returns The translated `messages` and `tools` (empty array when the
+ *   context has no tools).
+ */
+export function piContextToOrchestration(context: Context): {
+	messages: ChatMessage[];
+	tools: ChatCompletionTool[];
+} {
+	const messages: ChatMessage[] = [];
+	if (context.systemPrompt) {
+		messages.push(
+			tagCacheControl(
+				{ role: "system", content: context.systemPrompt },
+				CACHE_CONTROL_ENABLED,
+			),
+		);
+	}
+	const pi = context.messages;
+	// Anthropic caches up to 4 breakpoints; tagging the LAST user message
+	// (after the system prompt) is the standard "keep the long prefix
+	// cached" pattern. We tag at most 1 here for safety; expand later
+	// once SAP behaviour is confirmed.
+	const lastUserIdx = lastIndexWhere(pi, (m) => m.role === "user");
+	// Tool replies to one assistant `tool_calls` message must stay
+	// consecutive (OpenAI-style chat contract; presumably also required by
+	// the models behind SAP orchestration — confirm against your tenant).
+	// Hoisted image messages therefore wait here until the run of tool
+	// results is over instead of being interleaved between tool messages.
+	let deferred: ChatMessage[] = [];
+	for (let i = 0; i < pi.length; i++) {
+		const translated = piMessageToOrchestration(pi[i]);
+		if (pi[i].role === "toolResult") {
+			for (const out of translated) {
+				if (out.role === "tool") {
+					messages.push(out);
+				} else {
+					deferred.push(out);
+				}
+			}
+			continue;
+		}
+		// A non-tool-result message ends the run: flush what was held back.
+		if (deferred.length > 0) {
+			messages.push(...deferred);
+			deferred = [];
+		}
+		const tagLast = CACHE_CONTROL_ENABLED && i === lastUserIdx;
+		if (tagLast && translated.length > 0) {
+			translated[translated.length - 1] = tagCacheControl(
+				translated[translated.length - 1],
+				true,
+			);
+		}
+		messages.push(...translated);
+	}
+	// The conversation may end on a tool result; nothing must be lost.
+	messages.push(...deferred);
+	const tools = (context.tools ?? []).map(piToolToOrchestration);
+	return { messages, tools };
+}
+/**
+ * Finds the index of the last element that satisfies a predicate.
+ *
+ * @param arr - Array to search, scanned from the end towards the start.
+ * @param pred - Test applied to each element.
+ * @returns The highest matching index, or -1 when nothing matches.
+ */
+function lastIndexWhere<T>(arr: T[], pred: (t: T) => boolean): number {
+	let idx = arr.length;
+	while (idx-- > 0) {
+		if (pred(arr[idx])) {
+			return idx;
+		}
+	}
+	return -1;
+}
+/**
+ * Adds Anthropic's `cache_control: {type: "ephemeral"}` marker to a
+ * translated message.
+ *
+ * String content is rewrapped as a one-item array holding a tagged text
+ * item. Non-empty array content gets the marker on its LAST item, whatever
+ * that item's type is. Anything else is returned untouched. The input
+ * message is never mutated; a tagged copy is returned.
+ *
+ * The `any` casts are deliberate: SAP's typings have no `cache_control`
+ * field, so the marker cannot be expressed in the declared schema.
+ *
+ * @param msg - Translated chat message.
+ * @param enabled - When false the message is returned as-is.
+ * @returns The tagged copy, or `msg` itself when nothing was tagged.
+ */
+function tagCacheControl(msg: ChatMessage, enabled: boolean): ChatMessage {
+	if (!enabled) {
+		return msg;
+	}
+	const { content } = msg;
+	if (typeof content === "string") {
+		const tagged = {
+			type: "text",
+			text: content,
+			cache_control: EPHEMERAL,
+		} as any;
+		return { ...msg, content: [tagged] } as ChatMessage;
+	}
+	if (!Array.isArray(content) || content.length === 0) {
+		return msg;
+	}
+	const leading = content.slice(0, -1);
+	const finalItem = content[content.length - 1] as any;
+	return {
+		...msg,
+		content: [...leading, { ...finalItem, cache_control: EPHEMERAL }],
+	} as ChatMessage;
+}
+/**
+ * Dispatches one pi message to the translator for its role.
+ *
+ * @param msg - pi message to translate.
+ * @returns One message for "user" and "assistant"; whatever
+ *   `piToolResultToOrchestration` returns for "toolResult".
+ * @throws Error when `msg.role` is none of the three handled roles.
+ */
+function piMessageToOrchestration(msg: Message): ChatMessage[] {
+	switch (msg.role) {
+		case "user":
+			return [piUserToOrchestration(msg)];
+		case "assistant":
+			return [piAssistantToOrchestration(msg)];
+		case "toolResult":
+			return piToolResultToOrchestration(msg);
+		default:
+			// Without this branch an unexpected role yields `undefined`, and the
+			// caller's spread fails with an unhelpful "not iterable" TypeError.
+			throw new Error(
+				`Unsupported pi message role: ${String((msg as { role?: unknown }).role)}`,
+			);
+	}
+}
+/**
+ * Translates a pi user message into an orchestration user message.
+ *
+ * String content is passed through unchanged. Array content is converted
+ * item by item: text parts stay text, every other part becomes an
+ * `image_url` item carrying a base64 data URL built from `mimeType` and
+ * `data`.
+ *
+ * @param msg - pi user message.
+ * @returns The equivalent message with role "user".
+ */
+function piUserToOrchestration(msg: UserMessage): ChatMessage {
+	const { content } = msg;
+	if (typeof content === "string") {
+		return { role: "user", content };
+	}
+	const parts: UserChatMessageContentItem[] = [];
+	for (const part of content) {
+		if (part.type === "text") {
+			parts.push({ type: "text", text: part.text });
+		} else {
+			parts.push({
+				type: "image_url",
+				image_url: { url: `data:${part.mimeType};base64,${part.data}` },
+			});
+		}
+	}
+	return { role: "user", content: parts as UserChatMessageContent };
+}
+/**
+ * Translates a pi assistant message into an orchestration assistant message.
+ *
+ * Text blocks are concatenated in order; tool-call blocks become `function`
+ * tool calls whose arguments are JSON-serialised. Other block types are
+ * skipped.
+ *
+ * @param msg - pi assistant message.
+ * @returns The assistant message; `tool_calls` is set only when at least one
+ *   tool call was found.
+ */
+function piAssistantToOrchestration(msg: AssistantMessage): ChatMessage {
+	let combinedText = "";
+	const calls: NonNullable<AssistantChatMessage["tool_calls"]> = [];
+	for (const block of msg.content) {
+		switch (block.type) {
+			case "text":
+				combinedText += block.text;
+				break;
+			case "toolCall":
+				calls.push({
+					id: block.id,
+					type: "function",
+					function: {
+						name: block.name,
+						arguments: JSON.stringify(block.arguments),
+					},
+				});
+				break;
+		}
+	}
+	// Bedrock (which SAP orchestration wraps) refuses an assistant message
+	// that carries no text AND no tool_calls ("Assistant message has neither
+	// text nor tool_use blocks."). Pi can produce one after an interrupted
+	// stream, or when the turn held only block types that are not translated
+	// here (e.g. reasoning-only). A lone space makes the message validate
+	// while keeping the conversation aligned 1:1 with pi's log.
+	let content: string;
+	if (combinedText) {
+		content = combinedText;
+	} else if (calls.length === 0) {
+		content = " ";
+	} else {
+		content = "";
+	}
+	const assistant: AssistantChatMessage = { role: "assistant", content };
+	if (calls.length > 0) {
+		assistant.tool_calls = calls;
+	}
+	return assistant;
+}
+/**
+ * Translates a pi tool result into orchestration messages.
+ *
+ * The text parts are joined with newlines into a single `tool` message.
+ * SAP's ToolChatMessage.content schema is text-only (`string |
+ * TextContent[]`), so image parts (most commonly from pi's `read` tool on an
+ * image file) would otherwise be lost. They are returned in an additional
+ * synthetic user message placed after the tool message so vision-capable
+ * models can see them.
+ *
+ * @param msg - pi tool result message.
+ * @returns `[toolMessage]`, or `[toolMessage, imageMessage]` when the result
+ *   contains at least one image.
+ */
+function piToolResultToOrchestration(msg: ToolResultMessage): ChatMessage[] {
+	const textChunks: string[] = [];
+	const imageParts: UserChatMessageContentItem[] = [];
+	for (const part of msg.content) {
+		if (part.type === "text") {
+			textChunks.push(part.text);
+		} else if (part.type === "image") {
+			imageParts.push({
+				type: "image_url",
+				image_url: { url: `data:${part.mimeType};base64,${part.data}` },
+			});
+		}
+	}
+	const toolMessage: ChatMessage = {
+		role: "tool",
+		tool_call_id: msg.toolCallId,
+		content: textChunks.join("\n"),
+	};
+	if (imageParts.length === 0) {
+		return [toolMessage];
+	}
+	const imageMessage: ChatMessage = {
+		role: "user",
+		content: imageParts as UserChatMessageContent,
+	};
+	return [toolMessage, imageMessage];
+}
+/**
+ * Wraps a pi tool definition as an orchestration `function` tool.
+ *
+ * @param tool - pi tool whose name, description and parameters are copied.
+ * @returns The tool in orchestration shape.
+ */
+function piToolToOrchestration(tool: Tool): ChatCompletionTool {
+	const { name, description } = tool;
+	// The parameter schema is passed through untouched; only its static type
+	// is widened to the record type the SDK expects.
+	const parameters = tool.parameters as unknown as Record<string, unknown>;
+	return {
+		type: "function",
+		function: { name, description, parameters },
+	};
+}
+/**
+ * Maps a finish reason string onto one of three stop reasons.
+ *
+ * @param reason - Finish reason string; may be undefined.
+ * @returns "length" for "length"; "toolUse" for "tool_calls" or
+ *   "function_call"; "stop" for everything else, including undefined.
+ */
+export function mapFinishReason(
+	reason: string | undefined,
+): "stop" | "length" | "toolUse" {
+	if (reason === "length") {
+		return "length";
+	}
+	if (reason === "tool_calls" || reason === "function_call") {
+		return "toolUse";
+	}
+	return "stop";
+}

package/tsconfig.json ADDED Viewed

@@ -0,0 +1,16 @@
+{
+  "compilerOptions": {
+    "target": "ES2022",
+    "module": "ESNext",
+    "moduleResolution": "Bundler",
+    "strict": true,
+    "esModuleInterop": true,
+    "skipLibCheck": true,
+    "resolveJsonModule": true,
+    "noEmit": true,
+    "isolatedModules": true,
+    "allowImportingTsExtensions": true,
+    "verbatimModuleSyntax": true
+  },
+  "include": ["index.ts", "src/**/*.ts"]
+}