@lota-sdk/core 0.4.46 → 0.4.48

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/package.json CHANGED
@@ -1,6 +1,6 @@
 {
   "name": "@lota-sdk/core",
-  "version": "0.4.46",
+  "version": "0.4.48",
   "files": [
     "src",
     "infrastructure/schema"
@@ -32,7 +32,7 @@
     "@ai-sdk/provider": "^3.0.9",
     "@chat-adapter/slack": "^4.26.0",
     "@chat-adapter/state-ioredis": "^4.26.0",
-    "@lota-sdk/shared": "0.4.46",
+    "@lota-sdk/shared": "0.4.48",
     "@mendable/firecrawl-js": "^4.20.0",
     "@surrealdb/node": "^3.0.3",
     "ai": "^6.0.170",

@@ -1,3 +1,5 @@
+import { createHash } from 'node:crypto'
+
 import { devToolsMiddleware } from '@ai-sdk/devtools'
 import { createOpenAI } from '@ai-sdk/openai'
 import type { JSONSchema7 } from '@ai-sdk/provider'
@@ -37,6 +39,17 @@ class AiGatewayStreamAttemptTag extends Context.Service<

 const EXPECTED_GATEWAY_KEY_PREFIX = 'sk-bf-'
 const AI_GATEWAY_VIRTUAL_KEY_HEADER = 'x-bf-vk'
+const AI_GATEWAY_PASSTHROUGH_EXTRA_PARAMS_HEADER = 'x-bf-passthrough-extra-params'
+const AI_GATEWAY_SESSION_ID_HEADER = 'x-bf-session-id'
+const AI_GATEWAY_SESSION_TTL_HEADER = 'x-bf-session-ttl'
+const AZURE_OPENAI_PROMPT_CACHE_RETENTION = '24h'
+const AZURE_OPENAI_PROMPT_CACHE_SESSION_TTL = '24h'
+const AZURE_OPENAI_PROMPT_CACHE_KEY_PREFIX = 'azpc'
+const AZURE_OPENAI_PROMPT_CACHE_HASH_LENGTH = 48
+const AZURE_OPENAI_PROMPT_CACHE_MAX_STRING_LENGTH = 120_000
+const AZURE_OPENAI_PROMPT_CACHE_MAX_ARRAY_ITEMS = 80
+const AZURE_OPENAI_PROMPT_CACHE_MAX_OBJECT_KEYS = 80
+const AZURE_OPENAI_PROMPT_CACHE_MAX_DEPTH = 8
 const AI_GATEWAY_TIMEOUT_MS = 360_000
 const AI_GATEWAY_STREAM_IDLE_TIMEOUT_MS = 180_000
 const AI_GATEWAY_MAX_RETRIES = 4
@@ -512,7 +525,11 @@ export function makeAiGatewayService(
   })
 }
 const baseURL = yield* normalizeAiGatewayUrlEffect(config.aiGateway.url)
-const provider = createOpenAI({ baseURL, apiKey, headers: { [AI_GATEWAY_VIRTUAL_KEY_HEADER]: apiKey } })
+const provider = createOpenAI({
+  baseURL,
+  apiKey,
+  headers: { [AI_GATEWAY_VIRTUAL_KEY_HEADER]: apiKey, [AI_GATEWAY_PASSTHROUGH_EXTRA_PARAMS_HEADER]: 'true' },
+})

 return AiGatewayTag.of({ semaphore, provider })
 })
@@ -728,6 +745,127 @@ function isOpenRouterModel(modelId: string): boolean {
   return modelId.trim().toLowerCase().startsWith('openrouter/')
 }

+function isAzureOpenAiPromptCacheModel(modelId: string): boolean {
+  const normalized = modelId.trim().toLowerCase()
+  if (!normalized) return false
+
+  const [providerPrefix, ...modelParts] = normalized.split('/')
+  if (modelParts.length > 0) {
+    if (providerPrefix !== 'azure') return false
+    return isAzureOpenAiPromptCacheModel(modelParts.join('/'))
+  }
+
+  return (
+    normalized === 'main-gpt-model' ||
+    normalized === 'mini-gpt-model' ||
+    normalized === 'nano-gpt-model' ||
+    normalized === 'gpt-5.5' ||
+    normalized.startsWith('gpt-5.5-') ||
+    normalized === 'gpt-5.4' ||
+    normalized.startsWith('gpt-5.4-')
+  )
+}
+
+function hashAzureOpenAiPromptCacheValue(value: string): string {
+  return createHash('sha256').update(value).digest('hex').slice(0, AZURE_OPENAI_PROMPT_CACHE_HASH_LENGTH)
+}
+
+function stablePromptCacheStringify(value: unknown): string {
+  return JSON.stringify(normalizePromptCacheValue(value, 0))
+}
+
+function normalizePromptCacheValue(value: unknown, depth: number): unknown {
+  if (value === null || typeof value === 'boolean' || typeof value === 'number') return value
+  if (typeof value === 'string') {
+    return value.length > AZURE_OPENAI_PROMPT_CACHE_MAX_STRING_LENGTH
+      ? value.slice(0, AZURE_OPENAI_PROMPT_CACHE_MAX_STRING_LENGTH)
+      : value
+  }
+  if (typeof value === 'bigint') return value.toString()
+  if (value instanceof Uint8Array) {
+    return {
+      type: 'uint8array',
+      length: value.byteLength,
+      sha256: createHash('sha256').update(value).digest('hex').slice(0, AZURE_OPENAI_PROMPT_CACHE_HASH_LENGTH),
+    }
+  }
+  if (Array.isArray(value)) {
+    return value
+      .slice(0, AZURE_OPENAI_PROMPT_CACHE_MAX_ARRAY_ITEMS)
+      .map((item) => normalizePromptCacheValue(item, depth + 1))
+  }
+  if (!isRecord(value) || depth >= AZURE_OPENAI_PROMPT_CACHE_MAX_DEPTH) return null
+
+  return Object.fromEntries(
+    Object.entries(value)
+      .filter(([, item]) => item !== undefined && typeof item !== 'function' && typeof item !== 'symbol')
+      .sort(([left], [right]) => left.localeCompare(right))
+      .slice(0, AZURE_OPENAI_PROMPT_CACHE_MAX_OBJECT_KEYS)
+      .map(([key, item]) => [key, normalizePromptCacheValue(item, depth + 1)]),
+  )
+}
+
+function readExplicitOpenAiPromptCacheKey(openaiOptions: Record<string, unknown>): string | null {
+  const promptCacheKey = openaiOptions.promptCacheKey
+  return typeof promptCacheKey === 'string' && promptCacheKey.trim().length > 0 ? promptCacheKey.trim() : null
+}
+
+function buildAzureOpenAiPromptCacheKey(params: AiGatewayCallOptions, modelId: string): string {
+  const payload = {
+    version: 1,
+    model: modelId.trim().toLowerCase(),
+    prompt: params.prompt,
+    responseFormat: params.responseFormat,
+    tools: params.tools,
+  }
+  return `${AZURE_OPENAI_PROMPT_CACHE_KEY_PREFIX}_${hashAzureOpenAiPromptCacheValue(stablePromptCacheStringify(payload))}`
+}
+
+function buildAzureOpenAiPromptCacheSessionId(promptCacheKey: string): string {
+  if (promptCacheKey.startsWith(`${AZURE_OPENAI_PROMPT_CACHE_KEY_PREFIX}_`)) return promptCacheKey
+  return `${AZURE_OPENAI_PROMPT_CACHE_KEY_PREFIX}_${hashAzureOpenAiPromptCacheValue(promptCacheKey)}`
+}
+
+function withHeaderIfMissing(
+  headers: Record<string, string | undefined>,
+  name: string,
+  value: string,
+): Record<string, string | undefined> {
+  for (const key of Object.keys(headers)) {
+    if (key.toLowerCase() === name.toLowerCase()) return headers
+  }
+  return { ...headers, [name]: value }
+}
+
+export function addAzureOpenAiPromptCacheRetention(
+  params: AiGatewayCallOptions,
+  modelId?: string,
+): AiGatewayCallOptions {
+  if (!modelId || !isAzureOpenAiPromptCacheModel(modelId)) {
+    return params
+  }
+
+  const providerOptions = isRecord(params.providerOptions) ? { ...params.providerOptions } : {}
+  const openaiOptions = isRecord(providerOptions.openai) ? { ...providerOptions.openai } : {}
+  const promptCacheKey =
+    readExplicitOpenAiPromptCacheKey(openaiOptions) ?? buildAzureOpenAiPromptCacheKey(params, modelId)
+  const sessionId = buildAzureOpenAiPromptCacheSessionId(promptCacheKey)
+  const headersWithSession = withHeaderIfMissing(
+    withHeaderIfMissing({ ...params.headers }, AI_GATEWAY_SESSION_ID_HEADER, sessionId),
+    AI_GATEWAY_SESSION_TTL_HEADER,
+    AZURE_OPENAI_PROMPT_CACHE_SESSION_TTL,
+  )
+
+  return {
+    ...params,
+    headers: headersWithSession,
+    providerOptions: {
+      ...providerOptions,
+      openai: { ...openaiOptions, promptCacheKey, promptCacheRetention: AZURE_OPENAI_PROMPT_CACHE_RETENTION },
+    } as AiGatewayCallOptions['providerOptions'],
+  }
+}
+
 function mergeAbortSignals(signals: Array<AbortSignal | undefined>): { signal?: AbortSignal; cleanup: () => void } {
   const activeSignals = signals.filter((signal): signal is AbortSignal => Boolean(signal))
   if (activeSignals.length === 0) return { cleanup: () => undefined }
@@ -1106,7 +1244,9 @@ function createAiGatewayLanguageModelMiddleware(
 Promise.resolve(
   addAiGatewayReasoningRawChunks(
     normalizeAiGatewayJsonSchemas(
-      providerId === OPENAI_CHAT_PROVIDER_ID ? normalizeAiGatewayChatProviderOptions(params, modelId) : params,
+      providerId === OPENAI_CHAT_PROVIDER_ID
+        ? normalizeAiGatewayChatProviderOptions(addAzureOpenAiPromptCacheRetention(params, modelId), modelId)
+        : addAzureOpenAiPromptCacheRetention(params, modelId),
     ),
     type,
   ),

@@ -9,6 +9,7 @@ export {
   aiGatewayModel,
   aiGatewayOpenRouterResponseHealingModel,
   createAiGatewayModels,
+  addAzureOpenAiPromptCacheRetention,
   extractAiGatewayChatReasoningDeltaText,
   extractAiGatewayChatReasoningText,
   injectAiGatewayChatReasoningContent,
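
Usage sketch (not part of the published diff): this assumes the re-export above surfaces addAzureOpenAiPromptCacheRetention from the package root, and that AiGatewayCallOptions is the SDK's call-options type, of which the helper only reads prompt, tools, responseFormat, headers and providerOptions. For an Azure prompt-cache model it derives a deterministic prompt cache key and session headers; for any other model the options pass through unchanged.

import { addAzureOpenAiPromptCacheRetention } from '@lota-sdk/core'

// Hypothetical call options for illustration; the real AiGatewayCallOptions shape is defined by the SDK.
const options = {
  prompt: [{ role: 'user', content: [{ type: 'text', text: 'Summarize the release notes.' }] }],
  headers: {},
  providerOptions: {},
} as unknown as Parameters<typeof addAzureOpenAiPromptCacheRetention>[0]

// Azure prompt-cache model: adds an 'azpc_<sha256 prefix>' promptCacheKey, reuses it as the
// x-bf-session-id header (unless one is already set), and sets x-bf-session-ttl and
// providerOptions.openai.promptCacheRetention to '24h'.
const cached = addAzureOpenAiPromptCacheRetention(options, 'azure/gpt-5.5')

// Non-Azure model: returned untouched, with no cache key or session headers added.
const untouched = addAzureOpenAiPromptCacheRetention(options, 'openrouter/some-model')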