npm - @wrongstack/providers - Versions diffs - 0.267.0 → 0.268.0 - Mend

@wrongstack/providers 0.267.0 → 0.268.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (4)

package/dist/index.d.ts (changed)

@@ -93,7 +93,7 @@ declare abstract class WireAdapter implements Provider {
     /** Map Request fields to the wire request body. */
     protected abstract buildBody(req: Request): Record<string, unknown>;
     /** Translate wire SSE events into canonical StreamEvent[]. */
-    protected abstract parseStream(body: ReadableStream<Uint8Array> | NodeJS.ReadableStream | null, fallbackModel: string): AsyncIterable<StreamEvent>;
+    protected abstract parseStream(body: ReadableStream<Uint8Array> | NodeJS.ReadableStream | null, fallbackModel: string, req: Request): AsyncIterable<StreamEvent>;
     /** Build a ProviderError from an HTTP failure response. */
     protected translateError(status: number, body: string): ProviderError;
 }
@@ -115,7 +115,7 @@ declare class AnthropicProvider extends WireAdapter {
     protected buildUrl(_req: Request): string;
     protected buildHeaders(req: Request): Record<string, string>;
     protected buildBody(req: Request): Record<string, unknown>;
-    protected parseStream(body: Parameters<typeof parseSSE>[0], fallbackModel: string): AsyncIterable<StreamEvent>;
+    protected parseStream(body: Parameters<typeof parseSSE>[0], fallbackModel: string, req: Request): AsyncIterable<StreamEvent>;
     protected translateError(status: number, text: string): ProviderError;
     private normalizeMessage;
 }
@@ -197,6 +197,7 @@ interface OpenAIProviderOptions {
     quirks?: ConvertOptions & {
         parallelToolsDisabled?: boolean | undefined;
         jsonArgumentsBuggy?: boolean | undefined;
+        thinkingParam?: 'zai-glm' | 'kimi-toggle' | 'always-on' | undefined;
     } | undefined;
     id?: string | undefined;
     capabilities?: Partial<Capabilities> | undefined;
@@ -231,6 +232,7 @@ interface CompatibilityQuirks {
     parallelToolsDisabled?: boolean | undefined;
     jsonArgumentsBuggy?: boolean | undefined;
     emptyToolCallContent?: 'null' | 'empty_string' | undefined;
+    thinkingParam?: 'zai-glm' | 'kimi-toggle' | 'always-on' | undefined;
 }
 interface OpenAICompatibleOptions {
     id: string;
@@ -260,6 +262,7 @@ declare class OpenAICompatibleProvider extends OpenAIProvider {
      * OpenAI's newer `max_completion_tokens`. Keep the legacy field here. See #10.
      */
     protected tokenLimitParam(): string;
+    protected buildBody(req: Request): Record<string, unknown>;
     protected buildHeaders(req: Request): Record<string, string>;
 }

package/dist/index.js (changed)

@@ -271,6 +271,13 @@ var init_aggregate = __esm({
 // src/anthropic.ts
 init_tool_input();
+// src/object-utils.ts
+function isPlainObject(value) {
+  return typeof value === "object" && value !== null && !Array.isArray(value);
+}
+// src/error-parse.ts
 function parseProviderHttpError(providerId, status, rawText) {
   const body = parseBody(rawText);
   const retryable = isRetryable(status, body.type);
@@ -288,9 +295,9 @@ function parseBody(rawText) {
   } catch {
     return body;
   }
-  if (!isRecord(parsed)) return body;
+  if (!isPlainObject(parsed)) return body;
   const errField = parsed["error"];
-  if (isRecord(errField)) {
+  if (isPlainObject(errField)) {
     const t = stringOf(errField["type"]) ?? stringOf(errField["status"]);
     const m = stringOf(errField["message"]);
     if (t) body.type = t;
@@ -317,9 +324,6 @@ function isRetryable(status, type) {
   if (type === "overloaded_error" || type === "rate_limit_error") return true;
   return false;
 }
-function isRecord(v) {
-  return typeof v === "object" && v !== null && !Array.isArray(v);
-}
 function stringOf(v) {
   return typeof v === "string" && v.length > 0 ? v : void 0;
 }
@@ -719,7 +723,7 @@ var WireAdapter = class {
     if (this.streamHangTimeoutMs > 0) {
       sseBody = this.wrapWithHangDetection(sseBody, req.model);
     }
-    yield* this.parseStream(sseBody, req.model);
+    yield* this.parseStream(sseBody, req.model, req);
   }
   /**
    * Wrap a readable stream body to log a compact status line per incoming
@@ -891,7 +895,12 @@ var AnthropicProvider = class extends WireAdapter {
       messages: req.messages.map((m) => this.normalizeMessage(m)),
       stream: true
     };
-    if (req.system && req.system.length > 0) body["system"] = req.system;
+    if (req.system && req.system.length > 0) {
+      const systemBlocks = req.system;
+      body["system"] = systemBlocks.map(
+        (b, index) => req.cache?.ttl && index === systemBlocks.length - 1 ? { ...b, cache_control: { type: "ephemeral", ttl: req.cache.ttl } } : b
+      );
+    }
     if (req.tools && req.tools.length > 0) body["tools"] = toolsToAnthropic(req.tools);
     if (req.temperature !== void 0) body["temperature"] = req.temperature;
     if (req.topP !== void 0) body["top_p"] = req.topP;
@@ -899,8 +908,8 @@ var AnthropicProvider = class extends WireAdapter {
     if (req.toolChoice) body["tool_choice"] = req.toolChoice;
     return body;
   }
-  parseStream(body, fallbackModel) {
-    return parseAnthropicStream(body, fallbackModel);
+  parseStream(body, fallbackModel, req) {
+    return parseAnthropicStream(body, fallbackModel, req.cache?.ttl);
   }
   translateError(status, text) {
     return parseProviderHttpError(this.id, status, text);
@@ -934,7 +943,7 @@ function sanitizeAnthropicBlock(b) {
       return b;
   }
 }
-async function* parseAnthropicStream(body, fallbackModel) {
+async function* parseAnthropicStream(body, fallbackModel, cacheTtl) {
   const blocks = /* @__PURE__ */ new Map();
   let model = fallbackModel;
   let usage = { input: 0, output: 0 };
@@ -951,11 +960,14 @@ async function* parseAnthropicStream(body, fallbackModel) {
       case "message_start": {
         const message = ev["message"];
         if (message?.model) model = message.model;
+        const cacheWrite = message?.usage?.cache_creation_input_tokens;
         usage = {
           input: message?.usage?.input_tokens ?? 0,
           output: 0,
           cacheRead: message?.usage?.cache_read_input_tokens,
-          cacheWrite: message?.usage?.cache_creation_input_tokens
+          cacheWrite,
+          cacheWrite5m: cacheTtl === "1h" ? void 0 : cacheWrite,
+          cacheWrite1h: cacheTtl === "1h" ? cacheWrite : void 0
         };
         if (!started) {
           started = true;
@@ -2181,7 +2193,8 @@ var VALID_QUIRK_KEYS = /* @__PURE__ */ new Set([
   "preserveToolCallIds",
   "parallelToolsDisabled",
   "jsonArgumentsBuggy",
-  "emptyToolCallContent"
+  "emptyToolCallContent",
+  "thinkingParam"
 ]);
 function isCompatibilityQuirks(value) {
   if (value === void 0) return true;
@@ -2191,6 +2204,8 @@ function isCompatibilityQuirks(value) {
     if (!VALID_QUIRK_KEYS.has(key)) return false;
     if (key === "emptyToolCallContent") {
       if (v !== "null" && v !== "empty_string") return false;
+    } else if (key === "thinkingParam") {
+      if (v !== "zai-glm" && v !== "kimi-toggle" && v !== "always-on") return false;
     } else if (typeof v !== "boolean") {
       return false;
     }
@@ -2231,6 +2246,11 @@ var OpenAICompatibleProvider = class extends OpenAIProvider {
   tokenLimitParam() {
     return "max_tokens";
   }
+  buildBody(req) {
+    const body = super.buildBody(req);
+    applyThinkingParams(body, req, this.opts.quirks?.thinkingParam);
+    return body;
+  }
   buildHeaders(req) {
     return {
       ...super.buildHeaders(req),
@@ -2238,6 +2258,36 @@ var OpenAICompatibleProvider = class extends OpenAIProvider {
     };
   }
 };
+function applyThinkingParams(body, req, mode) {
+  if (!mode || !req.reasoning) return;
+  if (mode === "always-on") {
+    return;
+  }
+  if (req.reasoning.enabled === false) {
+    body["thinking"] = { type: "disabled" };
+    return;
+  }
+  if (mode === "kimi-toggle" && req.reasoning.enabled === true) {
+    body["thinking"] = { type: "enabled" };
+  }
+  if (mode === "zai-glm" && req.reasoning.effort) {
+    body["reasoning_effort"] = mapZaiReasoningEffort(req.reasoning.effort);
+  }
+}
+function mapZaiReasoningEffort(effort) {
+  switch (effort) {
+    case "none":
+    case "minimal":
+      return "none";
+    case "low":
+    case "medium":
+      return "high";
+    case "xhigh":
+      return "max";
+    default:
+      return effort;
+  }
+}
 // src/wire-format.ts
 var WireFormatProvider = class extends WireAdapter {
@@ -3033,9 +3083,6 @@ function normalizeToolResultContent(raw, opts) {
   if (raw === void 0 || raw === null) return "";
   return JSON.stringify(raw);
 }
-function isPlainObject(v) {
-  return typeof v === "object" && v !== null && !Array.isArray(v);
-}
 function contentFromOpenAI(choice, opts = {}) {
   const out = [];
   const text = choice.message.content;