npm - ai - Versions diffs - 5.0.0-beta.19 → 5.0.0-beta.20 - Mend

ai 5.0.0-beta.19 → 5.0.0-beta.20

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13)

package/CHANGELOG.md +8 -0
package/dist/bin/ai.js +32 -3
package/dist/bin/ai.js.map +1 -1
package/dist/bin/ai.min.js +4 -4
package/dist/index.js +32 -3
package/dist/index.js.map +1 -1
package/dist/index.mjs +32 -3
package/dist/index.mjs.map +1 -1
package/dist/internal/index.js +32 -3
package/dist/internal/index.js.map +1 -1
package/dist/internal/index.mjs +32 -3
package/dist/internal/index.mjs.map +1 -1
package/package.json +5 -5

package/CHANGELOG.md CHANGED

@@ -1,5 +1,13 @@
 # ai
+## 5.0.0-beta.20
+### Patch Changes
+- 4c8f834: feat: automatically respect rate limit headers in retry logic
+  Added automatic support for respecting rate limit headers (`retry-after-ms` and `retry-after`) in the SDK's retry logic. When these headers are present and contain reasonable values (0-60 seconds), the retry mechanism will use the server-specified delay instead of exponential backoff. This matches the behavior of Anthropic and OpenAI client SDKs and improves rate limit handling without requiring any API changes.
 ## 5.0.0-beta.19
 ### Patch Changes

package/dist/bin/ai.js CHANGED

@@ -1349,7 +1349,33 @@ var RetryError = class extends import_provider3.AISDKError {
 _a3 = symbol3;
 // src/util/retry-with-exponential-backoff.ts
-var retryWithExponentialBackoff = ({
+function getRetryDelay(error, exponentialBackoffDelay) {
+  const headers = error.responseHeaders;
+  if (!headers)
+    return exponentialBackoffDelay;
+  let timeoutMillis;
+  const retryAfterMs = headers["retry-after-ms"];
+  if (retryAfterMs) {
+    const timeoutMs = parseFloat(retryAfterMs);
+    if (!Number.isNaN(timeoutMs)) {
+      timeoutMillis = timeoutMs;
+    }
+  }
+  const retryAfter = headers["retry-after"];
+  if (retryAfter && timeoutMillis === void 0) {
+    const timeoutSeconds = parseFloat(retryAfter);
+    if (!Number.isNaN(timeoutSeconds)) {
+      timeoutMillis = timeoutSeconds * 1e3;
+    } else {
+      timeoutMillis = Date.parse(retryAfter) - Date.now();
+    }
+  }
+  if (timeoutMillis !== void 0 && 0 <= timeoutMillis && timeoutMillis < 60 * 1e3) {
+    return timeoutMillis;
+  }
+  return exponentialBackoffDelay;
+}
+var retryWithExponentialBackoffRespectingRetryHeaders = ({
   maxRetries = 2,
   initialDelayInMs = 2e3,
   backoffFactor = 2
@@ -1383,7 +1409,8 @@ async function _retryWithExponentialBackoff(f, {
       });
     }
     if (error instanceof Error && import_provider4.APICallError.isInstance(error) && error.isRetryable === true && tryNumber <= maxRetries) {
-      await (0, import_provider_utils3.delay)(delayInMs);
+      const actualDelay = getRetryDelay(error, delayInMs);
+      await (0, import_provider_utils3.delay)(actualDelay);
       return _retryWithExponentialBackoff(
         f,
         { maxRetries, delayInMs: backoffFactor * delayInMs, backoffFactor },
@@ -1424,7 +1451,9 @@ function prepareRetries({
   const maxRetriesResult = maxRetries != null ? maxRetries : 2;
   return {
     maxRetries: maxRetriesResult,
-    retry: retryWithExponentialBackoff({ maxRetries: maxRetriesResult })
+    retry: retryWithExponentialBackoffRespectingRetryHeaders({
+      maxRetries: maxRetriesResult
+    })
   };
 }