npm - @azumag/opencode-rate-limit-fallback - Versions diffs - 1.0.19 → 1.0.21 - Mend

@azumag/opencode-rate-limit-fallback 1.0.19 → 1.0.21

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (2)

package/dist/index.js +17 -14
package/package.json +1 -1

package/dist/index.js CHANGED

@@ -214,7 +214,7 @@ export const RateLimitFallback = async ({ client, directory }) => {
         }
         return null;
     }
-    async function handleRateLimitFallback(sessionID, currentProviderID, currentModelID) {
+    async function handleRateLimitFallback(sessionID, currentProviderID, currentModelID, skipAbort = false) {
         try {
             // Prevent duplicate fallback processing within 5 seconds
             const lastFallback = fallbackInProgress.get(sessionID);
@@ -316,21 +316,22 @@ export const RateLimitFallback = async ({ client, directory }) => {
                 parts: parts,
                 model: { providerID: nextModel.providerID, modelID: nextModel.modelID },
             };
-            // abort → promptAsync: works in TUI, fails in headless (server disposes)
-            // promptAsync → abort: fails in TUI (abort kills the new prompt too)
+            // abort → promptAsync: abort the old request first, then send fallback prompt
+            // This prevents the abort from killing the new fallback prompt.
             //
-            // Use abort → promptAsync as the primary path (TUI confirmed working).
-            // Headless mode (opencode run) is a known limitation — the server
-            // dispose sequence interrupts the new prompt before it can complete.
+            // For session.error events, the request is already in error state, so we
+            // only send promptAsync (skipAbort = true). For retry status, we send both.
             //
             // promptAsync: HTTP POST /session/{id}/prompt_async → 204 (SDK sdk.gen.js).
             const t0 = Date.now();
-            try {
-                await client.session.abort({ path: { id: sessionID } });
-                logToFile(`abort succeeded for session ${sessionID} (${Date.now() - t0}ms)`);
-            }
-            catch (abortErr) {
-                logToFile(`abort failed (${Date.now() - t0}ms): ${abortErr}`);
+            if (!skipAbort) {
+                try {
+                    await client.session.abort({ path: { id: sessionID } });
+                    logToFile(`abort succeeded for session ${sessionID} (${Date.now() - t0}ms)`);
+                }
+                catch (abortErr) {
+                    logToFile(`abort failed (${Date.now() - t0}ms): ${abortErr}`);
+                }
             }
             const t1 = Date.now();
             await client.session.promptAsync({
@@ -399,7 +400,7 @@ export const RateLimitFallback = async ({ client, directory }) => {
                     catch {
                         console.log("[rate-limit-fallback] Rate limit error detected, attempting fallback");
                     }
-                    await handleRateLimitFallback(sessionID, "", "");
+                    await handleRateLimitFallback(sessionID, "", "", true); // skipAbort = true (already in error state)
                 }
             }
             if (event.type === "message.updated") {
@@ -438,7 +439,7 @@ export const RateLimitFallback = async ({ client, directory }) => {
                     catch {
                         console.log("[rate-limit-fallback] Rate limit error in message, attempting fallback");
                     }
-                    await handleRateLimitFallback(info.sessionID, info.providerID || "", info.modelID || "");
+                    await handleRateLimitFallback(info.sessionID, info.providerID || "", info.modelID || "", true); // skipAbort = true (already in error state)
                 }
             }
             if (event.type === "session.status") {
@@ -457,6 +458,8 @@ export const RateLimitFallback = async ({ client, directory }) => {
                 catch {
                     console.log("[rate-limit-fallback] session.status:", status);
                 }
+                // Note: interrupted status is handled by the fallback sequence (abort → promptAsync).
+                // We don't need to handle it separately here as it would cause duplicate prompt sends.
                 if (status?.type === "retry" && status?.message) {
                     const message = status.message.toLowerCase();
                     const isRateLimitRetry = message.includes("usage limit") ||

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "@azumag/opencode-rate-limit-fallback",
-  "version": "1.0.19",
+  "version": "1.0.21",
   "description": "OpenCode plugin that automatically switches to fallback models when rate limited",
   "type": "module",
   "main": "./dist/index.js",