npm - @azumag/opencode-rate-limit-fallback - Versions diffs - 1.0.18 → 1.0.20 - Mend

@azumag/opencode-rate-limit-fallback 1.0.18 → 1.0.20

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.

Files changed (2) hide show

package/dist/index.js +33 -22
package/package.json +1 -1

package/dist/index.js CHANGED Viewed

@@ -214,7 +214,7 @@ export const RateLimitFallback = async ({ client, directory }) => {
         }
         return null;
     }
-    async function handleRateLimitFallback(sessionID, currentProviderID, currentModelID) {
+    async function handleRateLimitFallback(sessionID, currentProviderID, currentModelID, skipAbort = false) {
         try {
             // Prevent duplicate fallback processing within 5 seconds
             const lastFallback = fallbackInProgress.get(sessionID);
@@ -316,35 +316,29 @@ export const RateLimitFallback = async ({ client, directory }) => {
                 parts: parts,
                 model: { providerID: nextModel.providerID, modelID: nextModel.modelID },
             };
-            // CRITICAL PATH: promptAsync BEFORE abort.
+            // promptAsync → abort: send fallback prompt first, then abort the old request
+            // This prevents the abort from killing the new fallback prompt.
             //
-            // In headless mode (opencode run), abort → promptAsync fails because:
-            //   1. abort triggers server dispose sequence
-            //   2. promptAsync is accepted and message created
-            //   3. Server starts processing (busy) but dispose interrupts it (idle)
-            //   4. server.instance.disposed — all within ~6ms
-            //
-            // By sending promptAsync FIRST, the server knows there is pending work
-            // before abort triggers the dispose check. When abort cancels the retry
-            // loop and the session goes idle, the server should process the queued
-            // prompt instead of disposing.
+            // For session.error events, the request is already in error state, so we
+            // only send promptAsync (skipAbort = true). For retry status, we send both.
             //
             // promptAsync: HTTP POST /session/{id}/prompt_async → 204 (SDK sdk.gen.js).
-            // prompt (sync): blocks until generation completes — do NOT use.
             const t0 = Date.now();
             await client.session.promptAsync({
                 path: { id: sessionID },
                 body: promptBody,
             });
-            logToFile(`promptAsync completed for session ${sessionID} (${Date.now() - t0}ms) with model ${nextModel.providerID}/${nextModel.modelID}`);
             const t1 = Date.now();
-            try {
-                await client.session.abort({ path: { id: sessionID } });
-                logToFile(`abort succeeded for session ${sessionID} (${Date.now() - t1}ms, total ${Date.now() - t0}ms)`);
-            }
-            catch (abortErr) {
-                logToFile(`abort failed (${Date.now() - t1}ms): ${abortErr}`);
+            if (!skipAbort) {
+                try {
+                    await client.session.abort({ path: { id: sessionID } });
+                    logToFile(`abort succeeded for session ${sessionID} (${Date.now() - t1}ms, total ${Date.now() - t0}ms)`);
+                }
+                catch (abortErr) {
+                    logToFile(`abort failed (${Date.now() - t1}ms): ${abortErr}`);
+                }
             }
+            logToFile(`promptAsync completed for session ${sessionID} (${Date.now() - t0}ms) with model ${nextModel.providerID}/${nextModel.modelID}`);
             // Toast is best-effort notification. The toast() function (line ~185) has
             // built-in fallback: showToast failure → app.log. After promptAsync the
             // server may already be disposing, so both showToast and app.log could fail.
@@ -406,7 +400,7 @@ export const RateLimitFallback = async ({ client, directory }) => {
                     catch {
                         console.log("[rate-limit-fallback] Rate limit error detected, attempting fallback");
                     }
-                    await handleRateLimitFallback(sessionID, "", "");
+                    await handleRateLimitFallback(sessionID, "", "", true); // skipAbort = true (already in error state)
                 }
             }
             if (event.type === "message.updated") {
@@ -445,7 +439,7 @@ export const RateLimitFallback = async ({ client, directory }) => {
                     catch {
                         console.log("[rate-limit-fallback] Rate limit error in message, attempting fallback");
                     }
-                    await handleRateLimitFallback(info.sessionID, info.providerID || "", info.modelID || "");
+                    await handleRateLimitFallback(info.sessionID, info.providerID || "", info.modelID || "", true); // skipAbort = true (already in error state)
                 }
             }
             if (event.type === "session.status") {
@@ -464,6 +458,23 @@ export const RateLimitFallback = async ({ client, directory }) => {
                 catch {
                     console.log("[rate-limit-fallback] session.status:", status);
                 }
+                if (status?.type === "interrupted") {
+                    // Handle interrupted session - resend prompt with fallback model (skip abort)
+                    logToFile("Session interrupted, attempting to resend prompt");
+                    try {
+                        await client.app.log({
+                            body: {
+                                service: "rate-limit-fallback",
+                                level: "info",
+                                message: "Session interrupted, attempting to resend prompt",
+                            },
+                        });
+                    }
+                    catch {
+                        console.log("[rate-limit-fallback] Session interrupted, attempting to resend prompt");
+                    }
+                    await handleRateLimitFallback(props.sessionID, "", "", true); // skipAbort = true
+                }
                 if (status?.type === "retry" && status?.message) {
                     const message = status.message.toLowerCase();
                     const isRateLimitRetry = message.includes("usage limit") ||

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@azumag/opencode-rate-limit-fallback",
-  "version": "1.0.18",
+  "version": "1.0.20",
   "description": "OpenCode plugin that automatically switches to fallback models when rate limited",
   "type": "module",
   "main": "./dist/index.js",