npm - opencode-qwen-cli-auth - Versions diffs - 2.2.6 → 2.2.8 - Mend

opencode-qwen-cli-auth 2.2.6 → 2.2.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (2)

package/dist/index.js +99 -29
package/package.json +1 -1

package/dist/index.js CHANGED

@@ -15,10 +15,13 @@ import { PROVIDER_ID, AUTH_LABELS, DEVICE_FLOW, PORTAL_HEADERS } from "./lib/con
 import { logError, logInfo, logWarn, LOGGING_ENABLED } from "./lib/logger.js";
 const CHAT_REQUEST_TIMEOUT_MS = 30000;
 const CHAT_MAX_RETRIES = 0;
+const CHAT_MAX_TOKENS_CAP = 2048;
+const CHAT_DEFAULT_MAX_TOKENS = 2048;
 const MAX_CONSECUTIVE_POLL_FAILURES = 3;
 const QUOTA_DEGRADE_MAX_TOKENS = 1024;
 const CLI_FALLBACK_TIMEOUT_MS = 8000;
 const CLI_FALLBACK_MAX_BUFFER_CHARS = 1024 * 1024;
+const ENABLE_CLI_FALLBACK = process.env.OPENCODE_QWEN_ENABLE_CLI_FALLBACK === "1";
 const PLUGIN_USER_AGENT = "opencode-qwen-cli-auth/2.2.1";
 const CLIENT_ONLY_BODY_FIELDS = new Set([
     "providerID",
@@ -97,6 +100,34 @@ function appendLimitedText(current, chunk) {
     }
     return next.slice(next.length - CLI_FALLBACK_MAX_BUFFER_CHARS);
 }
+function isRequestInstance(value) {
+    return typeof Request !== "undefined" && value instanceof Request;
+}
+async function normalizeFetchInvocation(input, init) {
+    const requestInit = init ? { ...init } : {};
+    let requestInput = input;
+    if (!isRequestInstance(input)) {
+        return { requestInput, requestInit };
+    }
+    requestInput = input.url;
+    if (!requestInit.method) {
+        requestInit.method = input.method;
+    }
+    if (!requestInit.headers) {
+        requestInit.headers = new Headers(input.headers);
+    }
+    if (requestInit.body === undefined) {
+        try {
+            requestInit.body = await input.clone().text();
+        }
+        catch (_error) {
+        }
+    }
+    if (!requestInit.signal) {
+        requestInit.signal = input.signal;
+    }
+    return { requestInput, requestInit };
+}
 function getHeaderValue(headers, headerName) {
     if (!headers) {
         return undefined;
@@ -178,6 +209,14 @@ function sanitizeOutgoingPayload(payload) {
         delete sanitized.stream_options;
         changed = true;
     }
+    if (typeof sanitized.max_tokens === "number" && sanitized.max_tokens > CHAT_MAX_TOKENS_CAP) {
+        sanitized.max_tokens = CHAT_MAX_TOKENS_CAP;
+        changed = true;
+    }
+    if (typeof sanitized.max_completion_tokens === "number" && sanitized.max_completion_tokens > CHAT_MAX_TOKENS_CAP) {
+        sanitized.max_completion_tokens = CHAT_MAX_TOKENS_CAP;
+        changed = true;
+    }
     return changed ? sanitized : payload;
 }
 function createQuotaDegradedPayload(payload) {
@@ -543,7 +582,9 @@ async function sendWithTimeout(input, requestInit) {
     }
 }
 async function failFastFetch(input, init) {
-    const requestInit = init ? { ...init } : {};
+    const normalized = await normalizeFetchInvocation(input, init);
+    const requestInput = normalized.requestInput;
+    const requestInit = normalized.requestInit;
     const sourceSignal = requestInit.signal;
     const rawPayload = parseJsonRequestBody(requestInit);
     const sessionID = typeof rawPayload?.sessionID === "string" ? rawPayload.sessionID : undefined;
@@ -565,10 +606,14 @@ async function failFastFetch(input, init) {
             request_id: context.requestId,
             sessionID: context.sessionID,
             modelID: context.modelID,
+            max_tokens: typeof payload?.max_tokens === "number" ? payload.max_tokens : undefined,
+            max_completion_tokens: typeof payload?.max_completion_tokens === "number" ? payload.max_completion_tokens : undefined,
+            message_count: Array.isArray(payload?.messages) ? payload.messages.length : undefined,
+            stream: payload?.stream === true,
         });
     }
     try {
-        let response = await sendWithTimeout(input, requestInit);
+        let response = await sendWithTimeout(requestInput, requestInit);
         if (LOGGING_ENABLED) {
             logInfo("Qwen request response", {
                 request_id: context.requestId,
@@ -593,7 +638,7 @@ async function failFastFetch(input, init) {
                             attempt: 2,
                         });
                     }
-                    response = await sendWithTimeout(input, fallbackInit);
+                    response = await sendWithTimeout(requestInput, fallbackInit);
                     if (LOGGING_ENABLED) {
                         logInfo("Qwen request response", {
                             request_id: context.requestId,
@@ -607,6 +652,27 @@ async function failFastFetch(input, init) {
                         return response;
                     }
                     const fallbackBody = await response.text().catch(() => "");
+                    if (ENABLE_CLI_FALLBACK) {
+                        const cliFallback = await runQwenCliFallback(payload, context, sourceSignal);
+                        if (cliFallback.ok) {
+                            return cliFallback.response;
+                        }
+                        if (cliFallback.reason === "cli_aborted") {
+                            return makeFailFastErrorResponse(400, "request_aborted", "Qwen request was aborted");
+                        }
+                        if (LOGGING_ENABLED) {
+                            logWarn("Qwen CLI fallback failed", {
+                                request_id: context.requestId,
+                                sessionID: context.sessionID,
+                                modelID: context.modelID,
+                                reason: cliFallback.reason,
+                                stderr: cliFallback.stderr,
+                            });
+                        }
+                    }
+                    return makeQuotaFailFastResponse(fallbackBody, response.headers, context);
+                }
+                if (ENABLE_CLI_FALLBACK) {
                     const cliFallback = await runQwenCliFallback(payload, context, sourceSignal);
                     if (cliFallback.ok) {
                         return cliFallback.response;
@@ -623,23 +689,6 @@ async function failFastFetch(input, init) {
                             stderr: cliFallback.stderr,
                         });
                     }
-                    return makeQuotaFailFastResponse(fallbackBody, response.headers, context);
-                }
-                const cliFallback = await runQwenCliFallback(payload, context, sourceSignal);
-                if (cliFallback.ok) {
-                    return cliFallback.response;
-                }
-                if (cliFallback.reason === "cli_aborted") {
-                    return makeFailFastErrorResponse(400, "request_aborted", "Qwen request was aborted");
-                }
-                if (LOGGING_ENABLED) {
-                    logWarn("Qwen CLI fallback failed", {
-                        request_id: context.requestId,
-                        sessionID: context.sessionID,
-                        modelID: context.modelID,
-                        reason: cliFallback.reason,
-                        stderr: cliFallback.stderr,
-                    });
                 }
             }
             return makeQuotaFailFastResponse(firstBody, response.headers, context);
@@ -872,21 +921,21 @@ export const QwenAuthPlugin = async (_input) => {
                     maxRetries: CHAT_MAX_RETRIES,
                 },
                 models: {
-                    "coder-model": {
-                        id: "coder-model",
-                        name: "Qwen Coder (Qwen 3.5 Plus)",
+                    "coder-model": {
+                        id: "coder-model",
+                        name: "Qwen Coder (Qwen 3.5 Plus)",
                         // Qwen does not support reasoning_effort from OpenCode UI
                         // Thinking is always enabled by default on server side (qwen3.5-plus)
                         reasoning: false,
-                        limit: { context: 1048576, output: 65536 },
+                        limit: { context: 1048576, output: CHAT_MAX_TOKENS_CAP },
                         cost: { input: 0, output: 0 },
                         modalities: { input: ["text"], output: ["text"] },
                     },
-                    "vision-model": {
-                        id: "vision-model",
-                        name: "Qwen VL Plus (vision)",
-                        reasoning: false,
-                        limit: { context: 131072, output: 8192 },
+                    "vision-model": {
+                        id: "vision-model",
+                        name: "Qwen VL Plus (vision)",
+                        reasoning: false,
+                        limit: { context: 131072, output: CHAT_MAX_TOKENS_CAP },
                         cost: { input: 0, output: 0 },
                         modalities: { input: ["text"], output: ["text"] },
                     },
@@ -901,12 +950,33 @@ export const QwenAuthPlugin = async (_input) => {
                 if (typeof output.options.timeout !== "number" || output.options.timeout > CHAT_REQUEST_TIMEOUT_MS) {
                     output.options.timeout = CHAT_REQUEST_TIMEOUT_MS;
                 }
+                if (typeof output.max_tokens !== "number" || output.max_tokens > CHAT_MAX_TOKENS_CAP) {
+                    output.max_tokens = CHAT_DEFAULT_MAX_TOKENS;
+                }
+                if (typeof output.max_completion_tokens !== "number" || output.max_completion_tokens > CHAT_MAX_TOKENS_CAP) {
+                    output.max_completion_tokens = CHAT_DEFAULT_MAX_TOKENS;
+                }
+                if (typeof output.maxTokens !== "number" || output.maxTokens > CHAT_MAX_TOKENS_CAP) {
+                    output.maxTokens = CHAT_DEFAULT_MAX_TOKENS;
+                }
+                if (typeof output.options.max_tokens !== "number" || output.options.max_tokens > CHAT_MAX_TOKENS_CAP) {
+                    output.options.max_tokens = CHAT_DEFAULT_MAX_TOKENS;
+                }
+                if (typeof output.options.max_completion_tokens !== "number" || output.options.max_completion_tokens > CHAT_MAX_TOKENS_CAP) {
+                    output.options.max_completion_tokens = CHAT_DEFAULT_MAX_TOKENS;
+                }
+                if (typeof output.options.maxTokens !== "number" || output.options.maxTokens > CHAT_MAX_TOKENS_CAP) {
+                    output.options.maxTokens = CHAT_DEFAULT_MAX_TOKENS;
+                }
                 if (LOGGING_ENABLED) {
                     logInfo("Applied chat.params hotfix", {
                         sessionID: input?.sessionID,
                         modelID: input?.model?.id,
                         timeout: output.options.timeout,
                         maxRetries: output.options.maxRetries,
+                        max_tokens: output.max_tokens,
+                        max_completion_tokens: output.max_completion_tokens,
+                        maxTokens: output.maxTokens,
                     });
                 }
             }

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "opencode-qwen-cli-auth",
-  "version": "2.2.6",
+  "version": "2.2.8",
   "description": "Qwen OAuth authentication plugin for opencode - use your Qwen account instead of API keys",
   "main": "./dist/index.js",
   "types": "./dist/index.d.ts",