opencodekit 0.20.0 → 0.20.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/dist/index.js CHANGED
@@ -20,7 +20,7 @@ var __require = /* @__PURE__ */ createRequire(import.meta.url);
20
20
 
21
21
  //#endregion
22
22
  //#region package.json
23
- var version = "0.20.0";
23
+ var version = "0.20.2";
24
24
 
25
25
  //#endregion
26
26
  //#region src/utils/license.ts
@@ -24,11 +24,11 @@
24
24
  },
25
25
  // Glob patterns for files that should never be auto-pruned
26
26
  // Keep tight: broad patterns reduce DCP effectiveness
27
+ // .opencode/** and .beads/** removed — memory-* and tilth_* outputs
28
+ // already survive compression via compress.protectedTools
27
29
  "protectedFilePatterns": [
28
30
  "**/.env*",
29
31
  "**/AGENTS.md",
30
- "**/.opencode/**",
31
- "**/.beads/**",
32
32
  "**/package.json",
33
33
  "**/tsconfig.json"
34
34
  ],
@@ -43,34 +43,41 @@
43
43
  // v3.1.0: active summary tokens extend effective maxContextLimit
44
44
  "summaryBuffer": true,
45
45
  // Soft upper threshold: above this, strong compression nudges fire
46
- // Accepts number or "X%" of model context window
47
- "maxContextLimit": "80%",
46
+ // Use numeric values — percentage requires modelContextLimit from runtime
47
+ // which may be unavailable for some provider/model combos (e.g. GitHub Copilot)
48
+ // Rule: must be BELOW OpenCode emergency threshold (model_max - reserved - max_output)
49
+ // For Copilot Claude (216k ctx, 64k out, 16k reserved): emergency = 136k
50
+ // So DCP must start compressing well before 136k
51
+ "maxContextLimit": 100000,
48
52
  // Per-model override for maxContextLimit (takes priority over global)
49
- // Aligned to claude-opus-4.6 (216k context, 64k output) as primary build agent
50
53
  "modelMaxLimits": {
51
- "github-copilot/claude-opus-4.6": 192000,
52
- "github-copilot/claude-opus-4.5": 192000,
53
- "github-copilot/claude-sonnet-4.6": 192000,
54
- "github-copilot/claude-sonnet-4.5": 192000,
55
- "github-copilot/claude-sonnet-4": 192000,
56
- "github-copilot/claude-haiku-4.5": 172000,
57
- "github-copilot/gpt-5.4": 192000,
58
- "github-copilot/gpt-5.3-codex": 192000,
59
- "github-copilot/gemini-3.1-pro-preview": 192000
54
+ // Claude: 216k ctx, 64k out → emergency at 136k → DCP starts at 110k
55
+ "github-copilot/claude-opus-4.6": 110000,
56
+ "github-copilot/claude-opus-4.5": 110000,
57
+ "github-copilot/claude-sonnet-4.6": 110000,
58
+ "github-copilot/claude-sonnet-4.5": 110000,
59
+ "github-copilot/claude-sonnet-4": 110000,
60
+ // Haiku: smaller model, be more conservative
61
+ "github-copilot/claude-haiku-4.5": 90000,
62
+ // GPT/Gemini: assume similar 200k+ windows
63
+ "github-copilot/gpt-5.4": 110000,
64
+ "github-copilot/gpt-5.3-codex": 110000,
65
+ "github-copilot/gemini-3.1-pro-preview": 110000
60
66
  },
61
67
  // Soft lower threshold: below this, turn/iteration reminders are off
62
- "minContextLimit": "35%",
68
+ // Use numeric values — same reason as maxContextLimit above
69
+ "minContextLimit": 50000,
63
70
  // Per-model override for minContextLimit (takes priority over global)
64
71
  "modelMinLimits": {
65
- "github-copilot/claude-opus-4.6": "30%",
66
- "github-copilot/claude-opus-4.5": "35%",
67
- "github-copilot/claude-sonnet-4.6": "35%",
68
- "github-copilot/claude-sonnet-4.5": "35%",
69
- "github-copilot/claude-sonnet-4": "35%",
70
- "github-copilot/claude-haiku-4.5": "25%",
71
- "github-copilot/gpt-5.4": "30%",
72
- "github-copilot/gpt-5.3-codex": "30%",
73
- "github-copilot/gemini-3.1-pro-preview": "30%"
72
+ "github-copilot/claude-opus-4.6": 65000,
73
+ "github-copilot/claude-opus-4.5": 65000,
74
+ "github-copilot/claude-sonnet-4.6": 65000,
75
+ "github-copilot/claude-sonnet-4.5": 65000,
76
+ "github-copilot/claude-sonnet-4": 65000,
77
+ "github-copilot/claude-haiku-4.5": 50000,
78
+ "github-copilot/gpt-5.4": 65000,
79
+ "github-copilot/gpt-5.3-codex": 65000,
80
+ "github-copilot/gemini-3.1-pro-preview": 65000
74
81
  },
75
82
  // How often context-limit nudge fires above maxContextLimit (1 = every fetch)
76
83
  "nudgeFrequency": 5,
Binary file
@@ -175,7 +175,7 @@
175
175
  "output": 32000
176
176
  },
177
177
  "options": {
178
- "thinking_budget": 10000,
178
+ "thinking_budget": 24000,
179
179
  "type": "enabled"
180
180
  },
181
181
  "reasoning": true,
@@ -229,7 +229,7 @@
229
229
  },
230
230
  "options": {
231
231
  "thinking": {
232
- "budget_tokens": 16000,
232
+ "budget_tokens": 24000,
233
233
  "type": "enabled"
234
234
  }
235
235
  },
@@ -324,7 +324,7 @@
324
324
  },
325
325
  "options": {
326
326
  "thinking": {
327
- "budget_tokens": 16000,
327
+ "budget_tokens": 24000,
328
328
  "type": "enabled"
329
329
  }
330
330
  },
@@ -1674,6 +1674,6 @@
1674
1674
  ]
1675
1675
  },
1676
1676
  "compaction": {
1677
- "reserved": 128000
1677
+ "reserved": 16000
1678
1678
  }
1679
1679
  }
@@ -12,7 +12,7 @@
12
12
  },
13
13
  "dependencies": {
14
14
  "@google/stitch-sdk": "^0.0.3",
15
- "@opencode-ai/plugin": "1.3.13"
15
+ "@opencode-ai/plugin": "1.3.17"
16
16
  },
17
17
  "devDependencies": {
18
18
  "@types/node": "^25.3.0",
@@ -94,6 +94,51 @@ function getUrls(domain: string) {
94
94
 
95
95
  const sleep = (ms: number) => new Promise((resolve) => setTimeout(resolve, ms));
96
96
 
97
+ function getRequestUrl(input: RequestInfo | URL): string {
98
+ if (typeof input === "string") return input;
99
+ if (input instanceof URL) return input.toString();
100
+ if (typeof Request !== "undefined" && input instanceof Request) {
101
+ return input.url;
102
+ }
103
+ return input.toString();
104
+ }
105
+
106
+ function extractClaudeThinkingBudget(body: any): number | undefined {
107
+ const candidates = [body?.thinking_budget, body?.thinking?.budget_tokens];
108
+
109
+ for (const candidate of candidates) {
110
+ if (typeof candidate === "number" && Number.isFinite(candidate)) {
111
+ const normalized = Math.trunc(candidate);
112
+ if (normalized > 0) return normalized;
113
+ }
114
+ }
115
+
116
+ return undefined;
117
+ }
118
+
119
+ function getErrorMessage(error: unknown): string {
120
+ if (error instanceof Error) return error.message;
121
+ if (typeof error === "string") return error;
122
+ try {
123
+ return JSON.stringify(error);
124
+ } catch {
125
+ return String(error);
126
+ }
127
+ }
128
+
129
+ function isTransientUpstreamTimeoutError(error: unknown): boolean {
130
+ const message = getErrorMessage(error).toLowerCase();
131
+ return (
132
+ message.includes("upstream idle timeout") ||
133
+ message.includes("mid_stream") ||
134
+ message.includes("sse read timed out") ||
135
+ message.includes("socket connection was closed unexpectedly") ||
136
+ message.includes("connection reset") ||
137
+ message.includes("econnreset") ||
138
+ message.includes("etimedout")
139
+ );
140
+ }
141
+
97
142
  // Rate limit handling configuration
98
143
  const RATE_LIMIT_CONFIG = {
99
144
  maxDelayMs: 60000, // Cap at 60 seconds
@@ -553,7 +598,7 @@ export const CopilotAuthPlugin: Plugin = async ({ client: sdk }) => {
553
598
  ? JSON.parse(init.body)
554
599
  : init?.body;
555
600
 
556
- const url = input.toString();
601
+ const url = getRequestUrl(input);
557
602
 
558
603
  // Check if this is a Claude model request
559
604
  const modelId = body?.model || "";
@@ -574,18 +619,34 @@ export const CopilotAuthPlugin: Plugin = async ({ client: sdk }) => {
574
619
  // For Claude models, add thinking_budget to enable reasoning
575
620
  // The Copilot API accepts this parameter and returns reasoning_text/reasoning_opaque
576
621
  if (isClaudeModel) {
577
- // Use configured thinking_budget from model options, or default to 10000
578
- const thinkingBudget = body.thinking_budget || 10000;
579
-
580
- // Fix for "Invalid signature in thinking block" error:
581
- // The Copilot API uses reasoning_text/reasoning_opaque format for thinking
582
- // When these are passed back without proper signature, it causes errors
583
- // Solution: Ensure reasoning_opaque is present when reasoning_text exists,
584
- // or remove reasoning content entirely if signature is invalid/missing
622
+ const thinkingBudget = extractClaudeThinkingBudget(body);
623
+ const isThinkingEnabled = thinkingBudget != null;
624
+
585
625
  const cleanedMessages = body.messages.map(
586
626
  (msg: any, idx: number) => {
587
627
  if (msg.role !== "assistant") return msg;
588
628
 
629
+ // If thinking is disabled, strip all reasoning metadata to prevent
630
+ // stale reasoning context from continuing across turns.
631
+ if (!isThinkingEnabled) {
632
+ const {
633
+ reasoning_text: _reasoningText,
634
+ reasoning_opaque: _reasoningOpaque,
635
+ ...baseMsg
636
+ } = msg;
637
+ if (!Array.isArray(baseMsg.content)) return baseMsg;
638
+
639
+ const cleanedContent = baseMsg.content.filter(
640
+ (part: any) => part.type !== "thinking",
641
+ );
642
+
643
+ return {
644
+ ...baseMsg,
645
+ content:
646
+ cleanedContent.length > 0 ? cleanedContent : null,
647
+ };
648
+ }
649
+
589
650
  // Log message structure for debugging
590
651
  log("debug", `Processing assistant message ${idx}`, {
591
652
  has_reasoning_text: !!msg.reasoning_text,
@@ -605,11 +666,6 @@ export const CopilotAuthPlugin: Plugin = async ({ client: sdk }) => {
605
666
  }
606
667
 
607
668
  // If content is an array, strip ALL thinking blocks.
608
- // Reasoning is communicated via reasoning_text/reasoning_opaque
609
- // fields, not via thinking blocks in the content array.
610
- // Even thinking blocks WITH signatures can cause
611
- // "Invalid signature in thinking block" errors when
612
- // signatures are expired or from a different context.
613
669
  if (Array.isArray(msg.content)) {
614
670
  const hasThinkingBlock = msg.content.some(
615
671
  (part: any) => part.type === "thinking",
@@ -634,15 +690,31 @@ export const CopilotAuthPlugin: Plugin = async ({ client: sdk }) => {
634
690
  },
635
691
  );
636
692
 
637
- modifiedBody = {
638
- ...body,
693
+ const nextBody: Record<string, any> = {
694
+ ...(modifiedBody || body),
639
695
  messages: cleanedMessages,
640
- thinking_budget: thinkingBudget,
641
696
  };
642
- log("info", `Adding thinking_budget for Claude model`, {
643
- model: modelId,
644
- thinking_budget: thinkingBudget,
645
- });
697
+
698
+ if (isThinkingEnabled) {
699
+ nextBody.thinking_budget = thinkingBudget;
700
+ log("info", `Adding thinking_budget for Claude model`, {
701
+ model: modelId,
702
+ thinking_budget: thinkingBudget,
703
+ });
704
+ } else {
705
+ delete nextBody.thinking_budget;
706
+ log(
707
+ "info",
708
+ `Claude thinking disabled for this request (no thinking budget set)`,
709
+ { model: modelId },
710
+ );
711
+ }
712
+
713
+ // Copilot OpenAI-compatible endpoint expects `thinking_budget`.
714
+ // Remove Anthropic-style `thinking` object to avoid mixed payloads.
715
+ delete nextBody.thinking;
716
+
717
+ modifiedBody = nextBody;
646
718
  }
647
719
 
648
720
  // For GPT models (o1, gpt-5, etc.), add reasoning parameter
@@ -839,46 +911,82 @@ export const CopilotAuthPlugin: Plugin = async ({ client: sdk }) => {
839
911
  }
840
912
  }
841
913
 
842
- try {
843
- if (currentModel) {
844
- await shapeRequestForModel(currentModel);
845
- }
846
- const response = await fetch(input, activeFinalInit);
914
+ const maxFetchAttempts = 2;
847
915
 
848
- if (response.status === 429) {
849
- try {
850
- await response.body?.cancel();
851
- } catch {}
916
+ for (let attempt = 1; attempt <= maxFetchAttempts; attempt++) {
917
+ try {
918
+ if (currentModel) {
919
+ await shapeRequestForModel(currentModel);
920
+ }
921
+ const response = await fetch(input, activeFinalInit);
852
922
 
853
- const retryAfterMs = parseRetryAfter(response);
854
- const cooldownMs = clampCooldownMs(
855
- retryAfterMs,
856
- RATE_LIMIT_CONFIG.defaultCooldownMs,
857
- );
923
+ if (response.status === 429) {
924
+ try {
925
+ await response.body?.cancel();
926
+ } catch {}
858
927
 
859
- if (currentModel) {
860
- markModelRateLimited(currentModel, cooldownMs);
861
- openFamilyCircuitBreaker(currentModel, cooldownMs);
928
+ const retryAfterMs = parseRetryAfter(response);
929
+ const cooldownMs = clampCooldownMs(
930
+ retryAfterMs,
931
+ RATE_LIMIT_CONFIG.defaultCooldownMs,
932
+ );
933
+
934
+ if (currentModel) {
935
+ markModelRateLimited(currentModel, cooldownMs);
936
+ openFamilyCircuitBreaker(currentModel, cooldownMs);
937
+ }
938
+
939
+ throw new Error(
940
+ `[Copilot] Rate limited: ${currentModel || "model"} cooling down. Retry in ${formatRetryAfter(Math.ceil(cooldownMs / 1000))}.`,
941
+ );
862
942
  }
863
943
 
864
- throw new Error(
865
- `[Copilot] Rate limited: ${currentModel || "model"} cooling down. Retry in ${formatRetryAfter(Math.ceil(cooldownMs / 1000))}.`,
866
- );
867
- }
944
+ // Response transformation is handled by the custom SDK at
945
+ // .opencode/plugin/sdk/copilot/
946
+ return response;
947
+ } catch (error) {
948
+ const errorMessage = getErrorMessage(error);
949
+ if (
950
+ errorMessage.includes("Rate limited") ||
951
+ errorMessage.includes("Local request queue saturated")
952
+ ) {
953
+ throw error instanceof Error
954
+ ? error
955
+ : new Error(errorMessage);
956
+ }
957
+
958
+ if (
959
+ attempt < maxFetchAttempts &&
960
+ isTransientUpstreamTimeoutError(error)
961
+ ) {
962
+ const retryDelayMs = 750 * attempt;
963
+ log(
964
+ "warn",
965
+ `Transient upstream timeout from Copilot, retrying request`,
966
+ {
967
+ model: currentModel || undefined,
968
+ attempt,
969
+ retry_delay_ms: retryDelayMs,
970
+ error: errorMessage,
971
+ },
972
+ );
973
+ await sleep(retryDelayMs);
974
+ continue;
975
+ }
868
976
 
869
- // Response transformation is handled by the custom SDK at
870
- // .opencode/plugin/sdk/copilot/
871
- return response;
872
- } catch (error) {
873
- const lastError = error as Error;
874
- if (
875
- lastError.message.includes("Rate limited") ||
876
- lastError.message.includes("Local request queue saturated")
877
- ) {
878
- throw lastError;
977
+ if (isTransientUpstreamTimeoutError(error)) {
978
+ throw new Error(
979
+ `[Copilot] Upstream idle timeout while streaming ${currentModel || "request"}. Retry with a lower thinking budget or switch to a lower-latency Claude variant.`,
980
+ );
981
+ }
982
+
983
+ throw error;
879
984
  }
880
- throw error;
881
985
  }
986
+
987
+ throw new Error(
988
+ `[Copilot] Failed request after ${maxFetchAttempts} attempts.`,
989
+ );
882
990
  },
883
991
  };
884
992
  },
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "opencodekit",
3
- "version": "0.20.0",
3
+ "version": "0.20.2",
4
4
  "description": "CLI tool for bootstrapping and managing OpenCodeKit projects",
5
5
  "keywords": [
6
6
  "agents",