npm - cascade-ai - Versions diffs - 0.12.7 → 0.12.9 - Mend

cascade-ai 0.12.7 → 0.12.9

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (12) hide show

package/dist/cli.cjs +86 -12
package/dist/cli.cjs.map +1 -1
package/dist/cli.js +86 -12
package/dist/cli.js.map +1 -1
package/dist/desktop-core.cjs +299112 -0
package/dist/index.cjs +82 -9
package/dist/index.cjs.map +1 -1
package/dist/index.d.cts +7 -0
package/dist/index.d.ts +7 -0
package/dist/index.js +82 -9
package/dist/index.js.map +1 -1
package/package.json +1 -1

package/dist/cli.js CHANGED Viewed

@@ -54,7 +54,7 @@ var __export = (target, all) => {
 var CASCADE_VERSION, CASCADE_CONFIG_FILE, CASCADE_DB_FILE, CASCADE_DASHBOARD_SECRET_FILE, GLOBAL_CONFIG_DIR, GLOBAL_DB_FILE, GLOBAL_KEYSTORE_FILE, GLOBAL_RUNTIME_DB_FILE, DEFAULT_DASHBOARD_PORT, DEFAULT_CONTEXT_LIMIT, DEFAULT_AUTO_SUMMARIZE_AT, MODELS, T1_MODEL_PRIORITY, T2_MODEL_PRIORITY, T3_MODEL_PRIORITY, VISION_MODEL_PRIORITY, COMPLEXITY_T2_COUNT, THEME_NAMES, DEFAULT_THEME, OLLAMA_BASE_URL, LM_STUDIO_BASE_URL, AZURE_BASE_URL_TEMPLATE, TOOL_NAMES, DEFAULT_APPROVAL_REQUIRED;
 var init_constants = __esm({
   "src/constants.ts"() {
-    CASCADE_VERSION = "0.12.7";
+    CASCADE_VERSION = "0.12.9";
     CASCADE_CONFIG_FILE = ".cascade/config.json";
     CASCADE_DB_FILE = ".cascade/memory.db";
     CASCADE_DASHBOARD_SECRET_FILE = ".cascade/dashboard-secret";
@@ -455,6 +455,12 @@ var anthropic_exports = {};
 __export(anthropic_exports, {
   AnthropicProvider: () => AnthropicProvider
 });
+function anthropicThinkingParam(modelId, maxTokens) {
+  if (!/claude-(opus|sonnet)-4/i.test(modelId)) return {};
+  const budget = Math.min(8e3, maxTokens - 1024);
+  if (budget < 1024) return {};
+  return { thinking: { type: "enabled", budget_tokens: budget } };
+}
 var AnthropicProvider;
 var init_anthropic = __esm({
   "src/providers/anthropic.ts"() {
@@ -489,13 +495,18 @@ var init_anthropic = __esm({
         let fullContent = "";
         let inputTokens = 0;
         let outputTokens = 0;
+        const maxTokens = options.maxTokens ?? this.model.maxOutputTokens;
+        const thinkParam = anthropicThinkingParam(this.model.id, maxTokens);
+        const useThinking = !!thinkParam.thinking;
         const stream = this.client.messages.stream({
           model: this.model.id,
-          max_tokens: options.maxTokens ?? this.model.maxOutputTokens,
-          temperature: options.temperature ?? 0.7,
+          max_tokens: maxTokens,
+          // Extended thinking requires temperature = 1; otherwise honor the request.
+          temperature: useThinking ? 1 : options.temperature ?? 0.7,
           system: options.systemPrompt,
           messages,
-          tools: tools?.length ? tools : void 0
+          tools: tools?.length ? tools : void 0,
+          ...thinkParam
         }, { signal: options.signal });
         let isThinking = false;
         for await (const event of stream) {
@@ -3322,6 +3333,7 @@ var ModelSelector = class {
       if (lower.includes("claude")) providerStr = "anthropic";
       else if (lower.startsWith("gpt") || lower.startsWith("o1") || lower.startsWith("o3")) providerStr = "openai";
       else if (lower.includes("gemini")) providerStr = "gemini";
+      else if ((lower.endsWith(".gguf") || actualId.includes("/") || actualId.includes("\\")) && this.availableProviders.has("openai-compatible")) providerStr = "openai-compatible";
       else if (this.availableProviders.has("ollama")) providerStr = "ollama";
       else if (this.availableProviders.has("openai-compatible")) providerStr = "openai-compatible";
       else if (this.availableProviders.size === 1) providerStr = Array.from(this.availableProviders)[0];
@@ -4004,6 +4016,11 @@ var CascadeRouter = class _CascadeRouter extends EventEmitter {
     if (availableProviders.has("ollama")) {
       await this.discoverOllamaModels(ollamaCfg);
     }
+    if (availableProviders.has("openai-compatible")) {
+      await Promise.all(
+        config.providers.filter((p) => p.type === "openai-compatible").map((cfg) => this.discoverOpenAICompatibleModels(cfg))
+      );
+    }
     for (const tier of ["T1", "T2", "T3"]) {
       const override = tier === "T1" ? config.models.t1 : tier === "T2" ? config.models.t2 : config.models.t3;
       if (!override || override === "auto") continue;
@@ -4435,6 +4452,14 @@ var CascadeRouter = class _CascadeRouter extends EventEmitter {
   getModelsForProvider(provider) {
     return this.selector.getAvailableModelsForProvider(provider);
   }
+  /**
+   * Every model available across the configured + reachable providers, after
+   * discovery (Ollama tags, OpenAI-compatible/llama.cpp models, cloud catalog).
+   * Used to populate the desktop model pickers with the user's real models.
+   */
+  getAvailableModels() {
+    return this.selector?.getAllAvailableModels() ?? [];
+  }
   // ── Private ──────────────────────────────────
   async detectAvailableProviders(configs) {
     const available = /* @__PURE__ */ new Set();
@@ -4465,6 +4490,28 @@ var CascadeRouter = class _CascadeRouter extends EventEmitter {
     } catch {
     }
   }
+  async discoverOpenAICompatibleModels(cfg) {
+    try {
+      const seed = {
+        id: "openai-compatible",
+        name: "openai-compatible",
+        provider: "openai-compatible",
+        contextWindow: 32e3,
+        isVisionCapable: false,
+        inputCostPer1kTokens: 0,
+        outputCostPer1kTokens: 0,
+        maxOutputTokens: 4e3,
+        supportsStreaming: true,
+        isLocal: false
+      };
+      const provider = new OpenAICompatibleProvider(cfg, seed);
+      const models = await provider.listModels();
+      for (const m of models) {
+        this.selector.addDynamicModel(m);
+      }
+    } catch {
+    }
+  }
   ensureProvider(model, configs) {
     const key = `${model.provider}:${model.id}`;
     if (this.providers.has(key)) return;
@@ -4494,7 +4541,23 @@ var CascadeRouter = class _CascadeRouter extends EventEmitter {
     }
   }
   getAnyModelForProvider(type) {
-    return Object.values(MODELS).find((m) => m.provider === type);
+    const fromCatalog = Object.values(MODELS).find((m) => m.provider === type);
+    if (fromCatalog) return fromCatalog;
+    if (type === "openai-compatible" || type === "azure") {
+      return {
+        id: type,
+        name: type,
+        provider: type,
+        contextWindow: 32e3,
+        isVisionCapable: false,
+        inputCostPer1kTokens: 0,
+        outputCostPer1kTokens: 0,
+        maxOutputTokens: 4e3,
+        supportsStreaming: true,
+        isLocal: false
+      };
+    }
+    return void 0;
   }
   recordStats(tier, model, usage) {
     this.stats.totalTokens += usage.totalTokens;
@@ -10363,7 +10426,11 @@ ${last.partialOutput}` : "");
   looksLikeConversational(prompt) {
     const LOW_COMPLEXITY = [
       /^(?:hi|hello|hey|thanks|thank you|ok|okay|yes|no|sure|got it|sounds good)\b/i,
-      /^(?:what is|what are|list|show me|tell me|who is|where is|when is|how do i)\b/i,
+      /^(?:what is|what are|what'?s|list|show me|tell me|who is|who are|who'?re|where is|when is|how do i)\b/i,
+      // Self-identity / capability questions ("who are you", "what can you do",
+      // "who made you") are pure conversation — never a multi-agent build.
+      /^(?:who|what)\b.*\byou\b/i,
+      /^what can you\b/i,
       /\b(?:simple|quick|brief|small|single|one-line|typo|rename)\b/i
     ];
     const wordCount = prompt.trim().split(/\s+/).length;
@@ -10461,10 +10528,16 @@ ${prompt}` : prompt;
         temperature: 0
       });
       const content = result.content.trim();
-      const firstWord = (content.split(/[\s—–-]+/)[0] ?? "").toLowerCase();
+      const match = content.toLowerCase().match(/\b(simple|moderate|complex)\b/);
       const reason = content.replace(/^\S+\s*[—–-]*\s*/, "").trim();
-      const verdict = firstWord.includes("simple") ? "Simple" : firstWord.includes("moderate") ? "Moderate" : "Complex";
-      this.recordDecision("complexity", `${verdict} \u2014 classifier: ${reason || "no reason given"}`);
+      let verdict;
+      if (match) {
+        verdict = match[1] === "simple" ? "Simple" : match[1] === "moderate" ? "Moderate" : "Complex";
+        this.recordDecision("complexity", `${verdict} \u2014 classifier: ${reason || "no reason given"}`);
+      } else {
+        verdict = prompt.trim().split(/\s+/).length <= 12 ? "Simple" : "Moderate";
+        this.recordDecision("complexity", `${verdict} \u2014 classifier output unparseable; defaulted by length`);
+      }
       return verdict;
     } catch {
       const followUpPrompt = /^(proceed|continue|go ahead|do it|yes|yep|ok|okay|carry on)$/i.test(prompt.trim());
@@ -13873,7 +13946,8 @@ function SetupWizard({ workspacePath, onComplete }) {
         ) })
       ] });
     }
-    const prompt = isAzure && fieldStage === "deploymentName" ? `Azure deployment name (${currentEntry.label})` : isAzure && fieldStage === "baseUrl" ? `Azure endpoint URL` : isAzure && fieldStage === "apiKey" ? `${currentEntry.label} API Key` : isAzure && fieldStage === "apiVersion" ? `Azure API version (e.g. 2024-08-01-preview)` : isCompat && fieldStage === "label" ? `Name for this endpoint (e.g. Groq)` : isCompat && fieldStage === "baseUrl" ? `Base URL (e.g. https://api.groq.com/openai/v1)` : isOllama ? `Ollama URL` : `${currentEntry.label} API Key`;
+    const prompt = isAzure && fieldStage === "deploymentName" ? `Azure deployment name (${currentEntry.label})` : isAzure && fieldStage === "baseUrl" ? `Azure endpoint URL` : isAzure && fieldStage === "apiKey" ? `${currentEntry.label} API Key` : isAzure && fieldStage === "apiVersion" ? `Azure API version (e.g. 2024-08-01-preview)` : isCompat && fieldStage === "label" ? `Name for this endpoint (e.g. Groq)` : isCompat && fieldStage === "baseUrl" ? `Base URL (e.g. https://api.groq.com/openai/v1)` : isCompat && fieldStage === "apiKey" ? `${currentEntry.label} API Key (optional)` : isOllama ? `Ollama URL` : `${currentEntry.label} API Key`;
+    const keyOptional = isCompat && fieldStage === "apiKey";
     const isMasked = fieldStage === "apiKey" && !isOllama;
     return /* @__PURE__ */ jsxs(Frame, { theme, phase: "keys", children: [
       doneEntries.length > 0 && /* @__PURE__ */ jsx(Box, { flexDirection: "column", marginBottom: 1, children: doneEntries.map((e) => /* @__PURE__ */ jsxs(Box, { children: [
@@ -13891,8 +13965,8 @@ function SetupWizard({ workspacePath, onComplete }) {
         {
           theme,
           label: prompt,
-          tag: isOllama ? "optional \u2014 Enter for default" : "required",
-          tagColor: isOllama ? theme.colors.muted : theme.colors.error,
+          tag: isOllama ? "optional \u2014 Enter for default" : keyOptional ? "optional \u2014 Enter to skip" : "required",
+          tagColor: isOllama || keyOptional ? theme.colors.muted : theme.colors.error,
           active: true,
           children: /* @__PURE__ */ jsx(
             SafeTextInput,