npm - @calliopelabs/cli - Versions diffs - 2.3.0 → 2.5.0 - Mend

@calliopelabs/cli 2.3.0 → 2.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (186)

package/README.md +17 -0
package/dist/agents/agent-config-loader.js +1 -1
package/dist/agents/agent-config-presets.js +13 -13
package/dist/agents/agent-config-presets.js.map +1 -1
package/dist/agents/agent-config-types.d.ts +1 -1
package/dist/agents/agent-config-types.d.ts.map +1 -1
package/dist/agents/dynamic-tools.d.ts.map +1 -1
package/dist/agents/dynamic-tools.js +39 -10
package/dist/agents/dynamic-tools.js.map +1 -1
package/dist/agents/sdk-backend.js +1 -1
package/dist/agents/sdk-backend.js.map +1 -1
package/dist/api-server.d.ts +9 -0
package/dist/api-server.d.ts.map +1 -1
package/dist/api-server.js +74 -3
package/dist/api-server.js.map +1 -1
package/dist/auto-checkpoint.d.ts.map +1 -1
package/dist/auto-checkpoint.js +50 -17
package/dist/auto-checkpoint.js.map +1 -1
package/dist/auto-compressor.d.ts.map +1 -1
package/dist/auto-compressor.js +9 -5
package/dist/auto-compressor.js.map +1 -1
package/dist/bin.d.ts +8 -0
package/dist/bin.d.ts.map +1 -1
package/dist/bin.js +59 -4
package/dist/bin.js.map +1 -1
package/dist/branching.d.ts.map +1 -1
package/dist/branching.js +14 -1
package/dist/branching.js.map +1 -1
package/dist/checkpoint.d.ts.map +1 -1
package/dist/checkpoint.js +13 -1
package/dist/checkpoint.js.map +1 -1
package/dist/cli/agent.d.ts.map +1 -1
package/dist/cli/agent.js +19 -3
package/dist/cli/agent.js.map +1 -1
package/dist/cli/commands.d.ts.map +1 -1
package/dist/cli/commands.js +99 -0
package/dist/cli/commands.js.map +1 -1
package/dist/cli/index.d.ts.map +1 -1
package/dist/cli/index.js +32 -1
package/dist/cli/index.js.map +1 -1
package/dist/cli/types.js +1 -1
package/dist/cli/types.js.map +1 -1
package/dist/config.js +2 -2
package/dist/config.js.map +1 -1
package/dist/diff.d.ts.map +1 -1
package/dist/diff.js +42 -4
package/dist/diff.js.map +1 -1
package/dist/errors.d.ts.map +1 -1
package/dist/errors.js +30 -3
package/dist/errors.js.map +1 -1
package/dist/headless.d.ts.map +1 -1
package/dist/headless.js +56 -2
package/dist/headless.js.map +1 -1
package/dist/hooks.d.ts +8 -2
package/dist/hooks.d.ts.map +1 -1
package/dist/hooks.js +97 -11
package/dist/hooks.js.map +1 -1
package/dist/idle-eviction.d.ts.map +1 -1
package/dist/idle-eviction.js +8 -1
package/dist/idle-eviction.js.map +1 -1
package/dist/markdown.d.ts.map +1 -1
package/dist/markdown.js +32 -10
package/dist/markdown.js.map +1 -1
package/dist/mcp.d.ts +35 -5
package/dist/mcp.d.ts.map +1 -1
package/dist/mcp.js +186 -12
package/dist/mcp.js.map +1 -1
package/dist/model-detection.d.ts +14 -1
package/dist/model-detection.d.ts.map +1 -1
package/dist/model-detection.js +307 -114
package/dist/model-detection.js.map +1 -1
package/dist/model-router.js +7 -7
package/dist/model-router.js.map +1 -1
package/dist/parallel-tools.d.ts +9 -1
package/dist/parallel-tools.d.ts.map +1 -1
package/dist/parallel-tools.js +6 -5
package/dist/parallel-tools.js.map +1 -1
package/dist/plugins.d.ts +37 -0
package/dist/plugins.d.ts.map +1 -1
package/dist/plugins.js +87 -0
package/dist/plugins.js.map +1 -1
package/dist/providers/anthropic.d.ts.map +1 -1
package/dist/providers/anthropic.js +36 -2
package/dist/providers/anthropic.js.map +1 -1
package/dist/providers/bedrock.d.ts.map +1 -1
package/dist/providers/bedrock.js +81 -17
package/dist/providers/bedrock.js.map +1 -1
package/dist/providers/index.d.ts.map +1 -1
package/dist/providers/index.js +2 -0
package/dist/providers/index.js.map +1 -1
package/dist/providers/types.d.ts.map +1 -1
package/dist/providers/types.js +19 -10
package/dist/providers/types.js.map +1 -1
package/dist/risk.d.ts.map +1 -1
package/dist/risk.js +15 -5
package/dist/risk.js.map +1 -1
package/dist/sandbox-native.d.ts +1 -0
package/dist/sandbox-native.d.ts.map +1 -1
package/dist/sandbox-native.js +37 -5
package/dist/sandbox-native.js.map +1 -1
package/dist/scope.d.ts +10 -0
package/dist/scope.d.ts.map +1 -1
package/dist/scope.js +75 -15
package/dist/scope.js.map +1 -1
package/dist/scuttlebot/client.d.ts +83 -0
package/dist/scuttlebot/client.d.ts.map +1 -0
package/dist/scuttlebot/client.js +350 -0
package/dist/scuttlebot/client.js.map +1 -0
package/dist/scuttlebot/config.d.ts +28 -0
package/dist/scuttlebot/config.d.ts.map +1 -0
package/dist/scuttlebot/config.js +91 -0
package/dist/scuttlebot/config.js.map +1 -0
package/dist/scuttlebot/http-client.d.ts +63 -0
package/dist/scuttlebot/http-client.d.ts.map +1 -0
package/dist/scuttlebot/http-client.js +124 -0
package/dist/scuttlebot/http-client.js.map +1 -0
package/dist/scuttlebot/index.d.ts +13 -0
package/dist/scuttlebot/index.d.ts.map +1 -0
package/dist/scuttlebot/index.js +10 -0
package/dist/scuttlebot/index.js.map +1 -0
package/dist/scuttlebot/irc-client.d.ts +124 -0
package/dist/scuttlebot/irc-client.d.ts.map +1 -0
package/dist/scuttlebot/irc-client.js +599 -0
package/dist/scuttlebot/irc-client.js.map +1 -0
package/dist/skills.d.ts +19 -0
package/dist/skills.d.ts.map +1 -1
package/dist/skills.js +98 -10
package/dist/skills.js.map +1 -1
package/dist/smart-router.js +4 -4
package/dist/smart-router.js.map +1 -1
package/dist/storage.d.ts +0 -4
package/dist/storage.d.ts.map +1 -1
package/dist/storage.js +81 -5
package/dist/storage.js.map +1 -1
package/dist/tools.d.ts.map +1 -1
package/dist/tools.js +232 -38
package/dist/tools.js.map +1 -1
package/dist/trust.d.ts +16 -3
package/dist/trust.d.ts.map +1 -1
package/dist/trust.js +23 -4
package/dist/trust.js.map +1 -1
package/dist/types.d.ts.map +1 -1
package/dist/types.js +13 -4
package/dist/types.js.map +1 -1
package/dist/ui/agent.d.ts +1 -1
package/dist/ui/agent.d.ts.map +1 -1
package/dist/ui/agent.js +35 -44
package/dist/ui/agent.js.map +1 -1
package/dist/ui/chat-input.d.ts +3 -1
package/dist/ui/chat-input.d.ts.map +1 -1
package/dist/ui/chat-input.js +82 -17
package/dist/ui/chat-input.js.map +1 -1
package/dist/ui/commands.d.ts +2 -0
package/dist/ui/commands.d.ts.map +1 -1
package/dist/ui/commands.js +318 -10
package/dist/ui/commands.js.map +1 -1
package/dist/ui/index.d.ts.map +1 -1
package/dist/ui/index.js +236 -46
package/dist/ui/index.js.map +1 -1
package/dist/ui/input-utils.d.ts +20 -0
package/dist/ui/input-utils.d.ts.map +1 -0
package/dist/ui/input-utils.js +35 -0
package/dist/ui/input-utils.js.map +1 -0
package/dist/ui/messages.d.ts +6 -2
package/dist/ui/messages.d.ts.map +1 -1
package/dist/ui/messages.js +42 -11
package/dist/ui/messages.js.map +1 -1
package/dist/ui/modals.d.ts +21 -1
package/dist/ui/modals.d.ts.map +1 -1
package/dist/ui/modals.js +67 -5
package/dist/ui/modals.js.map +1 -1
package/dist/ui/status-bar.d.ts +4 -1
package/dist/ui/status-bar.d.ts.map +1 -1
package/dist/ui/status-bar.js +12 -1
package/dist/ui/status-bar.js.map +1 -1
package/dist/ui/types.d.ts +3 -0
package/dist/ui/types.d.ts.map +1 -1
package/package.json +4 -7
package/dist/completion.d.ts +0 -75
package/dist/completion.d.ts.map +0 -1
package/dist/completion.js +0 -234
package/dist/completion.js.map +0 -1
package/dist/keyboard.d.ts +0 -57
package/dist/keyboard.d.ts.map +0 -1
package/dist/keyboard.js +0 -265
package/dist/keyboard.js.map +0 -1

package/dist/model-detection.js CHANGED

@@ -6,6 +6,17 @@
 import OpenAI from 'openai';
 import { select } from '@inquirer/prompts';
 import * as config from './config.js';
+const DEBUG = process.env.CALLIOPE_DEBUG === '1';
+function logModelDetectionWarning(message, error, options = {}) {
+    if (options.quiet || !DEBUG) {
+        return;
+    }
+    if (error !== undefined) {
+        console.warn(message, error);
+        return;
+    }
+    console.warn(message);
+}
 // API base URLs for OpenAI-compatible providers
 const PROVIDER_BASE_URLS = {
     openrouter: 'https://openrouter.ai/api/v1',
@@ -172,7 +183,7 @@ function formatContextLength(tokens) {
 /**
  * Get available models for a provider
  */
-export async function getAvailableModels(provider) {
+export async function getAvailableModels(provider, options = {}) {
     // Check cache first
     const cached = modelCache.get(provider);
     if (cached && Date.now() - cached.timestamp < CACHE_DURATION) {
@@ -182,10 +193,10 @@ export async function getAvailableModels(provider) {
     try {
         switch (provider) {
             case 'anthropic':
-                models = await getAnthropicModels();
+                models = await getAnthropicModels(options);
                 break;
             case 'google':
-                models = await getGoogleModels();
+                models = await getGoogleModels(options);
                 break;
             case 'openai':
                 models = await getOpenAIModels();
@@ -226,14 +237,16 @@ export async function getAvailableModels(provider) {
         modelCache.set(provider, { models, timestamp: Date.now() });
     }
     catch (error) {
-        console.warn(`Failed to fetch models for ${provider}:`, error);
+        logModelDetectionWarning(`Failed to fetch models for ${provider}:`, error, options);
+        if (options.throwOnError)
+            throw error;
     }
     return models;
 }
 /**
  * Get Anthropic models dynamically from API
  */
-async function getAnthropicModels() {
+async function getAnthropicModels(options = {}) {
     const apiKey = config.getApiKey('anthropic');
     if (!apiKey)
         throw new Error('Anthropic API key not configured');
@@ -254,18 +267,20 @@ async function getAnthropicModels() {
             id: model.id,
             name: model.display_name || formatModelName(model.id),
             description: getAnthropicModelDescription(model.id),
-            contextLength: 200000,
+            // The /v1/models list endpoint does not return the context window;
+            // derive it per model family rather than hardcoding a single value.
+            contextLength: getModelContextLimit('anthropic', model.id),
         }))
             .sort((a, b) => b.id.localeCompare(a.id)); // Newest first
     }
     catch (error) {
-        // Fallback to known models if API fails
-        console.warn('Failed to fetch Anthropic models, using fallback list');
+        // Emergency fallback when the API is unreachable. Keep these as the current
+        // shipping models — discovery is the source of truth; this is the offline net.
+        logModelDetectionWarning('Failed to fetch Anthropic models, using fallback list', error, options);
         return [
-            { id: 'claude-opus-4-5-20251101', name: 'Claude Opus 4.5', description: 'Most capable model', contextLength: 200000 },
-            { id: 'claude-sonnet-4-20250514', name: 'Claude Sonnet 4', description: 'Balanced intelligence and speed', contextLength: 200000 },
-            { id: 'claude-3-5-sonnet-20241022', name: 'Claude 3.5 Sonnet', description: 'Previous gen flagship', contextLength: 200000 },
-            { id: 'claude-3-5-haiku-20241022', name: 'Claude 3.5 Haiku', description: 'Fast and affordable', contextLength: 200000 },
+            { id: 'claude-opus-4-8', name: 'Claude Opus 4.8', description: 'Most capable model', contextLength: 1000000 },
+            { id: 'claude-sonnet-4-6', name: 'Claude Sonnet 4.6', description: 'Balanced intelligence and speed', contextLength: 1000000 },
+            { id: 'claude-haiku-4-5', name: 'Claude Haiku 4.5', description: 'Fast and affordable', contextLength: 200000 },
         ];
     }
 }
@@ -290,7 +305,7 @@ function getAnthropicModelDescription(modelId) {
 /**
  * Get Google models dynamically from API
  */
-async function getGoogleModels() {
+async function getGoogleModels(options = {}) {
     const apiKey = config.getApiKey('google');
     if (!apiKey)
         throw new Error('Google API key not configured');
@@ -316,7 +331,7 @@ async function getGoogleModels() {
     }
     catch (error) {
         // Fallback to known models if API fails
-        console.warn('Failed to fetch Google models, using fallback list');
+        logModelDetectionWarning('Failed to fetch Google models, using fallback list', error, options);
         return [
             { id: 'gemini-2.5-pro-preview-06-05', name: 'Gemini 2.5 Pro', description: 'Most capable', contextLength: 1048576 },
             { id: 'gemini-2.5-flash-preview-05-20', name: 'Gemini 2.5 Flash', description: 'Fast next-gen', contextLength: 1048576 },
@@ -594,45 +609,67 @@ async function getBedrockModels() {
     const apiKey = config.getApiKey('bedrock');
     // 1. Try gateway/proxy model listing (OpenAI-compatible)
     if (baseUrl) {
-        try {
-            const modelsUrl = baseUrl.endsWith('/v1') ? `${baseUrl}/models` : `${baseUrl}/v1/models`;
-            const headers = {};
-            if (apiKey) {
-                headers['Authorization'] = `Bearer ${apiKey}`;
-            }
-            const response = await fetch(modelsUrl, { headers });
-            if (response.ok) {
-                const data = await response.json();
-                return data.data
-                    .filter(model => isCompatibleModel(model.id, 'bedrock'))
-                    .map(model => ({
-                    id: model.id,
-                    name: model.id,
-                    description: getBedrockModelDescription(model.id),
-                    contextLength: getBedrockContextLength(model.id),
-                }));
-            }
+        const modelsUrl = baseUrl.endsWith('/v1') ? `${baseUrl}/models` : `${baseUrl}/v1/models`;
+        const headers = {};
+        if (apiKey) {
+            headers['Authorization'] = `Bearer ${apiKey}`;
         }
-        catch {
-            // Fall through to native discovery
+        const response = await fetch(modelsUrl, { headers });
+        if (response.ok) {
+            const data = await response.json();
+            return data.data
+                .filter(model => isCompatibleModel(model.id, 'bedrock'))
+                .map(model => ({
+                id: model.id,
+                name: model.id,
+                description: getBedrockModelDescription(model.id),
+                contextLength: getBedrockContextLength(model.id),
+            }));
         }
+        throw new Error(`Bedrock gateway ${baseUrl} returned ${response.status}. Check BEDROCK_BASE_URL / BEDROCK_API_KEY.`);
     }
-    // 2. Try native AWS ListFoundationModels API
+    // 2. Native AWS path — let errors bubble up so the user sees the real reason.
+    return discoverBedrockModelsNative();
+}
+/**
+ * Resolve AWS credentials via the `aws` CLI. Handles SSO profiles,
+ * role-assumption profiles, and anything else `aws` knows about.
+ * Returns null if the CLI isn't installed or the profile resolution fails.
+ */
+async function resolveAwsCredentialsViaCli(profile) {
     try {
-        const hasNativeCreds = !!((process.env.AWS_ACCESS_KEY_ID && process.env.AWS_SECRET_ACCESS_KEY) ||
-            process.env.AWS_PROFILE ||
-            (await import('fs')).existsSync((await import('path')).join((await import('os')).homedir(), '.aws', 'credentials')));
-        if (hasNativeCreds) {
-            const nativeModels = await discoverBedrockModelsNative();
-            if (nativeModels.length > 0)
-                return nativeModels;
+        const { execFileSync } = await import('child_process');
+        let output = '';
+        try {
+            output = execFileSync('aws', ['configure', 'export-credentials', '--profile', profile, '--format', 'env-no-export'], { encoding: 'utf-8', timeout: 10_000, stdio: ['ignore', 'pipe', 'pipe'] });
+        }
+        catch {
+            output = execFileSync('aws', ['configure', 'export-credentials', '--profile', profile, '--format', 'env'], { encoding: 'utf-8', timeout: 10_000, stdio: ['ignore', 'pipe', 'pipe'] });
         }
+        const envs = {};
+        for (const rawLine of output.split(/\r?\n/)) {
+            const line = rawLine.trim();
+            const match = line.match(/^(?:export\s+)?([A-Z_]+)\s*=\s*(.+)$/);
+            if (!match)
+                continue;
+            let val = match[2].trim();
+            if ((val.startsWith('"') && val.endsWith('"')) || (val.startsWith("'") && val.endsWith("'"))) {
+                val = val.slice(1, -1);
+            }
+            envs[match[1]] = val;
+        }
+        if (envs.AWS_ACCESS_KEY_ID && envs.AWS_SECRET_ACCESS_KEY) {
+            return {
+                accessKeyId: envs.AWS_ACCESS_KEY_ID,
+                secretAccessKey: envs.AWS_SECRET_ACCESS_KEY,
+                sessionToken: envs.AWS_SESSION_TOKEN,
+            };
+        }
+        return null;
     }
     catch {
-        // Fall through to minimal fallback
+        return null;
     }
-    // 3. No hardcoded fallback — the default model from types.ts is used when list is empty
-    return [];
 }
 /**
  * Discover Bedrock models using the native AWS ListFoundationModels API.
@@ -647,85 +684,184 @@ async function discoverBedrockModelsNative() {
     let accessKeyId = process.env.AWS_ACCESS_KEY_ID || '';
     let secretAccessKey = process.env.AWS_SECRET_ACCESS_KEY || '';
     let sessionToken = process.env.AWS_SESSION_TOKEN;
-    if (!accessKeyId || !secretAccessKey) {
-        const profile = process.env.AWS_PROFILE || config.get('awsProfile') || 'default';
-        const credPath = join(homedir(), '.aws', 'credentials');
-        if (existsSync(credPath)) {
-            const content = readFileSync(credPath, 'utf-8');
-            const sections = {};
-            let section = '';
-            for (const line of content.split('\n')) {
-                const trimmed = line.trim();
-                const secMatch = trimmed.match(/^\[(.+)\]$/);
-                if (secMatch) {
-                    section = secMatch[1];
-                    sections[section] = {};
-                    continue;
-                }
-                const kvMatch = trimmed.match(/^([^=]+?)\s*=\s*(.+)$/);
-                if (kvMatch && section)
-                    sections[section][kvMatch[1].trim()] = kvMatch[2].trim();
-            }
-            const cred = sections[profile];
-            if (cred?.aws_access_key_id) {
-                accessKeyId = cred.aws_access_key_id;
-                secretAccessKey = cred.aws_secret_access_key || '';
-                sessionToken = cred.aws_session_token;
+    const profile = process.env.AWS_PROFILE || config.get('awsProfile') || 'default';
+    // Parse an INI-style AWS file. Handles both ~/.aws/credentials sections
+    // ([name]) and ~/.aws/config sections ([profile name]).
+    const readIni = (path) => {
+        if (!existsSync(path))
+            return {};
+        const content = readFileSync(path, 'utf-8');
+        const sections = {};
+        let section = '';
+        for (const line of content.split('\n')) {
+            const trimmed = line.trim();
+            if (!trimmed || trimmed.startsWith('#') || trimmed.startsWith(';'))
+                continue;
+            const secMatch = trimmed.match(/^\[(.+)\]$/);
+            if (secMatch) {
+                section = secMatch[1].replace(/^profile\s+/, '');
+                sections[section] = sections[section] || {};
+                continue;
             }
+            const kvMatch = trimmed.match(/^([^=]+?)\s*=\s*(.+)$/);
+            if (kvMatch && section)
+                sections[section][kvMatch[1].trim()] = kvMatch[2].trim();
+        }
+        return sections;
+    };
+    if (!accessKeyId || !secretAccessKey) {
+        // Try ~/.aws/credentials (static keys) first, then ~/.aws/config (also
+        // used by some setups that put static keys alongside SSO config).
+        const credSections = readIni(join(homedir(), '.aws', 'credentials'));
+        const configSections = readIni(join(homedir(), '.aws', 'config'));
+        const cred = credSections[profile] || configSections[profile];
+        if (cred?.aws_access_key_id) {
+            accessKeyId = cred.aws_access_key_id;
+            secretAccessKey = cred.aws_secret_access_key || '';
+            sessionToken = cred.aws_session_token;
         }
     }
-    if (!accessKeyId || !secretAccessKey)
-        return [];
+    // Last resort: shell out to the AWS CLI. This resolves SSO / role-assumption
+    // profiles that can't be parsed from the INI files alone.
+    if (!accessKeyId || !secretAccessKey) {
+        const cliCreds = await resolveAwsCredentialsViaCli(profile);
+        if (cliCreds) {
+            accessKeyId = cliCreds.accessKeyId;
+            secretAccessKey = cliCreds.secretAccessKey;
+            sessionToken = cliCreds.sessionToken;
+        }
+    }
+    if (!accessKeyId || !secretAccessKey) {
+        throw new Error(`No AWS credentials found for profile "${profile}". ` +
+            `Try: aws sso login --profile ${profile}  (for SSO), or set AWS_ACCESS_KEY_ID + AWS_SECRET_ACCESS_KEY.`);
+    }
     const region = process.env.AWS_REGION || process.env.AWS_DEFAULT_REGION || config.get('awsRegion') || 'us-east-1';
     const host = `bedrock.${region}.amazonaws.com`;
-    const url = `https://${host}/foundation-models?byOutputModality=TEXT&byInferenceType=ON_DEMAND`;
-    // SigV4 sign
-    const now = new Date();
-    const amzDate = now.toISOString().replace(/[:-]|\.\d{3}/g, '');
-    const dateStamp = amzDate.slice(0, 8);
-    const sha256Fn = (d) => createHash('sha256').update(d).digest('hex');
-    const hmacFn = (k, d) => createHmac('sha256', k).update(d).digest();
-    const headers = {
-        'host': host,
-        'x-amz-date': amzDate,
+    const signedGet = async (path, query) => {
+        const url = `https://${host}${path}${query ? '?' + query : ''}`;
+        const now = new Date();
+        const amzDate = now.toISOString().replace(/[:-]|\.\d{3}/g, '');
+        const dateStamp = amzDate.slice(0, 8);
+        const sha256Fn = (d) => createHash('sha256').update(d).digest('hex');
+        const hmacFn = (k, d) => createHmac('sha256', k).update(d).digest();
+        const headers = { host, 'x-amz-date': amzDate };
+        if (sessionToken)
+            headers['x-amz-security-token'] = sessionToken;
+        const signedHeaderKeys = Object.keys(headers).map(k => k.toLowerCase()).sort();
+        const signedHeaders = signedHeaderKeys.join(';');
+        const canonicalHeaders = signedHeaderKeys.map(k => `${k}:${headers[k].trim()}`).join('\n') + '\n';
+        const payloadHash = sha256Fn('');
+        // AWS SigV4: non-S3 services require the canonical URI to be URI-encoded
+        // TWICE. Paths here don't currently contain special chars but we normalise
+        // for consistency with the chat signing path.
+        const canonicalPath = path.split('/').map(s => encodeURIComponent(s)).join('/');
+        const canonicalRequest = ['GET', canonicalPath, query, canonicalHeaders, signedHeaders, payloadHash].join('\n');
+        const credentialScope = `${dateStamp}/${region}/bedrock/aws4_request`;
+        const stringToSign = ['AWS4-HMAC-SHA256', amzDate, credentialScope, sha256Fn(canonicalRequest)].join('\n');
+        const kDate = hmacFn('AWS4' + secretAccessKey, dateStamp);
+        const kRegion = hmacFn(kDate, region);
+        const kService = hmacFn(kRegion, 'bedrock');
+        const signingKey = hmacFn(kService, 'aws4_request');
+        const signature = createHmac('sha256', signingKey).update(stringToSign).digest('hex');
+        headers['Authorization'] = `AWS4-HMAC-SHA256 Credential=${accessKeyId}/${credentialScope}, SignedHeaders=${signedHeaders}, Signature=${signature}`;
+        return fetch(url, { headers });
     };
-    if (sessionToken)
-        headers['x-amz-security-token'] = sessionToken;
-    const parsedUrl = new URL(url);
-    const signedHeaderKeys = Object.keys(headers).map(k => k.toLowerCase()).sort();
-    const signedHeaders = signedHeaderKeys.join(';');
-    const canonicalHeaders = signedHeaderKeys.map(k => `${k}:${headers[k].trim()}`).join('\n') + '\n';
-    const payloadHash = sha256Fn('');
-    const canonicalRequest = ['GET', parsedUrl.pathname, parsedUrl.search.slice(1), canonicalHeaders, signedHeaders, payloadHash].join('\n');
-    const credentialScope = `${dateStamp}/${region}/bedrock/aws4_request`;
-    const stringToSign = ['AWS4-HMAC-SHA256', amzDate, credentialScope, sha256Fn(canonicalRequest)].join('\n');
-    const kDate = hmacFn('AWS4' + secretAccessKey, dateStamp);
-    const kRegion = hmacFn(kDate, region);
-    const kService = hmacFn(kRegion, 'bedrock');
-    const signingKey = hmacFn(kService, 'aws4_request');
-    const signature = createHmac('sha256', signingKey).update(stringToSign).digest('hex');
-    headers['Authorization'] = `AWS4-HMAC-SHA256 Credential=${accessKeyId}/${credentialScope}, SignedHeaders=${signedHeaders}, Signature=${signature}`;
-    const response = await fetch(url, { headers });
-    if (!response.ok)
-        return [];
-    const data = await response.json();
-    if (!data.modelSummaries)
-        return [];
-    return data.modelSummaries
-        .filter(m => {
-        // Only text-in/text-out models that support streaming
-        if (!m.outputModalities?.includes('TEXT'))
-            return false;
-        if (!m.inputModalities?.includes('TEXT'))
-            return false;
-        return isCompatibleModel(m.modelId, 'bedrock');
-    })
+    // 1. ListFoundationModels (direct on-demand access).
+    // Dropped the byInferenceType=ON_DEMAND filter — newer Claude models are only
+    // accessible via cross-region inference profiles and don't have ON_DEMAND flag.
+    const foundationResp = await signedGet('/foundation-models', 'byOutputModality=TEXT');
+    if (!foundationResp.ok) {
+        let body = '';
+        try {
+            body = (await foundationResp.text()).slice(0, 400);
+        }
+        catch { /* ignore */ }
+        throw new Error(`AWS Bedrock ListFoundationModels returned ${foundationResp.status} in region ${region}. ` +
+            (body || 'Common causes: (1) no Bedrock access in this region — try us-east-1 or us-west-2; ' +
+                '(2) IAM role missing bedrock:ListFoundationModels; (3) SSO token expired — run `aws sso login`.'));
+    }
+    const foundationData = await foundationResp.json();
+    const foundationModels = (foundationData.modelSummaries || [])
+        .filter(m => m.inputModalities?.includes('TEXT') && m.outputModalities?.includes('TEXT'))
+        .filter(m => bedrockSupportsConverseTools(m.modelId))
         .map(m => ({
         id: m.modelId,
         name: m.modelName || m.modelId,
         description: `${m.providerName || 'Unknown'} — ${getBedrockModelDescription(m.modelId)}`,
         contextLength: getBedrockContextLength(m.modelId),
     }));
+    // 2. ListInferenceProfiles — cross-region profile IDs (e.g. us.anthropic.claude-sonnet-4-5-*).
+    // Many modern models are ONLY reachable via these, not direct foundation-model IDs.
+    // Failures here are non-fatal (older accounts / regions may not support it).
+    let profileModels = [];
+    try {
+        const profileResp = await signedGet('/inference-profiles', '');
+        if (profileResp.ok) {
+            const profileData = await profileResp.json();
+            profileModels = (profileData.inferenceProfileSummaries || [])
+                .filter(p => p.status !== 'INACTIVE')
+                .filter(p => bedrockSupportsConverseTools(p.inferenceProfileId))
+                .map(p => ({
+                id: p.inferenceProfileId,
+                name: p.inferenceProfileName || p.inferenceProfileId,
+                description: `Inference profile — ${getBedrockModelDescription(p.inferenceProfileId)}`,
+                contextLength: getBedrockContextLength(p.inferenceProfileId),
+            }));
+        }
+    }
+    catch {
+        // Non-fatal — foundation models alone is still useful.
+    }
+    // Merge. For every inference profile, strip the region prefix (e.g. `us.`,
+    // `eu.`, `apac.`, `jp.`) to get the base foundation-model ID it wraps, and
+    // drop that base from the foundation list — because newer Claude 4.x / Haiku
+    // 4.5 models can ONLY be invoked via their inference profile on on-demand
+    // throughput. Showing both would let users pick the invokable-broken raw ID.
+    const coveredBaseIds = new Set();
+    for (const p of profileModels) {
+        const base = p.id.replace(/^[a-z]{2,5}\./, '');
+        if (base !== p.id)
+            coveredBaseIds.add(base);
+    }
+    const filteredFoundation = foundationModels.filter(m => !coveredBaseIds.has(m.id));
+    const merged = new Map();
+    for (const m of filteredFoundation)
+        merged.set(m.id, m);
+    for (const m of profileModels)
+        merged.set(m.id, m);
+    return Array.from(merged.values()).sort((a, b) => a.id.localeCompare(b.id));
+}
+/**
+ * Bedrock Converse API tool-calling support. Maintained as a local allowlist
+ * because AWS doesn't expose per-model tool capability via the list APIs.
+ * See: https://docs.aws.amazon.com/bedrock/latest/userguide/conversation-inference-supported-models-features.html
+ * Matches both raw foundation model IDs (e.g. anthropic.claude-3-5-sonnet-*)
+ * and cross-region inference profile IDs (e.g. us.anthropic.claude-sonnet-4-5-*).
+ */
+function bedrockSupportsConverseTools(modelId) {
+    const id = modelId.toLowerCase();
+    // Anthropic Claude 3, 3.5, 3.7, 4, 4.5 (all support tools). Excludes Claude 2.x / Instant.
+    if (/anthropic\.claude-(3|opus-4|sonnet-4|haiku-4|3-5|3-7)/.test(id))
+        return true;
+    // Amazon Nova (Pro / Lite / Micro support Converse tools; Nova Canvas/Reel are image models — excluded)
+    if (/amazon\.nova-(pro|lite|micro|premier)/.test(id))
+        return true;
+    // Cohere Command R / R+ support tools (older Command models do not)
+    if (/cohere\.command-r/.test(id))
+        return true;
+    // Mistral Large (2402, 2407), Pixtral Large, Mistral Small, Nemo
+    if (/mistral\.(mistral-large|pixtral|mistral-small|mistral-nemo)/.test(id))
+        return true;
+    // Meta Llama 3.1+ supports tools via Converse (3.0 and earlier do not)
+    if (/meta\.llama(3-1|3-2|3-3|4)/.test(id))
+        return true;
+    // AI21 Jamba 1.5 supports tools
+    if (/ai21\.jamba-1-5/.test(id))
+        return true;
+    // DeepSeek R1 supports tools
+    if (/deepseek\.r1/.test(id))
+        return true;
+    return false;
 }
 function getBedrockModelDescription(modelId) {
     if (modelId.includes('claude') && modelId.includes('opus'))
@@ -865,7 +1001,7 @@ export function clearModelCache(provider) {
 export async function preWarmModelCache() {
     const configuredProviders = config.getConfiguredProviders();
     // Fetch models for all configured providers in parallel
-    await Promise.allSettled(configuredProviders.map(provider => getAvailableModels(provider)));
+    await Promise.allSettled(configuredProviders.map(provider => getAvailableModels(provider, { quiet: true })));
 }
 /**
  * Get model info from cache by ID
@@ -874,12 +1010,29 @@ export function getModelInfo(provider, modelId) {
     const cached = modelCache.get(provider);
     if (!cached)
         return undefined;
-    return cached.models.find(m => m.id === modelId || m.id.includes(modelId) || modelId.includes(m.id));
+    // Exact match first.
+    const exact = cached.models.find(m => m.id === modelId);
+    if (exact)
+        return exact;
+    // Otherwise only accept an UNAMBIGUOUS prefix relationship. Loose substring
+    // matching wrongly resolved e.g. `gpt-4` -> `gpt-4o` or `claude-opus-4` ->
+    // `claude-opus-4-8`, returning a different model's context/pricing.
+    const related = cached.models.filter(m => m.id.startsWith(modelId) || modelId.startsWith(m.id));
+    return related.length === 1 ? related[0] : undefined;
 }
 /**
  * Default context limits by model family (fallback when API doesn't provide it)
  */
 const DEFAULT_CONTEXT_LIMITS = {
+    // Anthropic — current 1M-context models matched first (longest key wins).
+    // Everything else (Haiku 4.5, Claude 3.x, and the older -20250514 IDs) falls
+    // through to the generic `claude` 200K entry below.
+    'claude-fable-5': 1000000,
+    'claude-opus-4-8': 1000000,
+    'claude-opus-4-7': 1000000,
+    'claude-opus-4-6': 1000000,
+    'claude-sonnet-4-6': 1000000,
+    'claude-haiku-4-5': 200000,
     'claude': 200000,
     'gpt-4o': 128000,
     'gpt-4-turbo': 128000,
@@ -941,4 +1094,44 @@ export function getModelContextLimit(provider, modelId) {
     // Ultimate fallback
     return 32000;
 }
+/**
+ * Default max OUTPUT tokens by model family (fallback when the API doesn't
+ * report it). Replaces the old global 8192 cap so modern models can use their
+ * real output ceiling. Unknown models fall through to a conservative 8192.
+ */
+const DEFAULT_MAX_OUTPUT = {
+    'claude-fable-5': 128000,
+    'claude-opus-4-8': 128000,
+    'claude-opus-4-7': 128000,
+    'claude-opus-4-6': 128000,
+    'claude-sonnet-4-6': 64000,
+    'claude-haiku-4-5': 64000,
+    'claude': 8192,
+    'gpt-5': 128000,
+    'o1': 100000,
+    'o3': 100000,
+    'gpt-4o': 16384,
+    'gpt-4': 8192,
+    'gemini-2': 8192,
+    'gemini-1.5': 8192,
+};
+/**
+ * Get the max output-token ceiling for a model - cached API info first, then
+ * family fallback. Conservative 8192 default keeps unknown/local models safe.
+ */
+export function getModelMaxOutput(provider, modelId) {
+    const modelInfo = getModelInfo(provider, modelId);
+    if (modelInfo?.maxOutputTokens) {
+        return modelInfo.maxOutputTokens;
+    }
+    const lowerModel = modelId.toLowerCase();
+    const sortedEntries = Object.entries(DEFAULT_MAX_OUTPUT)
+        .sort((a, b) => b[0].length - a[0].length);
+    for (const [key, limit] of sortedEntries) {
+        if (lowerModel.includes(key.toLowerCase())) {
+            return limit;
+        }
+    }
+    return 8192;
+}
 //# sourceMappingURL=model-detection.js.map