npm - keystone-cli - Versions diffs - 1.3.0 → 2.0.0 - Mend

keystone-cli 1.3.0 → 2.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (42) hide show

package/README.md +114 -140
package/package.json +6 -3
package/src/cli.ts +54 -369
package/src/commands/init.ts +15 -29
package/src/db/memory-db.test.ts +45 -0
package/src/db/memory-db.ts +47 -21
package/src/db/sqlite-setup.ts +26 -3
package/src/db/workflow-db.ts +12 -5
package/src/parser/config-schema.ts +11 -13
package/src/parser/schema.ts +4 -2
package/src/runner/__test__/llm-mock-setup.ts +173 -0
package/src/runner/__test__/llm-test-setup.ts +271 -0
package/src/runner/engine-executor.test.ts +25 -18
package/src/runner/executors/blueprint-executor.ts +0 -1
package/src/runner/executors/dynamic-executor.ts +11 -6
package/src/runner/executors/engine-executor.ts +5 -1
package/src/runner/executors/llm-executor.ts +502 -1033
package/src/runner/executors/memory-executor.ts +35 -19
package/src/runner/executors/plan-executor.ts +0 -1
package/src/runner/executors/types.ts +4 -4
package/src/runner/llm-adapter.integration.test.ts +151 -0
package/src/runner/llm-adapter.ts +263 -1401
package/src/runner/llm-clarification.test.ts +91 -106
package/src/runner/llm-executor.test.ts +217 -1181
package/src/runner/memoization.test.ts +0 -1
package/src/runner/recovery-security.test.ts +51 -20
package/src/runner/reflexion.test.ts +55 -18
package/src/runner/standard-tools-integration.test.ts +137 -87
package/src/runner/step-executor.test.ts +36 -80
package/src/runner/step-executor.ts +0 -2
package/src/runner/test-harness.ts +3 -29
package/src/runner/tool-integration.test.ts +122 -73
package/src/runner/workflow-runner.ts +92 -35
package/src/runner/workflow-scheduler.ts +11 -1
package/src/runner/workflow-summary.ts +144 -0
package/src/utils/auth-manager.test.ts +10 -520
package/src/utils/auth-manager.ts +3 -756
package/src/utils/config-loader.ts +12 -0
package/src/utils/constants.ts +0 -17
package/src/utils/process-sandbox.ts +15 -3
package/src/runner/llm-adapter-runtime.test.ts +0 -209
package/src/runner/llm-adapter.test.ts +0 -1012

package/src/runner/llm-adapter.ts CHANGED Viewed

@@ -1,335 +1,97 @@
-import { randomUUID } from 'node:crypto';
-import { copyFileSync, existsSync, readdirSync } from 'node:fs';
-import { Module } from 'node:module';
-import { homedir } from 'node:os';
-import { basename, dirname, join } from 'node:path';
-import { pathToFileURL } from 'node:url';
-import { AuthManager, COPILOT_HEADERS } from '../utils/auth-manager';
+import { execSync } from 'node:child_process';
+import { createRequire } from 'node:module';
+import { join } from 'node:path';
+import type { EmbeddingModel, LanguageModel } from 'ai';
+import type { Config } from '../parser/config-schema';
 import { ConfigLoader } from '../utils/config-loader';
 import { ConsoleLogger } from '../utils/logger';
-import { processOpenAIStream } from './stream-utils';
-// Maximum response size to prevent memory exhaustion (1MB)
-const MAX_RESPONSE_SIZE = 1024 * 1024;
-const ANTHROPIC_OAUTH_BETAS = [
-  'oauth-2025-04-20',
-  'claude-code-20250219',
-  'interleaved-thinking-2025-05-14',
-  'fine-grained-tool-streaming-2025-05-14',
-].join(',');
-const GEMINI_DEFAULT_BASE_URL = 'https://cloudcode-pa.googleapis.com';
-const GEMINI_DEFAULT_PROJECT_ID = 'rising-fact-p41fc';
-const GEMINI_HEADERS = {
-  'User-Agent': 'antigravity/1.11.5 windows/amd64',
-  'X-Goog-Api-Client': 'google-cloud-sdk vscode_cloudshelleditor/0.1',
-  'Client-Metadata':
-    '{"ideType":"IDE_UNSPECIFIED","platform":"PLATFORM_UNSPECIFIED","pluginType":"GEMINI"}',
-};
-const defaultLogger = new ConsoleLogger();
-type TransformersPipeline = (...args: unknown[]) => Promise<unknown>;
-let cachedPipeline: TransformersPipeline | null = null;
-let runtimeResolverRegistered = false;
-let nativeFallbacksRegistered = false;
-export function resetRuntimeHelpers(): void {
-  runtimeResolverRegistered = false;
-  nativeFallbacksRegistered = false;
+// --- Keystone Types & Extensions ---
+/**
+ * A provider instance in the AI SDK can be a function that returns a language model,
+ * or an object with methods for different model types.
+ */
+export interface ProviderInstance {
+  (modelId: string): LanguageModel;
+  languageModel?: (modelId: string) => LanguageModel;
+  textEmbeddingModel?: (modelId: string) => EmbeddingModel;
+  embedding?: (modelId: string) => EmbeddingModel;
+  textEmbedding?: (modelId: string) => EmbeddingModel;
 }
-const ONNX_RUNTIME_LIB_PATTERN =
-  process.platform === 'win32' ? /^onnxruntime.*\.dll$/i : /^libonnxruntime/i;
-function hasOnnxRuntimeLibrary(dir: string): boolean {
-  try {
-    return readdirSync(dir, { withFileTypes: true }).some(
-      (entry) => entry.isFile() && ONNX_RUNTIME_LIB_PATTERN.test(entry.name)
+/**
+ * A provider factory is a function that takes configuration options and returns a provider instance.
+ */
+export type ProviderFactory = (options: Record<string, unknown>) => ProviderInstance;
+/**
+ * Local embedding model implementation using @xenova/transformers.
+ * Maintains the "zero-setup local memory" feature.
+ */
+class LocalEmbeddingModel {
+  readonly specificationVersion = 'v2';
+  readonly modelId = 'local-minilm';
+  readonly provider = 'local';
+  readonly maxEmbeddingsPerCall = 1;
+  readonly supportsParallelCalls = false;
+  private static pipelinePromise: Promise<any> | null = null;
+  private async getPipeline() {
+    if (!LocalEmbeddingModel.pipelinePromise) {
+      LocalEmbeddingModel.pipelinePromise = (async () => {
+        const { pipeline } = await import('@xenova/transformers');
+        return pipeline('feature-extraction', 'Xenova/all-MiniLM-L6-v2');
+      })() as Promise<any>;
+    }
+    return LocalEmbeddingModel.pipelinePromise;
+  }
+  async doEmbed(options: { values: string[]; abortSignal?: AbortSignal }) {
+    const pipe = await this.getPipeline();
+    const embeddings = await Promise.all(
+      options.values.map(async (text) => {
+        const output = await pipe(text, { pooling: 'mean', normalize: true });
+        return Array.from(output.data) as number[];
+      })
     );
-  } catch {
-    return false;
-  }
-}
-export function collectOnnxRuntimeLibraryDirs(): string[] {
-  const candidates = new Set<string>();
-  if (process.env.KEYSTONE_ONNX_RUNTIME_LIB_DIR) {
-    candidates.add(process.env.KEYSTONE_ONNX_RUNTIME_LIB_DIR);
-  }
-  const runtimeDir = getRuntimeDir();
-  const runtimeOnnxDir = join(
-    runtimeDir,
-    'node_modules',
-    'onnxruntime-node',
-    'bin',
-    'napi-v3',
-    process.platform,
-    process.arch
-  );
-  if (existsSync(runtimeOnnxDir)) {
-    candidates.add(runtimeOnnxDir);
+    return { embeddings };
   }
-  const nodeModulesDir = join(
-    process.cwd(),
-    'node_modules',
-    'onnxruntime-node',
-    'bin',
-    'napi-v3',
-    process.platform,
-    process.arch
-  );
-  if (existsSync(nodeModulesDir)) {
-    candidates.add(nodeModulesDir);
+  /**
+   * Dispose of the cached pipeline to free memory.
+   * Call this when the embedding model is no longer needed.
+   */
+  static dispose(): void {
+    LocalEmbeddingModel.pipelinePromise = null;
   }
-  const execDir = dirname(process.execPath);
-  candidates.add(execDir);
-  candidates.add(join(execDir, 'lib'));
-  return Array.from(candidates).filter(hasOnnxRuntimeLibrary);
 }
-export function findOnnxRuntimeLibraryPath(dirs: string[]): string | null {
-  for (const dir of dirs) {
-    try {
-      for (const entry of readdirSync(dir, { withFileTypes: true })) {
-        if (entry.isFile() && ONNX_RUNTIME_LIB_PATTERN.test(entry.name)) {
-          return join(dir, entry.name);
-        }
-      }
-    } catch {
-      // Ignore unreadable directories.
-    }
-  }
-  return null;
-}
-export function ensureOnnxRuntimeLibraryPath(): void {
-  const libDirs = collectOnnxRuntimeLibraryDirs();
-  if (!libDirs.length) return;
-  const runtimePath = findOnnxRuntimeLibraryPath(libDirs);
-  if (runtimePath) {
-    const tempDirs = process.platform === 'darwin' ? ['/private/tmp', '/tmp'] : ['/tmp'];
-    for (const tempDir of tempDirs) {
-      try {
-        const target = join(tempDir, basename(runtimePath));
-        if (!existsSync(target)) {
-          copyFileSync(runtimePath, target);
-        }
-      } catch {
-        // Best-effort copy for runtimes that extract native modules into temp.
-      }
-    }
-  }
-  const envKey =
-    process.platform === 'darwin'
-      ? 'DYLD_LIBRARY_PATH'
-      : process.platform === 'win32'
-        ? 'PATH'
-        : 'LD_LIBRARY_PATH';
-  const delimiter = process.platform === 'win32' ? ';' : ':';
-  const existing = (process.env[envKey] || '').split(delimiter).filter(Boolean);
-  const merged: string[] = [];
-  const seen = new Set<string>();
-  for (const dir of [...libDirs, ...existing]) {
-    if (seen.has(dir)) continue;
-    seen.add(dir);
-    merged.push(dir);
-  }
-  process.env[envKey] = merged.join(delimiter);
-  if (runtimePath && typeof Bun !== 'undefined' && typeof (Bun as any).dlopen === 'function') {
-    try {
-      (Bun as any).dlopen(runtimePath, {});
-    } catch {
-      // Best-effort preloading for compiled binaries.
-    }
-  }
-}
+// Re-export specific AI SDK types
+export type { LanguageModel, EmbeddingModel } from 'ai';
-export function resolveNativeModuleFallback(
-  request: string,
-  parentFilename: string
-): string | null {
-  const normalizedRequest = request.replace(/\\/g, '/');
-  const fileName = normalizedRequest.split('/').pop();
-  if (!fileName) return null;
+const userRequire = createRequire(join(process.cwd(), 'package.json'));
-  if (fileName.startsWith('sharp-') || /[\\/]sharp[\\/]/.test(parentFilename)) {
-    const candidate = join(getRuntimeDir(), 'node_modules', 'sharp', 'build', 'Release', fileName);
-    if (existsSync(candidate)) {
-      return candidate;
-    }
-  }
+// Lazy-loaded global require to avoid blocking import time
+let globalRequire: NodeRequire | undefined;
+let globalRequireResolved = false;
-  if (
-    fileName === 'onnxruntime_binding.node' ||
-    /[\\/]onnxruntime-node[\\/]/.test(parentFilename)
-  ) {
-    const candidate = join(
-      getRuntimeDir(),
-      'node_modules',
-      'onnxruntime-node',
-      'bin',
-      'napi-v3',
-      process.platform,
-      process.arch,
-      'onnxruntime_binding.node'
-    );
-    if (existsSync(candidate)) {
-      return candidate;
-    }
+function getGlobalRequire(): NodeRequire | undefined {
+  if (globalRequireResolved) {
+    return globalRequire;
   }
-  return null;
-}
-export function ensureNativeModuleFallbacks(): void {
-  if (nativeFallbacksRegistered) return;
-  nativeFallbacksRegistered = true;
-  const moduleAny = Module as unknown as {
-    _resolveFilename: (
-      request: string,
-      parent?: { filename?: string },
-      isMain?: boolean,
-      options?: unknown
-    ) => string;
-  };
-  const originalResolve = moduleAny._resolveFilename;
-  if (typeof originalResolve !== 'function') return;
-  moduleAny._resolveFilename = function resolveFilename(request, parent, isMain, options) {
-    if (typeof request === 'string' && request.endsWith('.node')) {
-      try {
-        return originalResolve.call(this, request, parent, isMain, options);
-      } catch (error) {
-        const parentFilename = parent && typeof parent.filename === 'string' ? parent.filename : '';
-        const fallback = resolveNativeModuleFallback(request, parentFilename);
-        if (fallback) {
-          return fallback;
-        }
-        throw error;
-      }
-    }
-    return originalResolve.call(this, request, parent, isMain, options);
-  };
-}
-export function resolveTransformersCacheDir(): string | null {
-  if (process.env.TRANSFORMERS_CACHE) {
-    return process.env.TRANSFORMERS_CACHE;
-  }
-  if (process.env.XDG_CACHE_HOME) {
-    return join(process.env.XDG_CACHE_HOME, 'keystone', 'transformers');
-  }
-  const home = process.env.HOME || homedir();
-  if (home) {
-    return join(home, '.cache', 'keystone', 'transformers');
-  }
-  return null;
-}
-async function getTransformersPipeline(): Promise<TransformersPipeline> {
-  if (!cachedPipeline) {
-    ensureNativeModuleFallbacks();
-    ensureRuntimeResolver();
-    const resolved = resolveTransformersPath();
-    const module = resolved
-      ? await import(pathToFileURL(resolved).href)
-      : await import('@xenova/transformers');
-    if (module.env?.cacheDir?.includes('/$bunfs')) {
-      const cacheDir = resolveTransformersCacheDir();
-      if (cacheDir) {
-        module.env.cacheDir = cacheDir;
-      }
-    }
-    cachedPipeline = module.pipeline;
-  }
-  if (!cachedPipeline) {
-    throw new Error('Failed to load transformers pipeline');
-  }
-  return cachedPipeline;
-}
-export function resolveTransformersPath(): string | null {
+  globalRequireResolved = true;
   try {
-    if (
-      process.env.KEYSTONE_TRANSFORMERS_PATH &&
-      existsSync(process.env.KEYSTONE_TRANSFORMERS_PATH)
-    ) {
-      return process.env.KEYSTONE_TRANSFORMERS_PATH;
-    }
+    const globalRoot = execSync('npm root -g', { encoding: 'utf-8' }).trim();
+    globalRequire = createRequire(join(globalRoot, 'package.json'));
   } catch {
-    // Ignore resolve failures and fall back to bundled module.
+    // Global npm root not found - this is expected in some environments (e.g., containers, CI)
+    // Global package resolution will be disabled silently
   }
-  return null;
-}
-export function getRuntimeDir(): string {
-  return process.env.KEYSTONE_RUNTIME_DIR || join(dirname(process.execPath), 'keystone-runtime');
-}
-function resolveRuntimePackageEntry(pkg: string, entry: string): string | null {
-  const runtimePath = join(getRuntimeDir(), 'node_modules', ...pkg.split('/'), entry);
-  if (existsSync(runtimePath)) {
-    return runtimePath;
-  }
-  const cwdPath = join(process.cwd(), 'node_modules', ...pkg.split('/'), entry);
-  if (existsSync(cwdPath)) {
-    return cwdPath;
-  }
-  return null;
-}
-export function ensureRuntimeResolver(): void {
-  if (runtimeResolverRegistered) return;
-  if (typeof Bun === 'undefined' || typeof Bun.plugin !== 'function') {
-    return;
-  }
-  const entryMap: Record<string, string> = {
-    '@huggingface/jinja': 'dist/index.js',
-    sharp: 'lib/index.js',
-    'onnxruntime-node': 'dist/index.js',
-    'onnxruntime-common': 'dist/ort-common.node.js',
-  };
-  Bun.plugin({
-    name: 'keystone-runtime-resolver',
-    setup(builder) {
-      builder.onResolve(
-        { filter: /^(sharp|onnxruntime-node|onnxruntime-common|@huggingface\/jinja)$/ },
-        (args) => {
-          const entry = entryMap[args.path];
-          if (!entry) return null;
-          const resolved = resolveRuntimePackageEntry(args.path, entry);
-          if (!resolved) return null;
-          return { path: resolved };
-        }
-      );
-    },
-  });
-  runtimeResolverRegistered = true;
-}
-export interface LLMMessage {
-  role: 'system' | 'user' | 'assistant' | 'tool';
-  content: string | null;
-  tool_call_id?: string;
-  name?: string;
-  tool_calls?: LLMToolCall[];
-  reasoning?: {
-    encrypted_content: string;
-    summary?: string;
-  };
+  return globalRequire;
 }
+// Compatibility types for Keystone
 export interface LLMToolCall {
   id: string;
   type: 'function';
@@ -339,9 +101,14 @@ export interface LLMToolCall {
   };
 }
-type LLMMessageWithId = LLMMessage & { id?: string };
-type ChatGPTToolCall = Omit<LLMToolCall, 'id'>;
-type ChatGPTMessage = Omit<LLMMessage, 'tool_calls'> & { tool_calls?: ChatGPTToolCall[] };
+export interface LLMMessage {
+  role: 'system' | 'user' | 'assistant' | 'tool';
+  content?: string;
+  name?: string;
+  tool_calls?: LLMToolCall[];
+  tool_call_id?: string;
+  reasoning?: { summary?: string }; // Keystone extension
+}
 export interface LLMResponse {
   message: LLMMessage;
@@ -352,1155 +119,250 @@ export interface LLMResponse {
   };
 }
-export interface LLMTool {
-  type: 'function';
-  function: {
-    name: string;
-    description?: string;
-    parameters?: Record<string, unknown>;
-  };
-}
-interface GeminiFunctionCall {
-  name: string;
-  args?: Record<string, unknown> | string;
-}
-interface GeminiPart {
-  text?: string;
-  functionCall?: GeminiFunctionCall;
-  functionResponse?: {
-    name: string;
-    response: Record<string, unknown>;
-  };
-}
-interface GeminiContent {
-  role: 'user' | 'model';
-  parts: GeminiPart[];
-}
-interface GeminiSystemInstruction {
-  role?: 'system';
-  parts: GeminiPart[];
-}
-export interface LLMAdapter {
-  chat(
-    messages: LLMMessage[],
-    options?: {
-      model?: string;
-      tools?: LLMTool[];
-      onStream?: (chunk: string) => void;
-      signal?: AbortSignal;
-      responseSchema?: any; // Native JSON schema for structured output
-    }
-  ): Promise<LLMResponse>;
-  embed?(text: string, model?: string, options?: { signal?: AbortSignal }): Promise<number[]>;
-}
-export class OpenAIAdapter implements LLMAdapter {
-  private apiKey: string;
-  private baseUrl: string;
-  constructor(apiKey?: string, baseUrl?: string) {
-    this.apiKey = apiKey || ConfigLoader.getSecret('OPENAI_API_KEY') || '';
-    this.baseUrl =
-      baseUrl || ConfigLoader.getSecret('OPENAI_BASE_URL') || 'https://api.openai.com/v1';
-    if (!this.apiKey && this.baseUrl === 'https://api.openai.com/v1') {
-      defaultLogger.warn('Warning: OPENAI_API_KEY is not set.');
-    }
-  }
-  async chat(
-    messages: LLMMessage[],
-    options?: {
-      model?: string;
-      tools?: LLMTool[];
-      onStream?: (chunk: string) => void;
-      signal?: AbortSignal;
-      responseSchema?: any;
-    }
-  ): Promise<LLMResponse> {
-    const isStreaming = !!options?.onStream;
-    const response = await fetch(`${this.baseUrl}/chat/completions`, {
-      method: 'POST',
-      headers: {
-        'Content-Type': 'application/json',
-        Authorization: `Bearer ${this.apiKey}`,
-      },
-      body: JSON.stringify({
-        model: options?.model || 'gpt-4o',
-        messages,
-        tools: options?.tools,
-        stream: isStreaming,
-        response_format: options?.responseSchema
-          ? {
-              type: 'json_schema',
-              json_schema: {
-                name: 'output',
-                strict: true,
-                schema: options.responseSchema,
-              },
-            }
-          : undefined,
-      }),
-      signal: options?.signal,
-    });
-    if (!response.ok) {
-      const error = await response.text();
-      throw new Error(`OpenAI API error: ${response.status} ${response.statusText} - ${error}`);
-    }
-    if (isStreaming) {
-      if (!response.body) throw new Error('Response body is null');
-      return processOpenAIStream(response, options, 'OpenAI');
-    }
+// --- Dynamic Provider Registry ---
-    const data = (await response.json()) as {
-      choices: { message: LLMMessage }[];
-      usage?: { prompt_tokens: number; completion_tokens: number; total_tokens: number };
-    };
+export class DynamicProviderRegistry {
+  private static loadedProviders = new Map<string, ProviderFactory | ProviderInstance>();
-    // Validate response size to prevent memory exhaustion
-    const contentLength = data.choices[0]?.message?.content?.length ?? 0;
-    if (contentLength > MAX_RESPONSE_SIZE) {
-      throw new Error(`LLM response exceeds maximum size of ${MAX_RESPONSE_SIZE} bytes`);
+  static async getProvider(
+    providerName: string,
+    config: Config['providers'][string]
+  ): Promise<ProviderFactory | ProviderInstance> {
+    if (DynamicProviderRegistry.loadedProviders.has(providerName)) {
+      return DynamicProviderRegistry.loadedProviders.get(providerName) as
+        | ProviderFactory
+        | ProviderInstance;
     }
-    return {
-      message: data.choices[0].message,
-      usage: data.usage,
-    };
-  }
-  async embed(
-    text: string,
-    model = 'text-embedding-3-small',
-    options?: { signal?: AbortSignal }
-  ): Promise<number[]> {
-    const response = await fetch(`${this.baseUrl}/embeddings`, {
-      method: 'POST',
-      headers: {
-        'Content-Type': 'application/json',
-        Authorization: `Bearer ${this.apiKey}`,
-      },
-      body: JSON.stringify({
-        model,
-        input: text,
-      }),
-      signal: options?.signal,
-    });
-    if (!response.ok) {
-      const error = await response.text();
-      throw new Error(
-        `OpenAI Embeddings API error: ${response.status} ${response.statusText} - ${error}`
-      );
-    }
-    const data = (await response.json()) as {
-      data: { embedding: number[] }[];
-    };
-    return data.data[0].embedding;
-  }
-}
-export class AnthropicAdapter implements LLMAdapter {
-  private apiKey: string;
-  private baseUrl: string;
-  private authMode: 'api-key' | 'oauth';
-  constructor(apiKey?: string, baseUrl?: string, authMode: 'api-key' | 'oauth' = 'api-key') {
-    this.apiKey = apiKey || ConfigLoader.getSecret('ANTHROPIC_API_KEY') || '';
-    this.baseUrl =
-      baseUrl || ConfigLoader.getSecret('ANTHROPIC_BASE_URL') || 'https://api.anthropic.com/v1';
-    this.authMode = authMode;
-    if (
-      this.authMode === 'api-key' &&
-      !this.apiKey &&
-      this.baseUrl === 'https://api.anthropic.com/v1'
-    ) {
-      defaultLogger.warn('Warning: ANTHROPIC_API_KEY is not set.');
-    }
-  }
-  private async getAuthHeaders(): Promise<Record<string, string>> {
-    if (this.authMode === 'oauth') {
-      const token = await AuthManager.getAnthropicClaudeToken();
-      if (!token) {
+    // 1. Custom Script
+    if (config.script) {
+      const scriptPath = join(process.cwd(), config.script);
+      try {
+        const module = await import(scriptPath);
+        if (!module.default) {
+          throw new Error(`Custom provider script '${scriptPath}' must export a default function.`);
+        }
+        DynamicProviderRegistry.loadedProviders.set(providerName, module.default);
+        return module.default;
+      } catch (err) {
         throw new Error(
-          'Anthropic Claude authentication not found. Please run "keystone auth login anthropic-claude" first.'
+          `Failed to load custom provider script '${scriptPath}': ${err instanceof Error ? err.message : String(err)}`
         );
       }
-      return {
-        Authorization: `Bearer ${token}`,
-        'anthropic-beta': ANTHROPIC_OAUTH_BETAS,
-      };
-    }
-    return {
-      'x-api-key': this.apiKey,
-    };
-  }
-  async chat(
-    messages: LLMMessage[],
-    options?: {
-      model?: string;
-      tools?: LLMTool[];
-      onStream?: (chunk: string) => void;
-      signal?: AbortSignal;
-      responseSchema?: any;
     }
-  ): Promise<LLMResponse> {
-    const isStreaming = !!options?.onStream;
-    const system = messages.find((m) => m.role === 'system')?.content || undefined;
-    // Anthropic requires alternating user/assistant roles.
-    // Sequential tool results must be grouped into a single user message.
-    const anthropicMessages: Array<{
-      role: 'user' | 'assistant';
-      content: string | Array<Record<string, unknown>>;
-    }> = [];
-    for (const m of messages) {
-      if (m.role === 'system') continue;
-      if (m.role === 'tool') {
-        const lastMsg = anthropicMessages[anthropicMessages.length - 1];
-        const toolResult = {
-          type: 'tool_result' as const,
-          tool_use_id: m.tool_call_id,
-          content: m.content,
-        };
-        if (lastMsg && lastMsg.role === 'user' && Array.isArray(lastMsg.content)) {
-          // Append to existing tool result block if previous message was also a tool result
-          lastMsg.content.push(toolResult);
-        } else {
-          // Start a new user message for tool results
-          anthropicMessages.push({
-            role: 'user',
-            content: [toolResult],
-          });
-        }
-      } else if (m.tool_calls) {
-        anthropicMessages.push({
-          role: 'assistant',
-          content: [
-            ...(m.content ? [{ type: 'text' as const, text: m.content }] : []),
-            ...m.tool_calls.map((tc) => {
-              let input = {};
+    // 2. Package
+    if (config.package) {
+      try {
+        let pkg: any;
+        try {
+          // Try local project first
+          pkg = await import(config.package);
+        } catch {
+          try {
+            const pkgPath = userRequire.resolve(config.package);
+            pkg = await import(pkgPath);
+          } catch {
+            // Try global if local resolution fails
+            const globalReq = getGlobalRequire();
+            if (globalReq) {
               try {
-                input =
-                  typeof tc.function.arguments === 'string'
-                    ? JSON.parse(tc.function.arguments)
-                    : tc.function.arguments;
-              } catch (e) {
-                defaultLogger.error(`Failed to parse tool arguments: ${tc.function.arguments}`);
+                const globalPkgPath = globalReq.resolve(config.package);
+                pkg = await import(globalPkgPath);
+              } catch {
+                throw new Error(
+                  `Failed to resolve package '${config.package}' locally or globally.`
+                );
               }
-              return {
-                type: 'tool_use' as const,
-                id: tc.id,
-                name: tc.function.name,
-                input,
-              };
-            }),
-          ],
-        });
-      } else {
-        const role = m.role as 'user' | 'assistant';
-        const lastMsg = anthropicMessages[anthropicMessages.length - 1];
-        if (
-          lastMsg &&
-          lastMsg.role === role &&
-          typeof lastMsg.content === 'string' &&
-          typeof m.content === 'string'
-        ) {
-          lastMsg.content += `\n\n${m.content}`;
-        } else {
-          anthropicMessages.push({
-            role,
-            content: m.content || '',
-          });
+            } else {
+              throw new Error(`Failed to resolve package '${config.package}' locally.`);
+            }
+          }
         }
-      }
-    }
-    const anthropicTools = options?.tools
-      ? options.tools.map((t) => ({
-          name: t.function.name,
-          description: t.function.description,
-          input_schema: t.function.parameters,
-        }))
-      : undefined;
-    // If responseSchema is provided, Anthropic requires using tool call to force output
-    const responseTool = options?.responseSchema
-      ? {
-          name: 'record_output',
-          description: 'Record the structured output matching the requested schema',
-          input_schema: options.responseSchema,
+        // If a specific factory is configured, try to use it first
+        const factoryKey = config.factory || config.type || 'default';
+        if (pkg[factoryKey] && typeof pkg[factoryKey] === 'function') {
+          DynamicProviderRegistry.loadedProviders.set(providerName, pkg[factoryKey]);
+          return pkg[factoryKey];
         }
-      : undefined;
-    const combinedTools = [...(anthropicTools || []), ...(responseTool ? [responseTool] : [])];
-    const authHeaders = await this.getAuthHeaders();
-    const response = await fetch(`${this.baseUrl}/messages`, {
-      method: 'POST',
-      headers: {
-        'Content-Type': 'application/json',
-        ...authHeaders,
-        'anthropic-version': '2023-06-01',
-      },
-      body: JSON.stringify({
-        model: options?.model || 'claude-3-5-sonnet-20240620',
-        system,
-        messages: anthropicMessages,
-        tools: combinedTools.length > 0 ? combinedTools : undefined,
-        tool_choice: responseTool ? { type: 'tool', name: 'record_output' } : undefined,
-        max_tokens: 4096,
-        stream: isStreaming,
-      }),
-      signal: options?.signal,
-    });
-    if (!response.ok) {
-      const error = await response.text();
-      throw new Error(`Anthropic API error: ${response.status} ${response.statusText} - ${error}`);
-    }
-    if (isStreaming) {
-      if (!response.body) throw new Error('Response body is null');
-      const reader = response.body.getReader();
-      const decoder = new TextDecoder();
-      let fullContent = '';
-      // Track tool calls by content block index for robust correlation
-      const toolCallsMap = new Map<number, { id: string; name: string; inputString: string }>();
-      const usage = { prompt_tokens: 0, completion_tokens: 0, total_tokens: 0 };
-      while (true) {
-        const { done, value } = await reader.read();
-        if (done) break;
-        const chunk = decoder.decode(value);
-        const lines = chunk.split('\n').filter((line) => line.trim() !== '');
-        for (const line of lines) {
-          if (!line.startsWith('data: ')) continue;
-          try {
-            const data = JSON.parse(line.slice(6));
-            if (data.type === 'content_block_delta' && data.delta?.text) {
-              if (fullContent.length + data.delta.text.length > MAX_RESPONSE_SIZE) {
-                throw new Error(`LLM response exceeds maximum size of ${MAX_RESPONSE_SIZE} bytes`);
-              }
-              fullContent += data.delta.text;
-              options.onStream?.(data.delta.text);
-            }
-            // Track tool calls by their index in the content blocks
-            if (data.type === 'content_block_start' && data.content_block?.type === 'tool_use') {
-              const index = data.index ?? toolCallsMap.size;
-              toolCallsMap.set(index, {
-                id: data.content_block.id || '',
-                name: data.content_block.name || '',
-                inputString: '',
-              });
-            }
-            // Handle tool input streaming - Anthropic uses content_block_delta with input_json_delta
-            if (
-              data.type === 'content_block_delta' &&
-              data.delta?.type === 'input_json_delta' &&
-              data.delta?.partial_json
-            ) {
-              const index = data.index;
-              const toolCall = toolCallsMap.get(index);
-              if (toolCall) {
-                toolCall.inputString += data.delta.partial_json;
-              }
-            }
-            // Update tool call ID if it arrives later (some edge cases)
-            if (data.type === 'content_block_delta' && data.content_block?.id) {
-              const index = data.index;
-              const toolCall = toolCallsMap.get(index);
-              if (toolCall && !toolCall.id) {
-                toolCall.id = data.content_block.id;
-              }
-            }
-            if (data.type === 'message_start' && data.message?.usage) {
-              usage.prompt_tokens += data.message.usage.input_tokens || 0;
-            }
-            if (data.type === 'message_delta' && data.usage) {
-              usage.completion_tokens += data.usage.output_tokens || 0;
-            }
-            usage.total_tokens = usage.prompt_tokens + usage.completion_tokens;
-          } catch (e) {
-            // Log non-SyntaxError exceptions at warning level (they indicate real issues)
-            if (!(e instanceof SyntaxError)) {
-              defaultLogger.warn(`[Anthropic Stream] Error processing chunk: ${e}`);
-            } else if (process.env.DEBUG || process.env.LLM_DEBUG) {
-              // SyntaxErrors are normal for incomplete chunks - only log in debug mode
-              process.stderr.write(
-                `[Anthropic Stream] Incomplete chunk parse: ${line.slice(0, 50)}...\n`
-              );
+        // Discovery fallback: Search for common factory patterns case-insensitively
+        const searchTerms = [
+          `create${providerName.replace(/[-_]/g, '')}provider`,
+          `create${providerName.split(/[-_]/)[0]}provider`,
+          providerName.replace(/[-_]/g, ''),
+          providerName.split(/[-_]/)[0],
+        ];
+        const allKeys = Object.keys(pkg);
+        for (const key of allKeys) {
+          const lowerKey = key.toLowerCase();
+          if (
+            searchTerms.some(
+              (term) =>
+                lowerKey === term ||
+                lowerKey === `create${term}provider` ||
+                lowerKey.includes(`${term}provider`)
+            )
+          ) {
+            if (typeof pkg[key] === 'function') {
+              DynamicProviderRegistry.loadedProviders.set(providerName, pkg[key]);
+              return pkg[key];
             }
           }
         }
-      }
-      // Convert map to array and filter out incomplete tool calls
-      const toolCalls = Array.from(toolCallsMap.values())
-        .filter((tc) => tc.id && tc.name) // Only include complete tool calls
-        .map((tc) => ({
-          id: tc.id,
-          type: 'function' as const,
-          function: { name: tc.name, arguments: tc.inputString },
-        }));
-      return {
-        message: {
-          role: 'assistant',
-          content: fullContent || null,
-          tool_calls: toolCalls.length > 0 ? toolCalls : undefined,
-        },
-        usage: usage.total_tokens > 0 ? usage : undefined,
-      };
-    }
-    const data = (await response.json()) as {
-      content: {
-        type: 'text' | 'tool_use';
-        text?: string;
-        id?: string;
-        name?: string;
-        input?: Record<string, unknown>;
-      }[];
-      usage: { input_tokens: number; output_tokens: number };
-    };
+        if (pkg.default && typeof pkg.default === 'function') {
+          DynamicProviderRegistry.loadedProviders.set(providerName, pkg.default);
+          return pkg.default;
+        }
-    const textBlocks = data.content.filter((c) => c.type === 'text');
-    const thinkingBlocks = data.content.filter((c) => c.type === ('thinking' as any));
+        const firstFn = Object.values(pkg).find((v) => typeof v === 'function');
+        if (firstFn) {
+          DynamicProviderRegistry.loadedProviders.set(providerName, firstFn as any);
+          return firstFn as any;
+        }
-    let content =
-      textBlocks
-        .map((tb) => tb.text)
-        .filter(Boolean)
-        .join('\n') || null;
-    if (thinkingBlocks.length > 0) {
-      const thoughts = thinkingBlocks
-        .map((tb) => (tb as any).thinking)
-        .filter(Boolean)
-        .join('\n');
-      if (thoughts) {
-        content = `<thinking>\n${thoughts}\n</thinking>${content ? `\n\n${content}` : ''}`;
+        throw new Error(
+          `Could not find a valid factory function in package '${config.package}'. Available keys: ${allKeys.join(', ')}`
+        );
+      } catch (err) {
+        throw new Error(
+          `Failed to load provider package '${config.package}': ${err instanceof Error ? err.message : String(err)}. Please run 'npm install -g ${config.package}' or 'npm install ${config.package}'.`
+        );
       }
     }
-    // Validate response size to prevent memory exhaustion
-    if (content && content.length > MAX_RESPONSE_SIZE) {
-      throw new Error(`LLM response exceeds maximum size of ${MAX_RESPONSE_SIZE} bytes`);
-    }
-    const toolCalls = data.content
-      .filter((c) => c.type === 'tool_use')
-      .map((c) => ({
-        id: c.id as string,
-        type: 'function' as const,
-        function: {
-          name: c.name as string,
-          arguments: JSON.stringify(c.input),
-        },
-      }));
-    return {
-      message: {
-        role: 'assistant',
-        content,
-        tool_calls: toolCalls.length > 0 ? toolCalls : undefined,
-      },
-      usage: {
-        prompt_tokens: data.usage.input_tokens,
-        completion_tokens: data.usage.output_tokens,
-        total_tokens: data.usage.input_tokens + data.usage.output_tokens,
-      },
-    };
+    throw new Error(
+      `Provider '${providerName}' must have a 'package' or 'script' configured in your keystone settings.`
+    );
   }
 }
-export class AnthropicClaudeAdapter extends AnthropicAdapter {
-  constructor(baseUrl?: string) {
-    super(undefined, baseUrl, 'oauth');
-  }
+export function resetProviderRegistry(): void {
+  // @ts-ignore: private static property access for test cleanup
+  DynamicProviderRegistry.loadedProviders.clear();
 }
-export class OpenAIChatGPTAdapter implements LLMAdapter {
-  private baseUrl: string;
+async function prepareProvider(
+  model: string
+): Promise<{ provider: ProviderInstance; resolvedModel: string }> {
+  const providerName = ConfigLoader.getProviderForModel(model);
+  const config = ConfigLoader.load();
+  const providerConfig = config.providers[providerName];
-  constructor(baseUrl?: string) {
-    this.baseUrl =
-      baseUrl || ConfigLoader.getSecret('OPENAI_CHATGPT_BASE_URL') || 'https://api.openai.com/v1';
+  if (!providerConfig) {
+    throw new Error(
+      `Provider configuration not found for: ${providerName}. Ensure it is defined in your keystone configuration.`
+    );
   }
-  private filterMessages(messages: LLMMessage[], model: string): ChatGPTMessage[] {
-    // Stateless mode requires stripping all IDs and filtering out item_references
-    const normalizedModel = this.normalizeModel(model);
-    return messages.map((m): ChatGPTMessage => {
-      // Create a shallow copy and remove id if it exists
-      const { id: _id, ...rest } = m as LLMMessageWithId;
+  // Pure BYOP: Load provider factory from user configuration
+  const providerFactory = await DynamicProviderRegistry.getProvider(providerName, providerConfig);
-      if (m.tool_calls) {
-        const toolCalls = m.tool_calls.map((tc) => {
-          const { id: _toolCallId, ...tcRest } = tc;
-          return tcRest;
-        });
-        return {
-          ...rest,
-          tool_calls: toolCalls,
-        };
-      }
+  // Initialize provider with AuthManager secrets
+  const options: Record<string, unknown> = {};
-      if (
-        m.role === 'system' &&
-        (normalizedModel === 'gpt-4o' || normalizedModel.startsWith('o1-'))
-      ) {
-        return { ...rest, role: 'developer' as any };
-      }
-      return rest;
-    });
+  if (providerConfig.base_url) {
+    options.baseURL = providerConfig.base_url;
   }
-  private normalizeModel(model: string): string {
-    // Map Keystone model names to Codex API expected names
-    if (model.includes('gpt-5')) return 'gpt-5-codex';
-    if (model.includes('gpt-4o-codex')) return 'gpt-4o';
-    return model;
+  // Fallback to env var lookup via ConfigLoader if not found above
+  if (!options.apiKey && providerConfig.api_key_env) {
+    options.apiKey = ConfigLoader.getSecret(providerConfig.api_key_env);
   }
-  async chat(
-    messages: LLMMessage[],
-    options?: {
-      model?: string;
-      tools?: LLMTool[];
-      onStream?: (chunk: string) => void;
-      signal?: AbortSignal;
-      responseSchema?: any;
-    }
-  ): Promise<LLMResponse> {
-    const isStreaming = !!options?.onStream;
-    const token = await AuthManager.getOpenAIChatGPTToken();
-    if (!token) {
-      throw new Error(
-        'OpenAI ChatGPT authentication not found. Please run "keystone auth login openai-chatgpt" first.'
-      );
-    }
-    const filteredMessages = this.filterMessages(messages, options?.model || 'gpt-5-codex');
-    const resolvedModel = this.normalizeModel(options?.model || 'gpt-5-codex');
-    const response = await fetch(`${this.baseUrl}/chat/completions`, {
-      method: 'POST',
-      headers: {
-        'Content-Type': 'application/json',
-        Authorization: `Bearer ${token}`,
-        'OpenAI-Organization': '', // Ensure clear org context
-      },
-      body: JSON.stringify({
-        model: resolvedModel,
-        messages: filteredMessages,
-        tools: options?.tools,
-        stream: isStreaming,
-        // Critical for ChatGPT Plus/Pro backend compatibility
-        store: false,
-        include: ['reasoning.encrypted_content'],
-        response_format: options?.responseSchema
-          ? {
-              type: 'json_schema',
-              json_schema: {
-                name: 'output',
-                strict: true,
-                schema: options.responseSchema,
-              },
-            }
-          : undefined,
-      }),
-      signal: options?.signal,
-    });
-    if (!response.ok) {
-      const error = await response.text();
-      // Handle usage limit messages gracefully
-      if (response.status === 429 && error.includes('limit')) {
-        throw new Error(
-          'ChatGPT subscription limit reached. Please wait and try again or switch to another provider.'
-        );
-      }
-      throw new Error(
-        `OpenAI ChatGPT API error: ${response.status} ${response.statusText} - ${error}`
-      );
-    }
-    if (isStreaming) {
-      if (!response.body) throw new Error('Response body is null');
-      return processOpenAIStream(response, options, 'OpenAIChatGPT');
-    }
-    const data = (await response.json()) as {
-      choices: { message: LLMMessage }[];
-      usage?: { prompt_tokens: number; completion_tokens: number; total_tokens: number };
-    };
+  // Create the provider instance
+  const provider =
+    typeof providerFactory === 'function'
+      ? (providerFactory as ProviderFactory)(options)
+      : providerFactory;
-    return {
-      message: data.choices[0].message,
-      usage: data.usage,
-    };
-  }
-}
-export class GoogleGeminiAdapter implements LLMAdapter {
-  private baseUrl: string;
-  private projectId?: string;
-  constructor(baseUrl?: string, projectId?: string) {
-    this.baseUrl = (baseUrl || Bun.env.GOOGLE_GEMINI_BASE_URL || GEMINI_DEFAULT_BASE_URL).replace(
-      /\/$/,
-      ''
+  if (!provider) {
+    throw new Error(
+      `Provider factory for '${providerName}' returned undefined. Check your provider implementation.`
     );
-    this.projectId =
-      projectId || Bun.env.GOOGLE_GEMINI_PROJECT_ID || Bun.env.KEYSTONE_GEMINI_PROJECT_ID;
-  }
-  private sanitizeToolName(name: string, index: number, used: Set<string>): string {
-    let sanitized = name.replace(/[^a-zA-Z0-9_-]/g, '_').slice(0, 64);
-    if (!sanitized) {
-      sanitized = `tool_${index}`;
-    }
-    while (used.has(sanitized)) {
-      sanitized = `${sanitized}_${index}`.slice(0, 64);
-    }
-    used.add(sanitized);
-    return sanitized;
-  }
-  private buildToolMaps(tools?: LLMTool[]): {
-    nameToSanitized: Map<string, string>;
-    sanitizedToName: Map<string, string>;
-    tools?: {
-      functionDeclarations: Array<{ name: string; description: string; parameters: unknown }>;
-    }[];
-    toolConfig?: { functionCallingConfig: { mode: 'AUTO' } };
-  } {
-    const nameToSanitized = new Map<string, string>();
-    const sanitizedToName = new Map<string, string>();
-    if (!tools || tools.length === 0) {
-      return { nameToSanitized, sanitizedToName };
-    }
-    const usedNames = new Set<string>();
-    const functionDeclarations = tools.map((tool, index) => {
-      const originalName = tool.function.name;
-      const sanitized = this.sanitizeToolName(originalName, index, usedNames);
-      nameToSanitized.set(originalName, sanitized);
-      sanitizedToName.set(sanitized, originalName);
-      return {
-        name: sanitized,
-        description: tool.function.description ?? '',
-        parameters: tool.function.parameters ?? { type: 'object', properties: {} },
-      };
-    });
-    return {
-      nameToSanitized,
-      sanitizedToName,
-      tools: [{ functionDeclarations }],
-      toolConfig: { functionCallingConfig: { mode: 'AUTO' } },
-    };
   }
-  private parseToolResponse(content: string | null): Record<string, unknown> {
-    if (!content) return {};
-    try {
-      const parsed = JSON.parse(content);
-      if (parsed && typeof parsed === 'object') {
-        return parsed as Record<string, unknown>;
-      }
-      return { content: parsed };
-    } catch {
-      return { content };
+  // Resolve model name (strip prefix if typical "provider:model" format)
+  let resolvedModel = model;
+  if (model.includes(':')) {
+    const [prefix, ...rest] = model.split(':');
+    if (config.providers[prefix]) {
+      resolvedModel = rest.join(':');
     }
   }
-  private buildContents(
-    messages: LLMMessage[],
-    nameToSanitized: Map<string, string>
-  ): { contents: GeminiContent[]; systemInstruction?: GeminiSystemInstruction } {
-    const contents: GeminiContent[] = [];
-    const systemParts: string[] = [];
-    for (const message of messages) {
-      if (message.role === 'system') {
-        if (message.content) systemParts.push(message.content);
-        continue;
-      }
-      const role: GeminiContent['role'] = message.role === 'assistant' ? 'model' : 'user';
-      const parts: GeminiPart[] = [];
-      if (message.role === 'tool') {
-        const toolName = message.name
-          ? nameToSanitized.get(message.name) || message.name
-          : undefined;
-        if (toolName) {
-          parts.push({
-            functionResponse: {
-              name: toolName,
-              response: this.parseToolResponse(message.content),
-            },
-          });
-        } else if (message.content) {
-          parts.push({ text: message.content });
-        }
-      } else {
-        if (message.content) {
-          parts.push({ text: message.content });
-        }
-        if (message.tool_calls) {
-          for (const toolCall of message.tool_calls) {
-            const toolName = nameToSanitized.get(toolCall.function.name) || toolCall.function.name;
-            let args: Record<string, unknown> | string = {};
-            if (typeof toolCall.function.arguments === 'string') {
-              try {
-                args = JSON.parse(toolCall.function.arguments) as Record<string, unknown>;
-              } catch {
-                args = toolCall.function.arguments;
-              }
-            } else {
-              args = toolCall.function.arguments as unknown as Record<string, unknown>;
-            }
-            parts.push({
-              functionCall: {
-                name: toolName,
-                args,
-              },
-            });
-          }
-        }
-      }
-      if (parts.length > 0) {
-        contents.push({ role, parts });
-      }
-    }
+  return { provider, resolvedModel };
+}
-    const systemInstruction =
-      systemParts.length > 0
-        ? {
-            parts: [{ text: systemParts.join('\n\n') }],
-          }
-        : undefined;
+export async function getModel(model: string): Promise<LanguageModel> {
+  const { provider, resolvedModel } = await prepareProvider(model);
-    return { contents, systemInstruction };
+  // AI SDK convention: provider(modelId)
+  if (typeof provider === 'function') {
+    return (provider as any)(resolvedModel);
   }
-  private buildEndpoint(isStreaming: boolean): string {
-    const action = isStreaming ? 'streamGenerateContent' : 'generateContent';
-    const suffix = isStreaming ? '?alt=sse' : '';
-    return `${this.baseUrl}/v1internal:${action}${suffix}`;
+  // Fallback for objects that aren't callable but have standard methods
+  if (typeof (provider as any).languageModel === 'function') {
+    return (provider as any).languageModel(resolvedModel);
   }
-  private buildUsage(usage?: {
-    promptTokenCount?: number;
-    candidatesTokenCount?: number;
-    totalTokenCount?: number;
-  }): LLMResponse['usage'] | undefined {
-    if (!usage) return undefined;
-    const promptTokens = usage.promptTokenCount ?? 0;
-    const completionTokens = usage.candidatesTokenCount ?? 0;
-    const totalTokens = usage.totalTokenCount ?? promptTokens + completionTokens;
-    return {
-      prompt_tokens: promptTokens,
-      completion_tokens: completionTokens,
-      total_tokens: totalTokens,
-    };
+  if (typeof (provider as any).chatModel === 'function') {
+    return (provider as any).chatModel(resolvedModel);
   }
-  private extractGeminiParts(
-    data: {
-      candidates?: Array<{ content?: { parts?: GeminiPart[] } }>;
-      usageMetadata?: {
-        promptTokenCount?: number;
-        candidatesTokenCount?: number;
-        totalTokenCount?: number;
-      };
-    },
-    sanitizedToName: Map<string, string>,
-    onStream?: (chunk: string) => void,
-    toolCalls?: LLMToolCall[]
-  ): { content: string; usage?: LLMResponse['usage'] } {
-    let content = '';
-    if (Array.isArray(data.candidates)) {
-      const candidate = data.candidates[0];
-      const parts = candidate?.content?.parts || [];
-      for (const part of parts) {
-        if (part.text) {
-          if (content.length + part.text.length > MAX_RESPONSE_SIZE) {
-            throw new Error(`LLM response exceeds maximum size of ${MAX_RESPONSE_SIZE} bytes`);
-          }
-          content += part.text;
-          onStream?.(part.text);
-        }
-        if (part.functionCall && toolCalls) {
-          const originalName =
-            sanitizedToName.get(part.functionCall.name) || part.functionCall.name;
-          const args = part.functionCall.args ?? {};
-          const argsString = typeof args === 'string' ? args : JSON.stringify(args);
-          toolCalls.push({
-            id: `gemini_tool_${toolCalls.length + 1}`,
-            type: 'function',
-            function: {
-              name: originalName,
-              arguments: argsString,
-            },
-          });
-        }
-      }
-    }
-    return { content, usage: this.buildUsage(data.usageMetadata) };
-  }
-  async chat(
-    messages: LLMMessage[],
-    options?: {
-      model?: string;
-      tools?: LLMTool[];
-      onStream?: (chunk: string) => void;
-      signal?: AbortSignal;
-      responseSchema?: any;
-    }
-  ): Promise<LLMResponse> {
-    const isStreaming = !!options?.onStream;
-    const token = await AuthManager.getGoogleGeminiToken();
-    if (!token) {
-      throw new Error(
-        'Google Gemini authentication not found. Please run "keystone auth login gemini" first.'
-      );
-    }
-    const { nameToSanitized, sanitizedToName, tools, toolConfig } = this.buildToolMaps(
-      options?.tools
-    );
-    const { contents, systemInstruction } = this.buildContents(messages, nameToSanitized);
-    const requestPayload: Record<string, unknown> = {
-      contents,
-      sessionId: randomUUID(),
-    };
-    if (systemInstruction) requestPayload.systemInstruction = systemInstruction;
-    if (tools) requestPayload.tools = tools;
-    if (toolConfig) requestPayload.toolConfig = toolConfig;
-    if (options?.responseSchema) {
-      requestPayload.generationConfig = {
-        responseMimeType: 'application/json',
-        responseSchema: options.responseSchema,
-      };
-    }
-    const authProjectId = this.projectId ? undefined : AuthManager.load().google_gemini?.project_id;
-    const resolvedProjectId = this.projectId || authProjectId || GEMINI_DEFAULT_PROJECT_ID;
-    const wrappedBody = {
-      project: resolvedProjectId,
-      model: options?.model || 'gemini-3-pro-high',
-      request: requestPayload,
-      userAgent: 'antigravity',
-      requestId: `keystone-${randomUUID()}`,
-    };
-    const response = await fetch(this.buildEndpoint(isStreaming), {
-      method: 'POST',
-      headers: {
-        'Content-Type': 'application/json',
-        Authorization: `Bearer ${token}`,
-        ...GEMINI_HEADERS,
-        ...(isStreaming ? { Accept: 'text/event-stream' } : {}),
-      },
-      body: JSON.stringify(wrappedBody),
-      signal: options?.signal,
-    });
-    if (!response.ok) {
-      const error = await response.text();
-      throw new Error(
-        `Google Gemini API error: ${response.status} ${response.statusText} - ${error}`
-      );
-    }
-    if (isStreaming) {
-      if (!response.body) throw new Error('Response body is null');
-      const reader = response.body.getReader();
-      const decoder = new TextDecoder();
-      let buffer = '';
-      let fullContent = '';
-      const toolCalls: LLMToolCall[] = [];
-      let usage: LLMResponse['usage'] | undefined;
-      while (true) {
-        const { done, value } = await reader.read();
-        if (done) break;
-        buffer += decoder.decode(value, { stream: true });
-        const lines = buffer.split('\n');
-        buffer = lines.pop() || '';
-        for (const line of lines) {
-          const trimmed = line.trim();
-          if (!trimmed.startsWith('data:')) continue;
-          const payload = trimmed.slice(5).trim();
-          if (!payload || payload === '[DONE]') continue;
-          try {
-            const data = JSON.parse(payload) as {
-              candidates?: Array<{ content?: { parts?: GeminiPart[] } }>;
-              usageMetadata?: {
-                promptTokenCount?: number;
-                candidatesTokenCount?: number;
-                totalTokenCount?: number;
-              };
-            };
-            const result = this.extractGeminiParts(
-              data,
-              sanitizedToName,
-              options?.onStream,
-              toolCalls
-            );
-            if (result.content) {
-              if (fullContent.length + result.content.length > MAX_RESPONSE_SIZE) {
-                throw new Error(`LLM response exceeds maximum size of ${MAX_RESPONSE_SIZE} bytes`);
-              }
-              fullContent += result.content;
-            }
-            if (result.usage) {
-              usage = result.usage;
-            }
-          } catch (e) {
-            if (e instanceof Error && e.message.includes('LLM response exceeds')) {
-              throw e;
-            }
-            if (process.env.DEBUG || process.env.LLM_DEBUG) {
-              process.stderr.write(`[Gemini Stream] Failed to parse chunk: ${payload}\n`);
-            }
-          }
-        }
-      }
-      const finalToolCalls = toolCalls.length > 0 ? toolCalls : undefined;
-      return {
-        message: {
-          role: 'assistant',
-          content: fullContent || null,
-          tool_calls: finalToolCalls,
-        },
-        usage,
-      };
-    }
-    const data = (await response.json()) as {
-      candidates?: Array<{ content?: { parts?: GeminiPart[] } }>;
-      usageMetadata?: {
-        promptTokenCount?: number;
-        candidatesTokenCount?: number;
-        totalTokenCount?: number;
-      };
-    };
-    const toolCalls: LLMToolCall[] = [];
-    const extracted = this.extractGeminiParts(data, sanitizedToName, undefined, toolCalls);
-    const content = extracted.content || null;
-    return {
-      message: {
-        role: 'assistant',
-        content,
-        tool_calls: toolCalls.length > 0 ? toolCalls : undefined,
-      },
-      usage: extracted.usage,
-    };
-  }
+  const keys = Object.keys(provider as any);
+  const type = typeof provider;
+  throw new Error(
+    `Provider for model '${model}' is not a function (type: ${type}) and has no .languageModel() method. Available keys: ${keys.join(', ')}`
+  );
 }
-export class CopilotAdapter implements LLMAdapter {
-  private baseUrl: string;
-  constructor(baseUrl?: string) {
-    this.baseUrl = baseUrl || 'https://api.githubcopilot.com';
+export async function getEmbeddingModel(model: string): Promise<EmbeddingModel> {
+  // 1. Check for local fallback
+  if (model === 'local' || model === 'keystone-local') {
+    return new LocalEmbeddingModel();
   }
-  async chat(
-    messages: LLMMessage[],
-    options?: {
-      model?: string;
-      tools?: LLMTool[];
-      onStream?: (chunk: string) => void;
-      signal?: AbortSignal;
-      responseSchema?: any;
-    }
-  ): Promise<LLMResponse> {
-    const isStreaming = !!options?.onStream;
-    const token = await AuthManager.getCopilotToken();
-    if (!token) {
-      throw new Error('GitHub Copilot token not found. Please run "keystone auth login" first.');
-    }
-    const response = await fetch(`${this.baseUrl}/chat/completions`, {
-      method: 'POST',
-      headers: {
-        'Content-Type': 'application/json',
-        Authorization: `Bearer ${token}`,
-        'vscode-editorid': 'vscode-chat',
-        'vscode-machineid': 'default',
-        ...COPILOT_HEADERS,
-      },
-      body: JSON.stringify({
-        model: options?.model || 'gpt-4o',
-        messages,
-        tools: options?.tools,
-        stream: isStreaming,
-      }),
-      signal: options?.signal,
-    });
+  try {
+    const { provider, resolvedModel } = await prepareProvider(model);
-    if (!response.ok) {
-      const error = await response.text();
-      throw new Error(`Copilot API error: ${response.status} ${response.statusText} - ${error}`);
+    // AI SDK convention: provider.textEmbeddingModel(modelId) OR provider.embedding(modelId)
+    // We check all known variations to be safe with different provider implementations or versions
+    if (typeof provider.textEmbeddingModel === 'function') {
+      return provider.textEmbeddingModel(resolvedModel);
     }
-    if (isStreaming) {
-      // Use the same streaming logic as OpenAIAdapter since Copilot uses OpenAI API
-      if (!response.body) throw new Error('Response body is null');
-      return processOpenAIStream(response, options, 'Copilot');
+    if (typeof provider.embedding === 'function') {
+      return provider.embedding(resolvedModel);
     }
-    const data = (await response.json()) as {
-      choices: { message: LLMMessage }[];
-      usage?: { prompt_tokens: number; completion_tokens: number; total_tokens: number };
-    };
-    // Validate response size to prevent memory exhaustion
-    const contentLength = data.choices[0]?.message?.content?.length ?? 0;
-    if (contentLength > MAX_RESPONSE_SIZE) {
-      throw new Error(`LLM response exceeds maximum size of ${MAX_RESPONSE_SIZE} bytes`);
+    if (typeof provider.textEmbedding === 'function') {
+      return provider.textEmbedding(resolvedModel);
     }
-    return {
-      message: data.choices[0].message,
-      usage: data.usage,
-    };
-  }
-}
-export class LocalEmbeddingAdapter implements LLMAdapter {
-  private static extractor: unknown = null;
-  async chat(
-    _messages: LLMMessage[],
-    _options?: {
-      model?: string;
-      tools?: LLMTool[];
-      onStream?: (chunk: string) => void;
-      signal?: AbortSignal;
+  } catch (err) {
+    // If explicit provider setup fails AND it's a default attempt, fallback to local
+    const config = ConfigLoader.load();
+    if (model === config.embedding_model || !model) {
+      new ConsoleLogger().warn(
+        `⚠️  Embedding provider for '${model}' failed, falling back to local embeddings: ${err instanceof Error ? err.message : String(err)}`
+      );
+      return new LocalEmbeddingModel();
     }
-  ): Promise<LLMResponse> {
-    throw new Error(
-      'Local models in Keystone currently only support memory/embedding operations. ' +
-        'To use a local LLM for chat/generation, please use an OpenAI-compatible local server ' +
-        '(like Ollama, LM Studio, or LocalAI) and configure it as an OpenAI provider in your config.'
-    );
+    throw err;
   }
-  async embed(
-    text: string,
-    model = 'Xenova/all-MiniLM-L6-v2',
-    options?: { signal?: AbortSignal }
-  ): Promise<number[]> {
-    const modelToUse = model === 'local' ? 'Xenova/all-MiniLM-L6-v2' : model;
-    if (options?.signal?.aborted) throw new Error('Embedding aborted');
-    if (!LocalEmbeddingAdapter.extractor) {
-      try {
-        ensureOnnxRuntimeLibraryPath();
-        const pipeline = await getTransformersPipeline();
-        LocalEmbeddingAdapter.extractor = await pipeline('feature-extraction', modelToUse);
-      } catch (error) {
-        const details = error instanceof Error ? error.message : String(error);
-        throw new Error(
-          `Failed to initialize local embeddings. If you are running a compiled binary, ensure the keystone-runtime directory is next to the executable (or set KEYSTONE_RUNTIME_DIR), and that the ONNX Runtime shared library is available (set KEYSTONE_ONNX_RUNTIME_LIB_DIR or place it next to the executable). Original error: ${details}`
-        );
-      }
-    }
-    const output = await LocalEmbeddingAdapter.extractor(text, {
-      pooling: 'mean',
-      normalize: true,
-    });
-    return Array.from(output.data);
-  }
+  // Some providers might just return the model directly if called, but usually that's for LanguageModel.
+  // We assume standard AI SDK provider structure here.
+  throw new Error(
+    `Provider for model '${model}' does not support embeddings (no .textEmbeddingModel, .embedding, or .textEmbedding method found).`
+  );
 }
-export function getAdapter(model: string): { adapter: LLMAdapter; resolvedModel: string } {
-  if (model === 'local' || model.startsWith('local:')) {
-    const resolvedModel = model === 'local' ? 'Xenova/all-MiniLM-L6-v2' : model.substring(6);
-    return { adapter: new LocalEmbeddingAdapter(), resolvedModel };
-  }
-  const providerName = ConfigLoader.getProviderForModel(model);
-  const config = ConfigLoader.load();
-  const providerConfig = config.providers[providerName];
-  if (!providerConfig) {
-    throw new Error(`Provider configuration not found for: ${providerName}`);
-  }
-  let resolvedModel = model;
-  if (model.includes(':')) {
-    const [prefix, ...rest] = model.split(':');
-    if (config.providers[prefix]) {
-      resolvedModel = rest.join(':');
-    }
-  }
-  let adapter: LLMAdapter;
-  if (providerConfig.type === 'copilot') {
-    adapter = new CopilotAdapter(providerConfig.base_url);
-  } else if (providerConfig.type === 'openai-chatgpt') {
-    adapter = new OpenAIChatGPTAdapter(providerConfig.base_url);
-  } else if (providerConfig.type === 'google-gemini') {
-    adapter = new GoogleGeminiAdapter(providerConfig.base_url, providerConfig.project_id);
-  } else if (providerConfig.type === 'anthropic-claude') {
-    adapter = new AnthropicClaudeAdapter(providerConfig.base_url);
-  } else {
-    const apiKey = providerConfig.api_key_env
-      ? ConfigLoader.getSecret(providerConfig.api_key_env)
-      : undefined;
-    if (providerConfig.type === 'anthropic') {
-      adapter = new AnthropicAdapter(apiKey, providerConfig.base_url);
-    } else {
-      adapter = new OpenAIAdapter(apiKey, providerConfig.base_url);
-    }
-  }
-  return { adapter, resolvedModel };
+/**
+ * Dispose of the local embedding model's cached pipeline to free memory.
+ * Call this during graceful shutdown or when embeddings are no longer needed.
+ */
+export function disposeLocalEmbeddingModel(): void {
+  LocalEmbeddingModel.dispose();
 }