npm - universal-llm-client - Versions diffs - 4.2.0 → 4.5.0 - Mend

universal-llm-client 4.2.0 → 4.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (108)

package/CHANGELOG.md +142 -103
package/LICENSE +21 -21
package/README.md +640 -591
package/dist/ai-model.d.ts +12 -1
package/dist/ai-model.d.ts.map +1 -1
package/dist/ai-model.js +36 -1
package/dist/ai-model.js.map +1 -1
package/dist/gemma-channel.d.ts +14 -0
package/dist/gemma-channel.d.ts.map +1 -0
package/dist/gemma-channel.js +38 -0
package/dist/gemma-channel.js.map +1 -0
package/dist/gemma-diffusion.d.ts +49 -0
package/dist/gemma-diffusion.d.ts.map +1 -0
package/dist/gemma-diffusion.js +147 -0
package/dist/gemma-diffusion.js.map +1 -0
package/dist/http.d.ts +4 -0
package/dist/http.d.ts.map +1 -1
package/dist/http.js +14 -1
package/dist/http.js.map +1 -1
package/dist/index.d.ts +2 -1
package/dist/index.d.ts.map +1 -1
package/dist/index.js +4 -0
package/dist/index.js.map +1 -1
package/dist/interfaces.d.ts +183 -7
package/dist/interfaces.d.ts.map +1 -1
package/dist/interfaces.js.map +1 -1
package/dist/providers/anthropic.d.ts.map +1 -1
package/dist/providers/anthropic.js +28 -3
package/dist/providers/anthropic.js.map +1 -1
package/dist/providers/google.d.ts +22 -1
package/dist/providers/google.d.ts.map +1 -1
package/dist/providers/google.js +225 -13
package/dist/providers/google.js.map +1 -1
package/dist/providers/ollama.d.ts +2 -0
package/dist/providers/ollama.d.ts.map +1 -1
package/dist/providers/ollama.js +59 -30
package/dist/providers/ollama.js.map +1 -1
package/dist/providers/openai.d.ts +14 -0
package/dist/providers/openai.d.ts.map +1 -1
package/dist/providers/openai.js +200 -22
package/dist/providers/openai.js.map +1 -1
package/dist/router.d.ts +2 -0
package/dist/router.d.ts.map +1 -1
package/dist/router.js +4 -0
package/dist/router.js.map +1 -1
package/dist/stream-decoder.d.ts +12 -0
package/dist/stream-decoder.d.ts.map +1 -1
package/dist/stream-decoder.js +182 -5
package/dist/stream-decoder.js.map +1 -1
package/dist/thinking.d.ts +36 -0
package/dist/thinking.d.ts.map +1 -0
package/dist/thinking.js +52 -0
package/dist/thinking.js.map +1 -0
package/package.json +118 -116
package/src/ai-model.ts +400 -350
package/src/auditor.ts +213 -213
package/src/client.ts +402 -402
package/src/debug/debug-google-streaming.ts +1 -1
package/src/demos/basic/universal-llm-examples.ts +3 -3
package/src/demos/diffusion-gemma/.env +29 -0
package/src/demos/diffusion-gemma/.env.example +27 -0
package/src/demos/diffusion-gemma/CLAUDE.md +95 -0
package/src/demos/diffusion-gemma/README.md +59 -0
package/src/demos/diffusion-gemma/canvas.ts +1606 -0
package/src/demos/diffusion-gemma/docker-compose.yml +29 -0
package/src/demos/diffusion-gemma/probe-stream.ts +51 -0
package/src/demos/diffusion-gemma/probe-tools.ts +55 -0
package/src/demos/diffusion-gemma/server.ts +1205 -0
package/src/demos/diffusion-gemma/start-vllm.sh +98 -0
package/src/gemma-channel.ts +47 -0
package/src/gemma-diffusion.ts +167 -0
package/src/http.ts +261 -247
package/src/index.ts +180 -161
package/src/interfaces.ts +843 -657
package/src/mcp.ts +345 -345
package/src/providers/anthropic.ts +796 -762
package/src/providers/google.ts +840 -620
package/src/providers/index.ts +8 -8
package/src/providers/ollama.ts +503 -469
package/src/providers/openai.ts +587 -392
package/src/router.ts +785 -780
package/src/stream-decoder.ts +535 -361
package/src/structured-output.ts +759 -759
package/src/test-scripts/test-google-deep-research.ts +33 -0
package/src/test-scripts/test-google-streaming-enhanced.ts +147 -147
package/src/test-scripts/test-google-streaming.ts +1 -1
package/src/test-scripts/test-google-system-prompt-comprehensive.ts +189 -189
package/src/test-scripts/test-google-thinking.ts +46 -0
package/src/test-scripts/test-system-message-positions.ts +163 -163
package/src/test-scripts/test-system-prompt-improvement-demo.ts +83 -83
package/src/test-scripts/test-vllm-qwen36.ts +256 -0
package/src/tests/ai-model.test.ts +1614 -1614
package/src/tests/auditor.test.ts +224 -224
package/src/tests/gemma-diffusion.test.ts +115 -0
package/src/tests/http.test.ts +200 -200
package/src/tests/interfaces.test.ts +117 -117
package/src/tests/providers/anthropic.test.ts +118 -0
package/src/tests/providers/google.test.ts +841 -660
package/src/tests/providers/ollama.test.ts +1034 -954
package/src/tests/providers/openai.test.ts +1511 -1122
package/src/tests/router.test.ts +254 -254
package/src/tests/stream-decoder.test.ts +263 -179
package/src/tests/structured-output.test.ts +1450 -1450
package/src/tests/thinking.test.ts +65 -0
package/src/tests/tools.test.ts +175 -175
package/src/thinking.ts +73 -0
package/src/tools.ts +246 -246
package/src/zod-adapter.ts +72 -72

package/src/ai-model.ts CHANGED

@@ -1,350 +1,400 @@
-/**
- * Universal LLM Client v3 — AIModel (The Universal Client)
- *
- * The only public-facing class. Developers configure one model with
- * multiple provider backends for transparent failover.
- *
- * Provider classes are internal — the user never imports them.
- */
-import {
-    AIModelApiType,
-    type AIModelConfig,
-    type ProviderConfig,
-    type LLMClientOptions,
-    type LLMChatMessage,
-    type LLMChatResponse,
-    type ChatOptions,
-    type ModelMetadata,
-    type LLMFunction,
-    type ToolHandler,
-} from './interfaces.js';
-import type { DecodedEvent } from './stream-decoder.js';
-import { Router, type RouterConfig, type ProviderStatus } from './router.js';
-import type { Auditor } from './auditor.js';
-import { NoopAuditor } from './auditor.js';
-import { OllamaClient } from './providers/ollama.js';
-import { OpenAICompatibleClient } from './providers/openai.js';
-import { GoogleClient } from './providers/google.js';
-import { AnthropicClient } from './providers/anthropic.js';
-import { BaseLLMClient } from './client.js';
-import {
-    type StructuredOutputResult,
-    type SchemaConfig,
-} from './structured-output.js';
-// ============================================================================
-// Default Provider URLs
-// ============================================================================
-const DEFAULT_URLS: Record<string, string> = {
-    ollama: 'http://localhost:11434',
-    openai: 'https://api.openai.com',
-    llamacpp: 'http://localhost:8080',
-    anthropic: 'https://api.anthropic.com',
-    // google and vertex build their own URLs internally
-};
-// ============================================================================
-// AIModel — The Universal Client
-// ============================================================================
-export class AIModel {
-    private router: Router;
-    private auditor: Auditor;
-    private config: AIModelConfig;
-    constructor(config: AIModelConfig) {
-        this.config = config;
-        this.auditor = config.auditor ?? new NoopAuditor();
-        const routerConfig: RouterConfig = {
-            retriesPerProvider: config.retries ?? 2,
-            auditor: this.auditor,
-        };
-        this.router = new Router(routerConfig);
-        // Initialize providers in order
-        for (let i = 0; i < config.providers.length; i++) {
-            const providerConfig = config.providers[i]!;
-            const client = this.createClient(providerConfig);
-            const id = `${this.normalizeType(providerConfig.type)}-${i}`;
-            this.router.addProvider({
-                id,
-                client,
-                priority: providerConfig.priority ?? i,
-                modelOverride: providerConfig.model,
-            });
-        }
-    }
-    // ========================================================================
-    // Chat
-    // ========================================================================
-    /** Send a chat request with automatic failover across providers */
-    async chat(
-        messages: LLMChatMessage[],
-        options?: ChatOptions,
-    ): Promise<LLMChatResponse> {
-        return this.router.chat(messages, options);
-    }
-    /** Chat with automatic tool execution (multi-turn loop) */
-    async chatWithTools(
-        messages: LLMChatMessage[],
-        options?: ChatOptions & { maxIterations?: number },
-    ): Promise<LLMChatResponse> {
-        return this.router.chatWithTools(messages, options);
-    }
-    /** Stream chat response with pluggable decoder strategy */
-    async *chatStream(
-        messages: LLMChatMessage[],
-        options?: ChatOptions,
-    ): AsyncGenerator<DecodedEvent, LLMChatResponse | void, unknown> {
-        return yield* this.router.chatStream(messages, options);
-    }
-    // ========================================================================
-    // Structured Output
-    // ========================================================================
-    /**
-     * Generate structured output from the LLM with automatic failover.
-     * Validates the response against the provided Zod schema.
-     * Throws StructuredOutputError on validation failure.
-     *
-     * @template T The output type
-     * @param config Schema configuration (JSON Schema + optional validator)
-     * @param messages Chat messages to send
-     * @param options Additional options (temperature, maxTokens, etc.)
-     * @returns Promise resolving to validated structured output
-     * @throws StructuredOutputError if JSON parsing fails or validation fails
-     *
-     * @example
-     * ```typescript
-     * import { fromZod } from 'universal-llm-client/zod';
-     * const UserConfig = fromZod(z.object({
-     *   name: z.string(),
-     *   age: z.number(),
-     * }));
-     *
-     * const user = await model.generateStructured(UserConfig, [
-     *   { role: 'user', content: 'Generate a user profile' },
-     * ]);
-     * // user.name: string, user.age: number
-     * ```
-     */
-    async generateStructured<T>(
-        config: SchemaConfig<T>,
-        messages: LLMChatMessage[],
-        options?: ChatOptions,
-    ): Promise<T> {
-        return this.router.generateStructured(config, messages, options);
-    }
-    /**
-     * Try to generate structured output, returning a result object instead of throwing.
-     * Same as generateStructured but returns { ok: true, value } on success
-     * and { ok: false, error, rawOutput } on failure.
-     *
-     * @template T The output type
-     * @param config Schema configuration (JSON Schema + optional validator)
-     * @param messages Chat messages to send
-     * @param options Additional options (temperature, maxTokens, etc.)
-     * @returns StructuredOutputResult<T> - either success with value or failure with error
-     *
-     * @example
-     * ```typescript
-     * const result = await model.tryParseStructured(config, messages);
-     *
-     * if (result.ok) {
-     *   console.log('User:', result.value.name);
-     * } else {
-     *   console.log('Error:', result.error.message);
-     *   console.log('Raw output:', result.rawOutput);
-     * }
-     * ```
-     */
-    async tryParseStructured<T>(
-        config: SchemaConfig<T>,
-        messages: LLMChatMessage[],
-        options?: ChatOptions,
-    ): Promise<StructuredOutputResult<T>> {
-        return this.router.tryParseStructured(config, messages, options);
-    }
-    /**
-     * Stream structured output with partial validated objects.
-     *
-     * Yields partial validated objects as JSON generates, then returns the
-     * complete validated object on stream completion.
-     *
-     * For invalid partial JSON, no yield occurs (partial validation is best-effort).
-     * On stream completion, if the final JSON fails validation, throws StructuredOutputError.
-     *
-     * @template T The output type
-     * @param config Schema configuration (JSON Schema + optional validator)
-     * @param messages Chat messages to send
-     * @param options Additional options (temperature, maxTokens, etc.)
-     * @yields Partial validated objects as the JSON stream progresses
-     * @returns Complete validated object on stream completion
-     * @throws StructuredOutputError if final validation fails
-     *
-     * @example
-     * ```typescript
-     * import { fromZod } from 'universal-llm-client/zod';
-     * const UserConfig = fromZod(z.object({
-     *   name: z.string(),
-     *   age: z.number(),
-     * }));
-     *
-     * const stream = model.generateStructuredStream(UserConfig, [
-     *   { role: 'user', content: 'Generate a user' },
-     * ]);
-     *
-     * for await (const partial of stream) {
-     *   console.log('Partial user:', partial);
-     * }
-     * ```
-     */
-    async *generateStructuredStream<T>(
-        config: SchemaConfig<T>,
-        messages: LLMChatMessage[],
-        options?: ChatOptions,
-    ): AsyncGenerator<T, T, unknown> {
-        return yield* this.router.generateStructuredStream(config, messages, options);
-    }
-    // ========================================================================
-    // Embeddings
-    // ========================================================================
-    /** Generate embedding for a single text */
-    async embed(text: string): Promise<number[]> {
-        return this.router.embed(text);
-    }
-    /** Generate embeddings for multiple texts */
-    async embedArray(texts: string[]): Promise<number[][]> {
-        return this.router.embedArray(texts);
-    }
-    // ========================================================================
-    // Tool Registration
-    // ========================================================================
-    /** Register a tool callable by the LLM (broadcast to all providers) */
-    registerTool(
-        name: string,
-        description: string,
-        parameters: LLMFunction['parameters'],
-        handler: ToolHandler,
-    ): void {
-        this.router.registerTool(name, description, parameters, handler);
-    }
-    /** Register multiple tools at once */
-    registerTools(
-        tools: Array<{
-            name: string;
-            description: string;
-            parameters: LLMFunction['parameters'];
-            handler: ToolHandler;
-        }>,
-    ): void {
-        this.router.registerTools(tools);
-    }
-    // ========================================================================
-    // Model Management
-    // ========================================================================
-    /** Get available models from all configured providers */
-    async getModels(): Promise<string[]> {
-        return this.router.getModels();
-    }
-    /** Get metadata about the current model (context length, capabilities) */
-    async getModelInfo(): Promise<ModelMetadata> {
-        return this.router.getModelInfo();
-    }
-    /** Switch model at runtime (updates all providers) */
-    setModel(name: string): void {
-        this.config.model = name;
-        // The model name change will be picked up by the providers
-        // through the router on next request
-    }
-    /** Get the current model name */
-    get model(): string {
-        return this.config.model;
-    }
-    // ========================================================================
-    // Provider Status
-    // ========================================================================
-    /** Get health/status of all configured providers */
-    getProviderStatus(): ProviderStatus[] {
-        return this.router.getStatus();
-    }
-    // ========================================================================
-    // Lifecycle
-    // ========================================================================
-    /** Clean shutdown — flush auditor, disconnect MCP, etc. */
-    async dispose(): Promise<void> {
-        await this.auditor.flush?.();
-    }
-    // ========================================================================
-    // Internal: Provider Factory
-    // ========================================================================
-    private createClient(providerConfig: ProviderConfig): BaseLLMClient {
-        const type = this.normalizeType(providerConfig.type);
-        const modelName = providerConfig.model ?? this.config.model;
-        const clientOptions: LLMClientOptions = {
-            model: modelName,
-            url: providerConfig.url ?? DEFAULT_URLS[type] ?? '',
-            apiType: type as AIModelApiType,
-            apiKey: providerConfig.apiKey,
-            timeout: this.config.timeout ?? 30000,
-            retries: this.config.retries ?? 2,
-            debug: this.config.debug ?? false,
-            defaultParameters: this.config.defaultParameters,
-            thinking: this.config.thinking ?? false,
-            region: providerConfig.region,
-            apiVersion: providerConfig.apiVersion,
-        };
-        switch (type) {
-            case 'ollama':
-                return new OllamaClient(clientOptions, this.auditor);
-            case 'openai':
-            case 'llamacpp':
-                return new OpenAICompatibleClient(clientOptions, this.auditor);
-            case 'google':
-            case 'vertex':
-                return new GoogleClient(clientOptions, this.auditor);
-            case 'anthropic':
-                return new AnthropicClient(clientOptions, this.auditor);
-            default:
-                throw new Error(`Unknown provider type: ${type}`);
-        }
-    }
-    private normalizeType(type: string): string {
-        return type.toLowerCase();
-    }
-}
+/**
+ * Universal LLM Client v3 — AIModel (The Universal Client)
+ *
+ * The only public-facing class. Developers configure one model with
+ * multiple provider backends for transparent failover.
+ *
+ * Provider classes are internal — the user never imports them.
+ */
+import {
+    AIModelApiType,
+    type AIModelConfig,
+    type ProviderConfig,
+    type LLMClientOptions,
+    type LLMChatMessage,
+    type LLMChatResponse,
+    type ChatOptions,
+    type ModelMetadata,
+    type LLMFunction,
+    type ToolHandler,
+    type DeepResearchOptions,
+    type DeepResearchResult,
+    type DeepResearchEvent,
+} from './interfaces.js';
+import type { DecodedEvent } from './stream-decoder.js';
+import { Router, type RouterConfig, type ProviderStatus } from './router.js';
+import type { Auditor } from './auditor.js';
+import { NoopAuditor } from './auditor.js';
+import { OllamaClient } from './providers/ollama.js';
+import { OpenAICompatibleClient } from './providers/openai.js';
+import { GoogleClient } from './providers/google.js';
+import { AnthropicClient } from './providers/anthropic.js';
+import { BaseLLMClient } from './client.js';
+import {
+    type StructuredOutputResult,
+    type SchemaConfig,
+} from './structured-output.js';
+// ============================================================================
+// Default Provider URLs
+// ============================================================================
+const DEFAULT_URLS: Record<string, string> = {
+    ollama: 'http://localhost:11434',
+    openai: 'https://api.openai.com',
+    llamacpp: 'http://localhost:8080',
+    anthropic: 'https://api.anthropic.com',
+    // google and vertex build their own URLs internally
+};
+// ============================================================================
+// AIModel — The Universal Client
+// ============================================================================
+export class AIModel {
+    private router: Router;
+    private auditor: Auditor;
+    private config: AIModelConfig;
+    constructor(config: AIModelConfig) {
+        this.config = config;
+        this.auditor = config.auditor ?? new NoopAuditor();
+        const routerConfig: RouterConfig = {
+            retriesPerProvider: config.retries ?? 2,
+            auditor: this.auditor,
+        };
+        this.router = new Router(routerConfig);
+        // Initialize providers in order
+        for (let i = 0; i < config.providers.length; i++) {
+            const providerConfig = config.providers[i]!;
+            const client = this.createClient(providerConfig);
+            const id = `${this.normalizeType(providerConfig.type)}-${i}`;
+            this.router.addProvider({
+                id,
+                client,
+                priority: providerConfig.priority ?? i,
+                modelOverride: providerConfig.model,
+            });
+        }
+    }
+    // ========================================================================
+    // Chat
+    // ========================================================================
+    /** Send a chat request with automatic failover across providers */
+    async chat(
+        messages: LLMChatMessage[],
+        options?: ChatOptions,
+    ): Promise<LLMChatResponse> {
+        return this.router.chat(messages, options);
+    }
+    /** Chat with automatic tool execution (multi-turn loop) */
+    async chatWithTools(
+        messages: LLMChatMessage[],
+        options?: ChatOptions & { maxIterations?: number },
+    ): Promise<LLMChatResponse> {
+        return this.router.chatWithTools(messages, options);
+    }
+    /** Stream chat response with pluggable decoder strategy */
+    async *chatStream(
+        messages: LLMChatMessage[],
+        options?: ChatOptions,
+    ): AsyncGenerator<DecodedEvent, LLMChatResponse | void, unknown> {
+        return yield* this.router.chatStream(messages, options);
+    }
+    // ========================================================================
+    // Structured Output
+    // ========================================================================
+    /**
+     * Generate structured output from the LLM with automatic failover.
+     * Validates the response against the provided Zod schema.
+     * Throws StructuredOutputError on validation failure.
+     *
+     * @template T The output type
+     * @param config Schema configuration (JSON Schema + optional validator)
+     * @param messages Chat messages to send
+     * @param options Additional options (temperature, maxTokens, etc.)
+     * @returns Promise resolving to validated structured output
+     * @throws StructuredOutputError if JSON parsing fails or validation fails
+     *
+     * @example
+     * ```typescript
+     * import { fromZod } from 'universal-llm-client/zod';
+     * const UserConfig = fromZod(z.object({
+     *   name: z.string(),
+     *   age: z.number(),
+     * }));
+     *
+     * const user = await model.generateStructured(UserConfig, [
+     *   { role: 'user', content: 'Generate a user profile' },
+     * ]);
+     * // user.name: string, user.age: number
+     * ```
+     */
+    async generateStructured<T>(
+        config: SchemaConfig<T>,
+        messages: LLMChatMessage[],
+        options?: ChatOptions,
+    ): Promise<T> {
+        return this.router.generateStructured(config, messages, options);
+    }
+    /**
+     * Try to generate structured output, returning a result object instead of throwing.
+     * Same as generateStructured but returns { ok: true, value } on success
+     * and { ok: false, error, rawOutput } on failure.
+     *
+     * @template T The output type
+     * @param config Schema configuration (JSON Schema + optional validator)
+     * @param messages Chat messages to send
+     * @param options Additional options (temperature, maxTokens, etc.)
+     * @returns StructuredOutputResult<T> - either success with value or failure with error
+     *
+     * @example
+     * ```typescript
+     * const result = await model.tryParseStructured(config, messages);
+     *
+     * if (result.ok) {
+     *   console.log('User:', result.value.name);
+     * } else {
+     *   console.log('Error:', result.error.message);
+     *   console.log('Raw output:', result.rawOutput);
+     * }
+     * ```
+     */
+    async tryParseStructured<T>(
+        config: SchemaConfig<T>,
+        messages: LLMChatMessage[],
+        options?: ChatOptions,
+    ): Promise<StructuredOutputResult<T>> {
+        return this.router.tryParseStructured(config, messages, options);
+    }
+    /**
+     * Stream structured output with partial validated objects.
+     *
+     * Yields partial validated objects as JSON generates, then returns the
+     * complete validated object on stream completion.
+     *
+     * For invalid partial JSON, no yield occurs (partial validation is best-effort).
+     * On stream completion, if the final JSON fails validation, throws StructuredOutputError.
+     *
+     * @template T The output type
+     * @param config Schema configuration (JSON Schema + optional validator)
+     * @param messages Chat messages to send
+     * @param options Additional options (temperature, maxTokens, etc.)
+     * @yields Partial validated objects as the JSON stream progresses
+     * @returns Complete validated object on stream completion
+     * @throws StructuredOutputError if final validation fails
+     *
+     * @example
+     * ```typescript
+     * import { fromZod } from 'universal-llm-client/zod';
+     * const UserConfig = fromZod(z.object({
+     *   name: z.string(),
+     *   age: z.number(),
+     * }));
+     *
+     * const stream = model.generateStructuredStream(UserConfig, [
+     *   { role: 'user', content: 'Generate a user' },
+     * ]);
+     *
+     * for await (const partial of stream) {
+     *   console.log('Partial user:', partial);
+     * }
+     * ```
+     */
+    async *generateStructuredStream<T>(
+        config: SchemaConfig<T>,
+        messages: LLMChatMessage[],
+        options?: ChatOptions,
+    ): AsyncGenerator<T, T, unknown> {
+        return yield* this.router.generateStructuredStream(config, messages, options);
+    }
+    // ========================================================================
+    // Embeddings
+    // ========================================================================
+    /** Generate embedding for a single text */
+    async embed(text: string): Promise<number[]> {
+        return this.router.embed(text);
+    }
+    /** Generate embeddings for multiple texts */
+    async embedArray(texts: string[]): Promise<number[][]> {
+        return this.router.embedArray(texts);
+    }
+    // ========================================================================
+    // Deep Research (Gemini-only)
+    // ========================================================================
+    private getGoogleClient(method: string): GoogleClient {
+        const googleClients = this.router.getClients().filter(
+            (c): c is GoogleClient => c instanceof GoogleClient,
+        );
+        // Prefer an AI Studio client — Vertex AI doesn't support Deep Research.
+        const aiStudio = googleClients.find(c => c.supportsDeepResearch());
+        if (aiStudio) return aiStudio;
+        if (googleClients.length > 0) {
+            throw new Error(
+                `${method} requires an AI Studio Google provider (type: "google"); Vertex AI is not supported for Deep Research.`,
+            );
+        }
+        throw new Error(
+            `${method} requires a Google provider (type: "google"). None is configured.`,
+        );
+    }
+    /**
+     * Run an agentic Deep Research interaction (Gemini only): creates it and
+     * polls until completion. Throws if no Google provider is configured.
+     */
+    async deepResearch(input: string, options?: DeepResearchOptions): Promise<DeepResearchResult> {
+        return this.getGoogleClient('deepResearch').deepResearch(input, options);
+    }
+    /**
+     * Stream a Deep Research interaction's intermediate thought/text/step events
+     * (Gemini only), returning the final result. Throws if no Google provider.
+     */
+    async *deepResearchStream(
+        input: string,
+        options?: DeepResearchOptions,
+    ): AsyncGenerator<DeepResearchEvent, DeepResearchResult, unknown> {
+        return yield* this.getGoogleClient('deepResearchStream').deepResearchStream(input, options);
+    }
+    // ========================================================================
+    // Tool Registration
+    // ========================================================================
+    /** Register a tool callable by the LLM (broadcast to all providers) */
+    registerTool(
+        name: string,
+        description: string,
+        parameters: LLMFunction['parameters'],
+        handler: ToolHandler,
+    ): void {
+        this.router.registerTool(name, description, parameters, handler);
+    }
+    /** Register multiple tools at once */
+    registerTools(
+        tools: Array<{
+            name: string;
+            description: string;
+            parameters: LLMFunction['parameters'];
+            handler: ToolHandler;
+        }>,
+    ): void {
+        this.router.registerTools(tools);
+    }
+    // ========================================================================
+    // Model Management
+    // ========================================================================
+    /** Get available models from all configured providers */
+    async getModels(): Promise<string[]> {
+        return this.router.getModels();
+    }
+    /** Get metadata about the current model (context length, capabilities) */
+    async getModelInfo(): Promise<ModelMetadata> {
+        return this.router.getModelInfo();
+    }
+    /** Switch model at runtime (updates all providers) */
+    setModel(name: string): void {
+        this.config.model = name;
+        // The model name change will be picked up by the providers
+        // through the router on next request
+    }
+    /** Get the current model name */
+    get model(): string {
+        return this.config.model;
+    }
+    // ========================================================================
+    // Provider Status
+    // ========================================================================
+    /** Get health/status of all configured providers */
+    getProviderStatus(): ProviderStatus[] {
+        return this.router.getStatus();
+    }
+    // ========================================================================
+    // Lifecycle
+    // ========================================================================
+    /** Clean shutdown — flush auditor, disconnect MCP, etc. */
+    async dispose(): Promise<void> {
+        await this.auditor.flush?.();
+    }
+    // ========================================================================
+    // Internal: Provider Factory
+    // ========================================================================
+    private createClient(providerConfig: ProviderConfig): BaseLLMClient {
+        const type = this.normalizeType(providerConfig.type);
+        const modelName = providerConfig.model ?? this.config.model;
+        const clientOptions: LLMClientOptions = {
+            model: modelName,
+            url: providerConfig.url ?? DEFAULT_URLS[type] ?? '',
+            apiType: type as AIModelApiType,
+            apiKey: providerConfig.apiKey,
+            timeout: this.config.timeout ?? 30000,
+            retries: this.config.retries ?? 2,
+            debug: this.config.debug ?? false,
+            defaultParameters: this.config.defaultParameters,
+            // Preserve `undefined` (not set) vs explicit false so providers can
+            // decide whether to send a thinking toggle at all.
+            thinking: this.config.thinking,
+            region: providerConfig.region,
+            apiVersion: providerConfig.apiVersion,
+            extraHeaders: providerConfig.headers,
+            queryParams: providerConfig.queryParams,
+            authHeader: providerConfig.authHeader,
+            authPrefix: providerConfig.authPrefix,
+            apiBasePath: providerConfig.apiBasePath,
+        };
+        switch (type) {
+            case 'ollama':
+                return new OllamaClient(clientOptions, this.auditor);
+            case 'openai':
+            case 'llamacpp':
+                return new OpenAICompatibleClient(clientOptions, this.auditor);
+            case 'google':
+            case 'vertex':
+                return new GoogleClient(clientOptions, this.auditor);
+            case 'anthropic':
+                return new AnthropicClient(clientOptions, this.auditor);
+            default:
+                throw new Error(`Unknown provider type: ${type}`);
+        }
+    }
+    private normalizeType(type: string): string {
+        return type.toLowerCase();
+    }
+}