npm - universal-llm-client - Versions diffs - 4.2.0 → 4.5.0 - Mend

universal-llm-client 4.2.0 → 4.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (108)

package/CHANGELOG.md +142 -103
package/LICENSE +21 -21
package/README.md +640 -591
package/dist/ai-model.d.ts +12 -1
package/dist/ai-model.d.ts.map +1 -1
package/dist/ai-model.js +36 -1
package/dist/ai-model.js.map +1 -1
package/dist/gemma-channel.d.ts +14 -0
package/dist/gemma-channel.d.ts.map +1 -0
package/dist/gemma-channel.js +38 -0
package/dist/gemma-channel.js.map +1 -0
package/dist/gemma-diffusion.d.ts +49 -0
package/dist/gemma-diffusion.d.ts.map +1 -0
package/dist/gemma-diffusion.js +147 -0
package/dist/gemma-diffusion.js.map +1 -0
package/dist/http.d.ts +4 -0
package/dist/http.d.ts.map +1 -1
package/dist/http.js +14 -1
package/dist/http.js.map +1 -1
package/dist/index.d.ts +2 -1
package/dist/index.d.ts.map +1 -1
package/dist/index.js +4 -0
package/dist/index.js.map +1 -1
package/dist/interfaces.d.ts +183 -7
package/dist/interfaces.d.ts.map +1 -1
package/dist/interfaces.js.map +1 -1
package/dist/providers/anthropic.d.ts.map +1 -1
package/dist/providers/anthropic.js +28 -3
package/dist/providers/anthropic.js.map +1 -1
package/dist/providers/google.d.ts +22 -1
package/dist/providers/google.d.ts.map +1 -1
package/dist/providers/google.js +225 -13
package/dist/providers/google.js.map +1 -1
package/dist/providers/ollama.d.ts +2 -0
package/dist/providers/ollama.d.ts.map +1 -1
package/dist/providers/ollama.js +59 -30
package/dist/providers/ollama.js.map +1 -1
package/dist/providers/openai.d.ts +14 -0
package/dist/providers/openai.d.ts.map +1 -1
package/dist/providers/openai.js +200 -22
package/dist/providers/openai.js.map +1 -1
package/dist/router.d.ts +2 -0
package/dist/router.d.ts.map +1 -1
package/dist/router.js +4 -0
package/dist/router.js.map +1 -1
package/dist/stream-decoder.d.ts +12 -0
package/dist/stream-decoder.d.ts.map +1 -1
package/dist/stream-decoder.js +182 -5
package/dist/stream-decoder.js.map +1 -1
package/dist/thinking.d.ts +36 -0
package/dist/thinking.d.ts.map +1 -0
package/dist/thinking.js +52 -0
package/dist/thinking.js.map +1 -0
package/package.json +118 -116
package/src/ai-model.ts +400 -350
package/src/auditor.ts +213 -213
package/src/client.ts +402 -402
package/src/debug/debug-google-streaming.ts +1 -1
package/src/demos/basic/universal-llm-examples.ts +3 -3
package/src/demos/diffusion-gemma/.env +29 -0
package/src/demos/diffusion-gemma/.env.example +27 -0
package/src/demos/diffusion-gemma/CLAUDE.md +95 -0
package/src/demos/diffusion-gemma/README.md +59 -0
package/src/demos/diffusion-gemma/canvas.ts +1606 -0
package/src/demos/diffusion-gemma/docker-compose.yml +29 -0
package/src/demos/diffusion-gemma/probe-stream.ts +51 -0
package/src/demos/diffusion-gemma/probe-tools.ts +55 -0
package/src/demos/diffusion-gemma/server.ts +1205 -0
package/src/demos/diffusion-gemma/start-vllm.sh +98 -0
package/src/gemma-channel.ts +47 -0
package/src/gemma-diffusion.ts +167 -0
package/src/http.ts +261 -247
package/src/index.ts +180 -161
package/src/interfaces.ts +843 -657
package/src/mcp.ts +345 -345
package/src/providers/anthropic.ts +796 -762
package/src/providers/google.ts +840 -620
package/src/providers/index.ts +8 -8
package/src/providers/ollama.ts +503 -469
package/src/providers/openai.ts +587 -392
package/src/router.ts +785 -780
package/src/stream-decoder.ts +535 -361
package/src/structured-output.ts +759 -759
package/src/test-scripts/test-google-deep-research.ts +33 -0
package/src/test-scripts/test-google-streaming-enhanced.ts +147 -147
package/src/test-scripts/test-google-streaming.ts +1 -1
package/src/test-scripts/test-google-system-prompt-comprehensive.ts +189 -189
package/src/test-scripts/test-google-thinking.ts +46 -0
package/src/test-scripts/test-system-message-positions.ts +163 -163
package/src/test-scripts/test-system-prompt-improvement-demo.ts +83 -83
package/src/test-scripts/test-vllm-qwen36.ts +256 -0
package/src/tests/ai-model.test.ts +1614 -1614
package/src/tests/auditor.test.ts +224 -224
package/src/tests/gemma-diffusion.test.ts +115 -0
package/src/tests/http.test.ts +200 -200
package/src/tests/interfaces.test.ts +117 -117
package/src/tests/providers/anthropic.test.ts +118 -0
package/src/tests/providers/google.test.ts +841 -660
package/src/tests/providers/ollama.test.ts +1034 -954
package/src/tests/providers/openai.test.ts +1511 -1122
package/src/tests/router.test.ts +254 -254
package/src/tests/stream-decoder.test.ts +263 -179
package/src/tests/structured-output.test.ts +1450 -1450
package/src/tests/thinking.test.ts +65 -0
package/src/tests/tools.test.ts +175 -175
package/src/thinking.ts +73 -0
package/src/tools.ts +246 -246
package/src/zod-adapter.ts +72 -72

package/src/tests/router.test.ts CHANGED

@@ -1,254 +1,254 @@
-/**
- * Tests for router.ts — Failover Engine
- */
-import { describe, it, expect, mock, beforeEach } from 'bun:test';
-import { Router, type ProviderEntry } from '../router.js';
-import { BaseLLMClient } from '../client.js';
-import { BufferedAuditor } from '../auditor.js';
-import type {
-    LLMChatMessage,
-    LLMChatResponse,
-    ChatOptions,
-    DecodedEvent,
-} from '../interfaces.js';
-// ============================================================================
-// Mock Client
-// ============================================================================
-class MockClient extends BaseLLMClient {
-    public chatFn: (messages: LLMChatMessage[]) => Promise<LLMChatResponse>;
-    public embedFn: (text: string) => Promise<number[]>;
-    public modelsFn: () => Promise<string[]>;
-    constructor(id: string, opts?: {
-        chatFn?: (messages: LLMChatMessage[]) => Promise<LLMChatResponse>;
-        embedFn?: (text: string) => Promise<number[]>;
-    }) {
-        super({
-            model: `mock-${id}`,
-            url: `http://mock-${id}`,
-            apiType: 'openai' as never,
-        });
-        this.chatFn = opts?.chatFn ?? (async () => ({
-            message: { role: 'assistant' as const, content: `Response from ${id}` },
-            provider: id,
-        }));
-        this.embedFn = opts?.embedFn ?? (async () => [1, 2, 3]);
-        this.modelsFn = async () => [`mock-${id}`];
-    }
-    async chat(messages: LLMChatMessage[]): Promise<LLMChatResponse> {
-        return this.chatFn(messages);
-    }
-    async *chatStream(): AsyncGenerator<DecodedEvent, LLMChatResponse | void, unknown> {
-        yield { type: 'text', content: 'streamed' };
-        return { message: { role: 'assistant', content: 'streamed' }, provider: 'mock' };
-    }
-    async getModels(): Promise<string[]> {
-        return this.modelsFn();
-    }
-    async embed(text: string): Promise<number[]> {
-        return this.embedFn(text);
-    }
-}
-// ============================================================================
-// Tests
-// ============================================================================
-describe('Router', () => {
-    let router: Router;
-    let auditor: BufferedAuditor;
-    beforeEach(() => {
-        auditor = new BufferedAuditor();
-        router = new Router({ auditor, retriesPerProvider: 1, maxFailures: 2, cooldownMs: 100 });
-    });
-    describe('provider management', () => {
-        it('adds providers and sorts by priority', () => {
-            const clientA = new MockClient('a');
-            const clientB = new MockClient('b');
-            router.addProvider({ id: 'a', client: clientA, priority: 2 });
-            router.addProvider({ id: 'b', client: clientB, priority: 1 });
-            const status = router.getStatus();
-            expect(status).toHaveLength(2);
-            // b has lower priority number = tried first
-            expect(status[0]!.id).toBe('b');
-            expect(status[1]!.id).toBe('a');
-        });
-        it('removes providers', () => {
-            router.addProvider({ id: 'a', client: new MockClient('a'), priority: 0 });
-            router.addProvider({ id: 'b', client: new MockClient('b'), priority: 1 });
-            router.removeProvider('a');
-            expect(router.getStatus()).toHaveLength(1);
-            expect(router.getStatus()[0]!.id).toBe('b');
-        });
-    });
-    describe('execution with failover', () => {
-        it('uses the highest-priority provider', async () => {
-            const clientA = new MockClient('a');
-            const clientB = new MockClient('b');
-            router.addProvider({ id: 'a', client: clientA, priority: 0 });
-            router.addProvider({ id: 'b', client: clientB, priority: 1 });
-            const result = await router.chat([{ role: 'user', content: 'test' }]);
-            expect(result.provider).toBe('a');
-        });
-        it('fails over to next provider on error', async () => {
-            const clientA = new MockClient('a', {
-                chatFn: async () => { throw new Error('A failed'); },
-            });
-            const clientB = new MockClient('b');
-            router.addProvider({ id: 'a', client: clientA, priority: 0 });
-            router.addProvider({ id: 'b', client: clientB, priority: 1 });
-            const result = await router.chat([{ role: 'user', content: 'test' }]);
-            expect(result.provider).toBe('b');
-            // Check audit events
-            const events = auditor.getEvents();
-            const failoverEvents = events.filter(e => e.type === 'failover');
-            expect(failoverEvents.length).toBeGreaterThan(0);
-        });
-        it('retries within a provider before failover', async () => {
-            let attempts = 0;
-            const clientA = new MockClient('a', {
-                chatFn: async () => {
-                    attempts++;
-                    if (attempts === 1) throw new Error('Transient failure');
-                    return {
-                        message: { role: 'assistant' as const, content: 'recovered' },
-                        provider: 'a',
-                    };
-                },
-            });
-            router.addProvider({ id: 'a', client: clientA, priority: 0 });
-            const result = await router.chat([{ role: 'user', content: 'test' }]);
-            expect(result.provider).toBe('a');
-            expect(attempts).toBe(2); // first attempt + 1 retry
-        });
-        it('throws when all providers fail', async () => {
-            const clientA = new MockClient('a', {
-                chatFn: async () => { throw new Error('A failed'); },
-            });
-            const clientB = new MockClient('b', {
-                chatFn: async () => { throw new Error('B failed'); },
-            });
-            router.addProvider({ id: 'a', client: clientA, priority: 0 });
-            router.addProvider({ id: 'b', client: clientB, priority: 1 });
-            expect(router.chat([{ role: 'user', content: 'test' }])).rejects.toThrow();
-        });
-        it('throws when no providers configured', async () => {
-            expect(router.chat([{ role: 'user', content: 'test' }])).rejects.toThrow(
-                'No available LLM providers'
-            );
-        });
-    });
-    describe('health tracking', () => {
-        it('marks unhealthy after max failures', async () => {
-            const failing = new MockClient('fail', {
-                chatFn: async () => { throw new Error('always fails'); },
-            });
-            const backup = new MockClient('backup');
-            router.addProvider({ id: 'fail', client: failing, priority: 0 });
-            router.addProvider({ id: 'backup', client: backup, priority: 1 });
-            // Each chat call records 1 failure for 'fail', maxFailures is 2
-            await router.chat([{ role: 'user', content: 'test 1' }]);
-            await router.chat([{ role: 'user', content: 'test 2' }]);
-            const status = router.getStatus();
-            const failStatus = status.find(s => s.id === 'fail');
-            expect(failStatus!.healthy).toBe(false);
-        });
-        it('recovers after cooldown expires', async () => {
-            let callCount = 0;
-            const failing = new MockClient('fail', {
-                chatFn: async () => {
-                    callCount++;
-                    if (callCount <= 4) throw new Error('failing');
-                    return {
-                        message: { role: 'assistant' as const, content: 'recovered' },
-                        provider: 'fail',
-                    };
-                },
-            });
-            const backup = new MockClient('backup');
-            router.addProvider({ id: 'fail', client: failing, priority: 0 });
-            router.addProvider({ id: 'backup', client: backup, priority: 1 });
-            // First call: fail → backup
-            await router.chat([{ role: 'user', content: '1' }]);
-            // Wait for cooldown (100ms in test config)
-            await new Promise(r => setTimeout(r, 150));
-            // After cooldown, fail should be tried again
-            const status = router.getStatus();
-            const failStatus = status.find(s => s.id === 'fail');
-            expect(failStatus!.healthy).toBe(true);
-        });
-    });
-    describe('tool registration', () => {
-        it('broadcasts tool registration to all providers', () => {
-            const clientA = new MockClient('a');
-            const clientB = new MockClient('b');
-            router.addProvider({ id: 'a', client: clientA, priority: 0 });
-            router.addProvider({ id: 'b', client: clientB, priority: 1 });
-            router.registerTool(
-                'test_tool',
-                'A test tool',
-                { type: 'object', properties: {} },
-                async () => 'result',
-            );
-            // Both clients should have the tool registered
-            const defsA = clientA.getToolDefinitions();
-            const defsB = clientB.getToolDefinitions();
-            expect(defsA).toHaveLength(1);
-            expect(defsB).toHaveLength(1);
-            expect(defsA[0]!.function.name).toBe('test_tool');
-        });
-    });
-    describe('model aggregation', () => {
-        it('aggregates models from all providers', async () => {
-            const clientA = new MockClient('a');
-            const clientB = new MockClient('b');
-            router.addProvider({ id: 'a', client: clientA, priority: 0 });
-            router.addProvider({ id: 'b', client: clientB, priority: 1 });
-            const models = await router.getModels();
-            expect(models).toContain('mock-a');
-            expect(models).toContain('mock-b');
-        });
-    });
-});
+/**
+ * Tests for router.ts — Failover Engine
+ */
+import { describe, it, expect, mock, beforeEach } from 'bun:test';
+import { Router, type ProviderEntry } from '../router.js';
+import { BaseLLMClient } from '../client.js';
+import { BufferedAuditor } from '../auditor.js';
+import type {
+    LLMChatMessage,
+    LLMChatResponse,
+    ChatOptions,
+    DecodedEvent,
+} from '../interfaces.js';
+// ============================================================================
+// Mock Client
+// ============================================================================
+/**
+ * Scriptable test double for a provider client.
+ *
+ * `chat`, `embed` and `getModels` simply forward to the public `chatFn`,
+ * `embedFn` and `modelsFn` fields, so a test can swap behaviour per instance.
+ * `chatStream` always emits a single fixed text event.
+ */
+class MockClient extends BaseLLMClient {
+    public chatFn: (messages: LLMChatMessage[]) => Promise<LLMChatResponse>;
+    public embedFn: (text: string) => Promise<number[]>;
+    public modelsFn: () => Promise<string[]>;
+    /**
+     * @param id   Used to build the mock model name and URL, and reported as
+     *             `provider` by the default chat handler.
+     * @param opts Optional replacements for the default chat / embed handlers.
+     */
+    constructor(id: string, opts?: {
+        chatFn?: (messages: LLMChatMessage[]) => Promise<LLMChatResponse>;
+        embedFn?: (text: string) => Promise<number[]>;
+    }) {
+        super({
+            model: `mock-${id}`,
+            url: `http://mock-${id}`,
+            apiType: 'openai' as never,
+        });
+        // Fallback handlers, used only when the caller supplies no override.
+        const cannedChat = async () => ({
+            message: { role: 'assistant' as const, content: `Response from ${id}` },
+            provider: id,
+        });
+        const cannedEmbed = async () => [1, 2, 3];
+        const { chatFn, embedFn } = opts ?? {};
+        this.chatFn = chatFn ?? cannedChat;
+        this.embedFn = embedFn ?? cannedEmbed;
+        this.modelsFn = async () => [`mock-${id}`];
+    }
+    /** Forwards the messages to the current `chatFn`. */
+    async chat(messages: LLMChatMessage[]): Promise<LLMChatResponse> {
+        return this.chatFn(messages);
+    }
+    /** Yields one text event, then returns a matching assistant message. */
+    async *chatStream(): AsyncGenerator<DecodedEvent, LLMChatResponse | void, unknown> {
+        yield { type: 'text', content: 'streamed' };
+        return { message: { role: 'assistant', content: 'streamed' }, provider: 'mock' };
+    }
+    /** Forwards to the current `modelsFn`. */
+    async getModels(): Promise<string[]> {
+        return this.modelsFn();
+    }
+    /** Forwards the text to the current `embedFn`. */
+    async embed(text: string): Promise<number[]> {
+        return this.embedFn(text);
+    }
+}
+// ============================================================================
+// Tests
+// ============================================================================
+/**
+ * Router test suite.
+ *
+ * Each test starts from a fresh Router wired to a new BufferedAuditor and
+ * configured with retriesPerProvider: 1, maxFailures: 2, cooldownMs: 100.
+ * Providers are MockClient instances whose chat behaviour is scripted per test.
+ */
+describe('Router', () => {
+    let router: Router;
+    let auditor: BufferedAuditor;
+    beforeEach(() => {
+        auditor = new BufferedAuditor();
+        router = new Router({ auditor, retriesPerProvider: 1, maxFailures: 2, cooldownMs: 100 });
+    });
+    // Adding / removing providers and the ordering reported by getStatus().
+    describe('provider management', () => {
+        it('adds providers and sorts by priority', () => {
+            const clientA = new MockClient('a');
+            const clientB = new MockClient('b');
+            router.addProvider({ id: 'a', client: clientA, priority: 2 });
+            router.addProvider({ id: 'b', client: clientB, priority: 1 });
+            const status = router.getStatus();
+            expect(status).toHaveLength(2);
+            // b has lower priority number = tried first
+            expect(status[0]!.id).toBe('b');
+            expect(status[1]!.id).toBe('a');
+        });
+        it('removes providers', () => {
+            router.addProvider({ id: 'a', client: new MockClient('a'), priority: 0 });
+            router.addProvider({ id: 'b', client: new MockClient('b'), priority: 1 });
+            router.removeProvider('a');
+            expect(router.getStatus()).toHaveLength(1);
+            expect(router.getStatus()[0]!.id).toBe('b');
+        });
+    });
+    // chat() routing: provider selection, retry, failover and total failure.
+    describe('execution with failover', () => {
+        it('uses the highest-priority provider', async () => {
+            const clientA = new MockClient('a');
+            const clientB = new MockClient('b');
+            router.addProvider({ id: 'a', client: clientA, priority: 0 });
+            router.addProvider({ id: 'b', client: clientB, priority: 1 });
+            const result = await router.chat([{ role: 'user', content: 'test' }]);
+            expect(result.provider).toBe('a');
+        });
+        it('fails over to next provider on error', async () => {
+            const clientA = new MockClient('a', {
+                chatFn: async () => { throw new Error('A failed'); },
+            });
+            const clientB = new MockClient('b');
+            router.addProvider({ id: 'a', client: clientA, priority: 0 });
+            router.addProvider({ id: 'b', client: clientB, priority: 1 });
+            const result = await router.chat([{ role: 'user', content: 'test' }]);
+            expect(result.provider).toBe('b');
+            // Check audit events
+            const events = auditor.getEvents();
+            const failoverEvents = events.filter(e => e.type === 'failover');
+            expect(failoverEvents.length).toBeGreaterThan(0);
+        });
+        it('retries within a provider before failover', async () => {
+            let attempts = 0;
+            const clientA = new MockClient('a', {
+                chatFn: async () => {
+                    attempts++;
+                    if (attempts === 1) throw new Error('Transient failure');
+                    return {
+                        message: { role: 'assistant' as const, content: 'recovered' },
+                        provider: 'a',
+                    };
+                },
+            });
+            router.addProvider({ id: 'a', client: clientA, priority: 0 });
+            const result = await router.chat([{ role: 'user', content: 'test' }]);
+            expect(result.provider).toBe('a');
+            expect(attempts).toBe(2); // first attempt + 1 retry
+        });
+        it('throws when all providers fail', async () => {
+            const clientA = new MockClient('a', {
+                chatFn: async () => { throw new Error('A failed'); },
+            });
+            const clientB = new MockClient('b', {
+                chatFn: async () => { throw new Error('B failed'); },
+            });
+            router.addProvider({ id: 'a', client: clientA, priority: 0 });
+            router.addProvider({ id: 'b', client: clientB, priority: 1 });
+            // Await the `.rejects` matcher: without it the test function can return
+            // before the expectation settles, so a failed expectation would not fail the test.
+            await expect(router.chat([{ role: 'user', content: 'test' }])).rejects.toThrow();
+        });
+        it('throws when no providers configured', async () => {
+            // Awaited for the same reason as above.
+            await expect(router.chat([{ role: 'user', content: 'test' }])).rejects.toThrow(
+                'No available LLM providers'
+            );
+        });
+    });
+    // Health flag reported by getStatus() after failures and after the cooldown.
+    describe('health tracking', () => {
+        it('marks unhealthy after max failures', async () => {
+            const failing = new MockClient('fail', {
+                chatFn: async () => { throw new Error('always fails'); },
+            });
+            const backup = new MockClient('backup');
+            router.addProvider({ id: 'fail', client: failing, priority: 0 });
+            router.addProvider({ id: 'backup', client: backup, priority: 1 });
+            // Each chat call records 1 failure for 'fail', maxFailures is 2
+            await router.chat([{ role: 'user', content: 'test 1' }]);
+            await router.chat([{ role: 'user', content: 'test 2' }]);
+            const status = router.getStatus();
+            const failStatus = status.find(s => s.id === 'fail');
+            expect(failStatus!.healthy).toBe(false);
+        });
+        it('recovers after cooldown expires', async () => {
+            // NOTE(review): only one chat() call is made before the wait. If each call
+            // records a single failure (as the previous test's comment states) and
+            // maxFailures is 2, 'fail' may never have been marked unhealthy here, and the
+            // success branch of chatFn (callCount > 4) is never reached. Confirm this
+            // test really exercises cooldown recovery.
+            let callCount = 0;
+            const failing = new MockClient('fail', {
+                chatFn: async () => {
+                    callCount++;
+                    if (callCount <= 4) throw new Error('failing');
+                    return {
+                        message: { role: 'assistant' as const, content: 'recovered' },
+                        provider: 'fail',
+                    };
+                },
+            });
+            const backup = new MockClient('backup');
+            router.addProvider({ id: 'fail', client: failing, priority: 0 });
+            router.addProvider({ id: 'backup', client: backup, priority: 1 });
+            // First call: fail → backup
+            await router.chat([{ role: 'user', content: '1' }]);
+            // Wait for cooldown (100ms in test config)
+            await new Promise(r => setTimeout(r, 150));
+            // After cooldown, fail should be tried again
+            const status = router.getStatus();
+            const failStatus = status.find(s => s.id === 'fail');
+            expect(failStatus!.healthy).toBe(true);
+        });
+    });
+    // registerTool() on the router should reach every registered client.
+    describe('tool registration', () => {
+        it('broadcasts tool registration to all providers', () => {
+            const clientA = new MockClient('a');
+            const clientB = new MockClient('b');
+            router.addProvider({ id: 'a', client: clientA, priority: 0 });
+            router.addProvider({ id: 'b', client: clientB, priority: 1 });
+            router.registerTool(
+                'test_tool',
+                'A test tool',
+                { type: 'object', properties: {} },
+                async () => 'result',
+            );
+            // Both clients should have the tool registered
+            const defsA = clientA.getToolDefinitions();
+            const defsB = clientB.getToolDefinitions();
+            expect(defsA).toHaveLength(1);
+            expect(defsB).toHaveLength(1);
+            expect(defsA[0]!.function.name).toBe('test_tool');
+        });
+    });
+    // getModels() on the router should include each client's model list.
+    describe('model aggregation', () => {
+        it('aggregates models from all providers', async () => {
+            const clientA = new MockClient('a');
+            const clientB = new MockClient('b');
+            router.addProvider({ id: 'a', client: clientA, priority: 0 });
+            router.addProvider({ id: 'b', client: clientB, priority: 1 });
+            const models = await router.getModels();
+            expect(models).toContain('mock-a');
+            expect(models).toContain('mock-b');
+        });
+    });
+});