@webmcp-auto-ui/agent 2.5.12 → 2.5.15

package/README.md CHANGED
@@ -4,12 +4,14 @@ LLM agent loop that connects MCP and WebMCP servers to a UI. Given a user messag
 
 ## Providers
 
-**AnthropicProvider** — proxies to a `+server.ts` endpoint that holds the API key. Supports `claude-haiku-4-5` and `claude-sonnet-4-6`. Prompt caching enabled by default. Retry on 503 with exponential backoff. Returns stats in `LLMResponse`: tok/s, totalTokens, latencyMs.
+**RemoteLLMProvider** — proxies to a `+server.ts` endpoint that holds the API key. Works with any OpenAI-compatible backend (Anthropic, OpenAI, Google, Mistral, etc.). Prompt caching enabled by default. Retry on 503 with exponential backoff. Returns stats in `LLMResponse`: tok/s, totalTokens, latencyMs.
 
 **GemmaProvider (LiteRT)** — runs Gemma 4 models via `@mediapipe/tasks-genai` (LiteRT, formerly TensorFlow Lite) directly on the **main thread**. Uses WebGPU when available. No API key required. Models are cached in **OPFS** (Origin Private File System) for instant reload after the first download.
 
 > **v0.5.0 migration**: GemmaProvider was migrated from ONNX (`@huggingface/transformers`) to LiteRT (`@mediapipe/tasks-genai`). LiteRT is 2-4x faster on WebGPU and provides native Gemma 4 support. The provider now runs on the main thread because MediaPipe is incompatible with ES module workers.
 
+**LocalLLMProvider** — runs against a local Ollama instance (or any OpenAI-compatible local server: vLLM, LM Studio, llamafile). No API key required. Converts messages and tools to the OpenAI chat completions format automatically.
+
 **Gemma 4 prompt format** — uses `<|turn>...<turn|>` delimiters (instead of the Gemma 2/3 `<start_of_turn>...<end_of_turn>`).
 
 **Native tool calling** — Gemma 4 tool calls are parsed from the `<|tool_call>call:name{args}<tool_call|>` format. No regex heuristics needed.
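
The tool-call delimiters described in this hunk are easiest to see in code. The following is an illustrative sketch, not the package's parser: a minimal extractor for `<|tool_call>call:name{args}<tool_call|>` spans in Gemma 4 output, using plain string scanning rather than regex, and assuming `args` is a JSON object literal.

```ts
// Illustrative sketch only, not the package's parser. Assumes each tool call
// looks like <|tool_call>call:name{...json args...}<tool_call|> as documented above.
interface ParsedToolCall {
  name: string;
  args: Record<string, unknown>;
}

function parseGemmaToolCalls(output: string): ParsedToolCall[] {
  const OPEN = '<|tool_call>call:';
  const CLOSE = '<tool_call|>';
  const calls: ParsedToolCall[] = [];
  let start = output.indexOf(OPEN);
  while (start !== -1) {
    const end = output.indexOf(CLOSE, start);
    if (end === -1) break; // unterminated tool call: stop scanning
    const inner = output.slice(start + OPEN.length, end); // "name{...}"
    const brace = inner.indexOf('{');
    if (brace > 0) {
      calls.push({
        name: inner.slice(0, brace),
        args: JSON.parse(inner.slice(brace)) as Record<string, unknown>,
      });
    }
    start = output.indexOf(OPEN, end + CLOSE.length);
  }
  return calls;
}
```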
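For the new LocalLLMProvider, the diff does not show the conversion code, but the target wire format is the standard OpenAI chat completions request that Ollama, vLLM, LM Studio, and llamafile all expose. A hedged sketch of that shape follows; the endpoint URL assumes a default Ollama install, and the model name and tool schema are placeholders.

```ts
// Sketch of the request shape LocalLLMProvider presumably produces; this is
// not the package's internal code. http://localhost:11434 is Ollama's default
// OpenAI-compatible endpoint; the model name is whatever the server has loaded.
const res = await fetch('http://localhost:11434/v1/chat/completions', {
  method: 'POST',
  headers: { 'Content-Type': 'application/json' },
  body: JSON.stringify({
    model: 'llama3.1', // placeholder model name
    messages: [
      { role: 'system', content: 'You are a helpful agent.' },
      { role: 'user', content: 'Show me sales data' },
    ],
    tools: [
      {
        type: 'function',
        function: {
          name: 'get_sales', // hypothetical tool for illustration
          description: 'Fetch sales figures',
          parameters: { type: 'object', properties: { quarter: { type: 'string' } } },
        },
      },
    ],
  }),
});
const completion = await res.json();
```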
@@ -46,10 +48,10 @@ npm install @webmcp-auto-ui/agent
 ## Usage
 
 ```ts
-import { autoui, runAgentLoop, AnthropicProvider } from '@webmcp-auto-ui/agent';
+import { autoui, runAgentLoop, RemoteLLMProvider } from '@webmcp-auto-ui/agent';
 
 const result = await runAgentLoop('Show me sales data', {
-  provider: new AnthropicProvider({ proxyUrl: '/api/chat' }),
+  provider: new RemoteLLMProvider({ proxyUrl: '/api/chat' }),
   layers: [mcpClient.layer(), autoui.layer()],
   maxIterations: 5,
   callbacks: {
@@ -64,8 +66,6 @@ const result = await runAgentLoop('Show me sales data', {
 });
 ```
 
-> **Migration from Phase 7**: `onBlock` still works as a deprecated alias for `onWidget`. The `UILayer`, `SkillLayer`, `COMPONENT_TOOL`, `executeComponent`, and `componentRegistry` exports are removed — use `autoui.layer()` instead.
-
 ## TokenTracker
 
 Real-time usage metrics tracking across requests:
@@ -125,18 +125,19 @@ Requires `Cross-Origin-Opener-Policy: same-origin` and `Cross-Origin-Embedder-Po
 
 ## API proxy (`+server.ts`)
 
-The `AnthropicProvider` sends requests to a local endpoint. The endpoint reads `ANTHROPIC_API_KEY` from the environment, or from `body.__apiKey` as a fallback (for cases where the key is provided at runtime).
+The `RemoteLLMProvider` sends requests to a local `+server.ts` endpoint that forwards them to the configured LLM API. The endpoint reads `LLM_API_KEY` from the environment, or from `body.__apiKey` as a fallback (for cases where the key is provided at runtime).
 
 ```ts
 // src/routes/api/chat/+server.ts
 import { env } from '$env/dynamic/private';
 export const POST: RequestHandler = async ({ request }) => {
   const body = await request.json();
-  const apiKey = body.__apiKey || env.ANTHROPIC_API_KEY;
+  const apiKey = body.__apiKey || env.LLM_API_KEY;
   delete body.__apiKey;
-  const res = await fetch('https://api.anthropic.com/v1/messages', {
+  // Forward to your LLM provider (Anthropic, OpenAI, Mistral, etc.)
+  const res = await fetch(LLM_ENDPOINT, {
     method: 'POST',
-    headers: { 'x-api-key': apiKey, 'anthropic-version': '2023-06-01', 'Content-Type': 'application/json' },
+    headers: { 'Authorization': `Bearer ${apiKey}`, 'Content-Type': 'application/json' },
     body: JSON.stringify(body),
   });
   return Response.json(await res.json());
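
The provider internals are not part of this diff, but the "retry on 503 with exponential backoff" behavior noted for `RemoteLLMProvider` follows a standard pattern. A generic sketch is below; the attempt count and delays are illustrative, not the package's actual values.

```ts
// Generic retry-on-503 sketch, not the package's implementation.
async function fetchWithBackoff(
  url: string,
  init: RequestInit,
  maxRetries = 3,
): Promise<Response> {
  for (let attempt = 0; ; attempt++) {
    const res = await fetch(url, init);
    if (res.status !== 503 || attempt >= maxRetries) return res;
    // 500 ms, 1 s, 2 s, ... doubling per attempt, plus a little jitter.
    const delay = 500 * 2 ** attempt + Math.random() * 100;
    await new Promise((resolve) => setTimeout(resolve, delay));
  }
}
```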
package/package.json CHANGED
@@ -1,7 +1,7 @@
 {
   "name": "@webmcp-auto-ui/agent",
-  "version": "2.5.12",
-  "description": "LLM agent loop + Anthropic/Gemma LiteRT providers + MCP wrapper",
+  "version": "2.5.15",
+  "description": "LLM agent loop + remote/WASM/local providers + MCP wrapper",
   "license": "AGPL-3.0-or-later",
   "type": "module",
   "sideEffects": true,
@@ -11,7 +11,7 @@
       "import": "./src/index.ts"
     },
     "./server": {
-      "import": "./src/server/anthropicProxy.ts"
+      "import": "./src/server/llmProxy.ts"
     }
   },
   "scripts": {
package/src/server/llmProxy.ts CHANGED
@@ -1,9 +1,9 @@
 /**
- * Shared Anthropic proxy handler — used by all apps' /api/chat/+server.ts
+ * Shared LLM proxy handler — used by all apps' /api/chat/+server.ts
  * Accepts the parsed body (with __apiKey already extracted), the resolved
  * API key, and the optional model override from the X-Model header.
  */
-export async function anthropicProxy(
+export async function llmProxy(
   body: Record<string, unknown>,
   apiKey: string,
   model?: string | null,
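
Given the `llmProxy` signature above and the `./server` export in package.json, an app's endpoint would presumably wire it up roughly as follows. This is a hypothetical sketch: the handler's return type is not visible in this diff, so a `Response` is assumed.

```ts
// Hypothetical wiring sketch, based only on the signature shown above.
// src/routes/api/chat/+server.ts
import { env } from '$env/dynamic/private';
import { llmProxy } from '@webmcp-auto-ui/agent/server';
import type { RequestHandler } from './$types';

export const POST: RequestHandler = async ({ request }) => {
  const body = (await request.json()) as Record<string, unknown>;
  const apiKey = (body.__apiKey as string | undefined) ?? env.LLM_API_KEY;
  delete body.__apiKey; // never forward the key inside the body
  if (!apiKey) return new Response('Missing API key', { status: 401 });
  const model = request.headers.get('X-Model'); // optional model override
  return llmProxy(body, apiKey, model); // assumed to resolve to a Response
};
```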