@blockrun/llm 1.8.0 → 1.10.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +23 -5
- package/dist/index.cjs +1 -1
- package/dist/index.js +1 -1
- package/package.json +1 -1
package/README.md
CHANGED
|
@@ -103,7 +103,7 @@ const client = new LLMClient();
|
|
|
103
103
|
// Auto-routes to cheapest capable model
|
|
104
104
|
const result = await client.smartChat('What is 2+2?');
|
|
105
105
|
console.log(result.response); // '4'
|
|
106
|
-
console.log(result.model); // '
|
|
106
|
+
console.log(result.model); // 'moonshot/kimi-k2.5' (cheap, fast)
|
|
107
107
|
console.log(`Saved ${(result.routing.savings * 100).toFixed(0)}%`); // 'Saved 78%'
|
|
108
108
|
|
|
109
109
|
// Complex reasoning task -> routes to reasoning model
|
|
@@ -144,7 +144,7 @@ The classifier runs in <1ms, 100% locally, and routes to one of four tiers:
|
|
|
144
144
|
|
|
145
145
|
| Tier | Example Tasks | Auto Profile Model |
|
|
146
146
|
|------|---------------|-------------------|
|
|
147
|
-
| SIMPLE | "What is 2+2?", definitions |
|
|
147
|
+
| SIMPLE | "What is 2+2?", definitions | moonshot/kimi-k2.5 |
|
|
148
148
|
| MEDIUM | Code snippets, explanations | xai/grok-code-fast-1 |
|
|
149
149
|
| COMPLEX | Architecture, long documents | google/gemini-3.1-pro |
|
|
150
150
|
| REASONING | Proofs, multi-step reasoning | xai/grok-4-1-fast-reasoning |
|
|
@@ -236,11 +236,23 @@ The classifier runs in <1ms, 100% locally, and routes to one of four tiers:
|
|
|
236
236
|
| `minimax/minimax-m2.7` | $0.30/M | $1.20/M |
|
|
237
237
|
| `minimax/minimax-m2.5` | $0.30/M | $1.20/M |
|
|
238
238
|
|
|
239
|
-
### NVIDIA (Free
|
|
239
|
+
### NVIDIA (Free) + Moonshot
|
|
240
|
+
|
|
241
|
+
Free tier refreshed 2026-04-21: retired the Nemotron family, `mistral-large-3-675b`,
|
|
242
|
+
`devstral-2-123b`, and paid `nvidia/kimi-k2.5`. The backend auto-redirects the
|
|
243
|
+
old IDs; the recommended replacements are listed below.
|
|
244
|
+
|
|
240
245
|
| Model | Input Price | Output Price | Notes |
|
|
241
246
|
|-------|-------------|--------------|-------|
|
|
242
|
-
| `nvidia/
|
|
243
|
-
| `nvidia/
|
|
247
|
+
| `nvidia/qwen3-next-80b-a3b-thinking` | **FREE** | **FREE** | Reasoning flagship — 116 tok/s, thinking mode |
|
|
248
|
+
| `nvidia/mistral-small-4-119b` | **FREE** | **FREE** | Fastest free chat — 114 tok/s |
|
|
249
|
+
| `nvidia/glm-4.7` | **FREE** | **FREE** | GLM-4.7 with thinking — 237 tok/s |
|
|
250
|
+
| `nvidia/llama-4-maverick` | **FREE** | **FREE** | Llama 4 Maverick MoE |
|
|
251
|
+
| `nvidia/qwen3-coder-480b` | **FREE** | **FREE** | Coding-optimised 480B MoE |
|
|
252
|
+
| `nvidia/deepseek-v3.2` | **FREE** | **FREE** | DeepSeek V3.2 hosted |
|
|
253
|
+
| `nvidia/gpt-oss-120b` | **FREE** | **FREE** | OpenAI open-weight 120B — 123 tok/s |
|
|
254
|
+
| `nvidia/gpt-oss-20b` | **FREE** | **FREE** | OpenAI open-weight 20B — 155 tok/s |
|
|
255
|
+
| `moonshot/kimi-k2.5` | $0.60/M | $3.00/M | Direct from Moonshot — replaces `nvidia/kimi-k2.5` |
|
|
244
256
|
|
|
245
257
|
### E2E Verified Models
|
|
246
258
|
|
|
@@ -262,6 +274,7 @@ All models below have been tested end-to-end via the TypeScript SDK (Feb 2026):
|
|
|
262
274
|
|-------|-------|
|
|
263
275
|
| `openai/dall-e-3` | $0.04-0.08/image |
|
|
264
276
|
| `openai/gpt-image-1` | $0.02-0.04/image |
|
|
277
|
+
| `openai/gpt-image-2` | $0.06-0.12/image (reasoning-driven, multilingual text rendering, character consistency) |
|
|
265
278
|
| `google/nano-banana` | $0.05/image |
|
|
266
279
|
| `google/nano-banana-pro` | $0.10-0.15/image |
|
|
267
280
|
| `black-forest/flux-1.1-pro` | $0.04/image |
|
|
@@ -269,10 +282,15 @@ All models below have been tested end-to-end via the TypeScript SDK (Feb 2026):
|
|
|
269
282
|
| `xai/grok-imagine-image-pro` | $0.07/image |
|
|
270
283
|
| `zai/cogview-4` | $0.015/image |
|
|
271
284
|
|
|
285
|
+
Image editing (`client.edit`): `openai/gpt-image-1` and `openai/gpt-image-2` both support the `/v1/images/image2image` endpoint.
|
|
286
|
+
|
|
272
287
|
### Video Generation
|
|
273
288
|
| Model | Price |
|
|
274
289
|
|-------|-------|
|
|
275
290
|
| `xai/grok-imagine-video` | $0.05/sec (8s default → $0.40/clip) |
|
|
291
|
+
| `bytedance/seedance-1.5-pro` | $0.03/sec (5s default, up to 10s, 720p) |
|
|
292
|
+
| `bytedance/seedance-2.0-fast` | $0.15/sec (~60-80s gen, sweet-spot price/quality) |
|
|
293
|
+
| `bytedance/seedance-2.0` | $0.30/sec (720p Pro) |
|
|
276
294
|
|
|
277
295
|
```ts
|
|
278
296
|
import { VideoClient } from '@blockrun/llm';
|
package/dist/index.cjs
CHANGED
|
@@ -1685,7 +1685,7 @@ var import_accounts3 = require("viem/accounts");
|
|
|
1685
1685
|
var DEFAULT_API_URL2 = "https://blockrun.ai/api";
|
|
1686
1686
|
var DEFAULT_MODEL = "google/nano-banana";
|
|
1687
1687
|
var DEFAULT_SIZE = "1024x1024";
|
|
1688
|
-
var DEFAULT_TIMEOUT2 =
|
|
1688
|
+
var DEFAULT_TIMEOUT2 = 2e5;
|
|
1689
1689
|
var ImageClient = class {
|
|
1690
1690
|
account;
|
|
1691
1691
|
privateKey;
|
package/dist/index.js
CHANGED
|
@@ -1596,7 +1596,7 @@ import { privateKeyToAccount as privateKeyToAccount2 } from "viem/accounts";
|
|
|
1596
1596
|
var DEFAULT_API_URL2 = "https://blockrun.ai/api";
|
|
1597
1597
|
var DEFAULT_MODEL = "google/nano-banana";
|
|
1598
1598
|
var DEFAULT_SIZE = "1024x1024";
|
|
1599
|
-
var DEFAULT_TIMEOUT2 =
|
|
1599
|
+
var DEFAULT_TIMEOUT2 = 2e5;
|
|
1600
1600
|
var ImageClient = class {
|
|
1601
1601
|
account;
|
|
1602
1602
|
privateKey;
|