npm - @blockrun/mcp - Versions diffs - 0.7.0 → 0.7.1 - Mend

@blockrun/mcp 0.7.0 → 0.7.1

This diff shows the changes between two publicly available package versions as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents as they appear in their respective public registries.

Files changed (2)

package/dist/index.js +7 -175
package/package.json +1 -1

package/dist/index.js CHANGED

@@ -590,18 +590,22 @@ function registerImageTool(server) {
   server.registerTool(
     "blockrun_image",
     {
-      description: `Generate or edit images via BlockRun.
+      description: `Generate or edit images via BlockRun. Pays with USDC \u2014 no separate API keys needed.
 Actions:
 - generate (default): Create image from text prompt
 - edit: Transform an existing image using img2img
-Generation models: openai/dall-e-3 ($0.04-0.08), together/flux-schnell ($0.02), google/nano-banana
+Generation models:
+- zai/cogview-4 ($0.02) \u2014 Zhipu CogView-4, photorealistic, great for detailed scenes
+- openai/dall-e-3 ($0.04-0.08) \u2014 High quality, prompt adherence
+- together/flux-schnell ($0.02) \u2014 Fast, stylized
+- google/nano-banana \u2014 Google image model
 Edit models: openai/gpt-image-1 (default for edits)`,
       inputSchema: {
         prompt: z4.string().describe("Image description or edit instructions"),
         action: z4.enum(["generate", "edit"]).optional().default("generate").describe("generate: create from text; edit: transform existing image"),
-        model: z4.enum(["openai/dall-e-3", "together/flux-schnell", "google/nano-banana", "openai/gpt-image-1"]).optional().describe("Model to use (default: dall-e-3 for generate, gpt-image-1 for edit)"),
+        model: z4.enum(["zai/cogview-4", "openai/dall-e-3", "together/flux-schnell", "google/nano-banana", "openai/gpt-image-1"]).optional().describe("Model to use (default: dall-e-3 for generate, gpt-image-1 for edit). zai/cogview-4 is Zhipu's photorealistic model."),
         image: z4.string().optional().describe("Source image for edit action: base64-encoded image or URL"),
         size: z4.enum(["1024x1024", "1792x1024", "1024x1792"]).optional().default("1024x1024"),
         quality: z4.enum(["standard", "hd"]).optional().default("standard")
@@ -1038,175 +1042,6 @@ ${lines.join("\n\n")}` }],
   );
 }
-// src/tools/glm-vision.ts
-import { z as z10 } from "zod";
-var ZHIPU_BASE_URL = "https://open.bigmodel.cn/api/paas/v4";
-async function callGLMVision(model, prompt, imageUrl, thinking = false) {
-  const apiKey = process.env.ZHIPU_API_KEY;
-  if (!apiKey) throw new Error("ZHIPU_API_KEY environment variable is required for GLM Vision");
-  const payload = {
-    model,
-    messages: [
-      {
-        role: "user",
-        content: [
-          { type: "image_url", image_url: { url: imageUrl } },
-          { type: "text", text: prompt }
-        ]
-      }
-    ],
-    temperature: 0.8,
-    top_p: 0.6,
-    max_tokens: 16384,
-    stream: false
-  };
-  if (thinking || model.includes("thinking")) {
-    payload["thinking"] = { type: "enabled" };
-  }
-  const res = await fetch(`${ZHIPU_BASE_URL}/chat/completions`, {
-    method: "POST",
-    headers: {
-      "Content-Type": "application/json",
-      Authorization: `Bearer ${apiKey}`
-    },
-    body: JSON.stringify(payload)
-  });
-  if (!res.ok) {
-    const err = await res.text().catch(() => res.statusText);
-    throw new Error(`GLM Vision API error ${res.status}: ${err}`);
-  }
-  const data = await res.json();
-  const choice = data.choices?.[0];
-  if (!choice) throw new Error("No response from GLM Vision");
-  if (choice.finish_reason === "sensitive") throw new Error("Content blocked by safety filter");
-  return choice.message.content;
-}
-async function callGLMOCR(fileUrl, startPage = 1, endPage) {
-  const apiKey = process.env.ZHIPU_API_KEY;
-  if (!apiKey) throw new Error("ZHIPU_API_KEY environment variable is required for GLM OCR");
-  const payload = {
-    model: "glm-ocr",
-    file: fileUrl,
-    return_crop_images: false,
-    need_layout_visualization: false,
-    start_page_id: startPage
-  };
-  if (endPage) payload["end_page_id"] = endPage;
-  const res = await fetch(`${ZHIPU_BASE_URL}/layout_parsing`, {
-    method: "POST",
-    headers: {
-      "Content-Type": "application/json",
-      Authorization: `Bearer ${apiKey}`
-    },
-    body: JSON.stringify(payload)
-  });
-  if (!res.ok) {
-    const err = await res.text().catch(() => res.statusText);
-    throw new Error(`GLM OCR API error ${res.status}: ${err}`);
-  }
-  const data = await res.json();
-  return data.markdown_result || data.choices?.[0]?.message?.content || JSON.stringify(data);
-}
-async function callGLMImageGen(prompt, size, quality) {
-  const apiKey = process.env.ZHIPU_API_KEY;
-  if (!apiKey) throw new Error("ZHIPU_API_KEY environment variable is required for GLM Image Gen");
-  const res = await fetch(`${ZHIPU_BASE_URL}/images/generations`, {
-    method: "POST",
-    headers: {
-      "Content-Type": "application/json",
-      Authorization: `Bearer ${apiKey}`
-    },
-    body: JSON.stringify({
-      model: "cogview-4-250304",
-      prompt,
-      size,
-      quality,
-      watermark_enabled: false
-    })
-  });
-  if (!res.ok) {
-    const err = await res.text().catch(() => res.statusText);
-    throw new Error(`GLM Image API error ${res.status}: ${err}`);
-  }
-  const data = await res.json();
-  const url = data.data?.[0]?.url;
-  if (!url) throw new Error("No image URL in GLM response");
-  return url;
-}
-function registerGLMVisionTool(server) {
-  server.registerTool(
-    "blockrun_glm_vision",
-    {
-      description: `Analyze images and documents using Zhipu AI's GLM vision models.
-Requires ZHIPU_API_KEY environment variable.
-Actions:
-- caption: Describe what's in an image
-- analyze: Deep analysis of an image (objects, layout, text, colors)
-- grounding: Locate specific elements in an image (returns bounding boxes)
-- code: Generate code from a UI screenshot or mockup
-- ocr: Extract text from a document/PDF (use file URL)
-- imagegen: Generate an image using CogView-4
-Models:
-- glm-4.6v (default): Best quality vision model
-- glm-4.6v-flash: Faster, cheaper
-- glm-4.1v-thinking-flash: With reasoning/thinking
-Cost: Zhipu AI pricing (separate from BlockRun x402 \u2014 uses ZHIPU_API_KEY)`,
-      inputSchema: {
-        action: z10.enum(["caption", "analyze", "grounding", "code", "ocr", "imagegen"]).describe("Task to perform"),
-        image: z10.string().optional().describe("Image URL or base64 data URI (for vision actions)"),
-        prompt: z10.string().optional().describe("Custom prompt or question about the image. For imagegen: the image description"),
-        model: z10.enum(["glm-4.6v", "glm-4.6v-flash", "glm-4.1v-thinking-flash"]).optional().default("glm-4.6v").describe("Vision model to use"),
-        size: z10.enum(["1280x1280", "1280x720", "720x1280", "1024x1024"]).optional().default("1280x1280").describe("Image size (for imagegen)"),
-        quality: z10.enum(["hd", "standard"]).optional().default("hd").describe("Image quality (for imagegen)"),
-        start_page: z10.number().optional().default(1).describe("Start page for OCR (PDF)"),
-        end_page: z10.number().optional().describe("End page for OCR (PDF)")
-      }
-    },
-    async ({ action, image, prompt, model, size, quality, start_page, end_page }) => {
-      try {
-        if (action === "imagegen") {
-          const imagePrompt = prompt || image || "";
-          if (!imagePrompt) {
-            return { content: [{ type: "text", text: formatError("prompt is required for imagegen action") }], isError: true };
-          }
-          const url = await callGLMImageGen(imagePrompt, size ?? "1280x1280", quality ?? "hd");
-          return {
-            content: [{ type: "text", text: `Generated image: ${url}` }],
-            structuredContent: { url }
-          };
-        }
-        if (action === "ocr") {
-          const fileUrl = image || prompt;
-          if (!fileUrl) {
-            return { content: [{ type: "text", text: formatError("image (PDF URL) is required for OCR") }], isError: true };
-          }
-          const result2 = await callGLMOCR(fileUrl, start_page ?? 1, end_page);
-          return { content: [{ type: "text", text: result2 }] };
-        }
-        if (!image) {
-          return { content: [{ type: "text", text: formatError("image is required for vision actions") }], isError: true };
-        }
-        const actionPrompts = {
-          caption: "Describe this image concisely and accurately.",
-          analyze: "Analyze this image in detail: describe all visible objects, layout, colors, text, and any notable features.",
-          grounding: `Locate the following elements in the image and return their bounding boxes in [x1,y1,x2,y2] format (0-1000 normalized): ${prompt || "all interactive UI elements"}`,
-          code: "Generate complete, working code to replicate this UI. Use React + TypeScript + Tailwind CSS. Include all components, styling, and mock data visible in the screenshot."
-        };
-        const visionPrompt = actionPrompts[action] || prompt || actionPrompts.caption;
-        const result = await callGLMVision(model ?? "glm-4.6v", visionPrompt, image);
-        return { content: [{ type: "text", text: result }] };
-      } catch (err) {
-        const errMsg = err instanceof Error ? err.message : String(err);
-        return { content: [{ type: "text", text: formatError(errMsg) }], isError: true };
-      }
-    }
-  );
-}
 // src/mcp-handler.ts
 function initializeMcpServer(server) {
   const budget = { limit: null, spent: 0, calls: 0, agents: /* @__PURE__ */ new Map() };
@@ -1220,9 +1055,6 @@ function initializeMcpServer(server) {
   registerExaTool(server);
   registerMarketsTool(server);
   registerDexTool(server);
-  if (process.env.ZHIPU_API_KEY) {
-    registerGLMVisionTool(server);
-  }
   server.registerResource(
     "wallet",
     "blockrun://wallet",

package/package.json CHANGED

@@ -1,6 +1,6 @@
 {
   "name": "@blockrun/mcp",
-  "version": "0.7.0",
+  "version": "0.7.1",
   "mcpName": "io.github.BlockRunAI/blockrun-mcp",
   "description": "BlockRun MCP Server - Give your AI agent web search, deep research, prediction markets, crypto data, X/Twitter intelligence. Paid via x402 micropayments.",
   "type": "module",