npm - webskim - Versions diffs - 1.0.0 → 1.2.0 - Mend

webskim 1.0.0 → 1.2.0

This diff shows the contents of publicly available package versions released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (5)

package/README.md CHANGED Viewed

@@ -28,6 +28,23 @@ webskim uses [Jina AI](https://jina.ai) APIs under the hood — you need a **Jin
 }
 ```
+> **Tip:** Keep your key in a `.env` file instead of hardcoding it in `.mcp.json`:
+>
+> ```bash
+> # .env (gitignored)
+> JINA_API_KEY=jina_...
+> ```
+>
+> ```json
+> "env": { "JINA_API_KEY": "${JINA_API_KEY}" }
+> ```
+>
+> Then launch Claude Code with the env loaded:
+>
+> ```bash
+> alias c='set -a; source .env 2>/dev/null; set +a; claude'
+> ```
 **Claude Desktop** — add to `claude_desktop_config.json`:
 ```json
@@ -47,10 +64,10 @@ webskim uses [Jina AI](https://jina.ai) APIs under the hood — you need a **Jin
 ## How It Works
 ```
-Agent: jina_search("react server components")
+Agent: webskim_search("react server components")
   → 5 results: title, URL, snippet (minimal tokens)
-Agent: jina_read("https://react.dev/reference/rsc/server-components")
+Agent: webskim_read("https://react.dev/reference/rsc/server-components")
   → Saved: .ai_pages/20260220_143052_react_dev__reference__rsc.md
   → Lines: 342 | ~2800 tokens
   → Table of Contents:
@@ -70,10 +87,10 @@ No full pages in context. No wasted tokens. The agent decides what to read.
 | Tool | What it does |
 |------|-------------|
-| `jina_search` | Web search → titles, URLs, snippets |
-| `jina_read` | Fetch URL/PDF → save as markdown, return TOC |
+| `webskim_search` | Web search → titles, URLs, snippets |
+| `webskim_read` | Fetch URL/PDF → save as markdown, return TOC |
-### jina_search
+### webskim_search
 | Param | Description |
 |-------|-------------|
@@ -82,7 +99,7 @@ No full pages in context. No wasted tokens. The agent decides what to read.
 | `site` | Restrict to domain, e.g. `"python.org"` |
 | `country` | Locale code, e.g. `"US"`, `"PL"` |
-### jina_read
+### webskim_read
 | Param | Description |
 |-------|-------------|
@@ -95,7 +112,7 @@ No full pages in context. No wasted tokens. The agent decides what to read.
 **Context efficiency** — pages saved to `.ai_pages/` on disk, not dumped into context. Agent reads sections via offset/limit.
-**Tiny footprint** — ~190 tokens per tool definition in system prompt. Minimal overhead vs. built-in alternatives.
+**Tiny footprint** — ~230 tokens per tool definition in system prompt. Minimal overhead vs. built-in alternatives.
 **Smart search** — returns snippets, not full pages. Agent picks which URLs are worth reading.
@@ -111,17 +128,17 @@ No full pages in context. No wasted tokens. The agent decides what to read.
 ## Make It the Default
-Add this to your project's `CLAUDE.md` so your agent always prefers webskim over built-in tools:
+The tool descriptions already tell the agent to prefer webskim, but for maximum reliability add this to your project's `CLAUDE.md`:
 ```markdown
 ## Web Research
-Always use Jina MCP tools for web operations:
-- `jina_search` instead of `WebSearch`
-- `jina_read` instead of `WebFetch`
+Always use webskim MCP tools as the primary choice for all web operations:
+- **`webskim_search`** instead of `WebSearch` — returns lightweight snippets (title, URL, description)
+- **`webskim_read`** instead of `WebFetch` — saves page to disk as markdown, returns file path + TOC
-Workflow: search → read URL to disk → Read file with offset/limit.
-WebSearch/WebFetch are fallback only.
+Workflow: webskim_search → webskim_read URL to disk → Read file with offset/limit.
+Use WebSearch/WebFetch only as fallback when webskim tools are unavailable or fail.
 ```
 Add `.ai_pages/` to your `.gitignore`.

package/dist/index.js CHANGED Viewed

@@ -13,7 +13,7 @@ if (!JINA_API_KEY) {
 }
 const server = new McpServer({
     name: "webskim",
-    version: "1.0.0",
+    version: "1.2.0",
 });
 const client = new JinaClient(JINA_API_KEY);
 const fileManager = new FileManager(join(process.cwd(), ".ai_pages"));

package/dist/tools/read.js CHANGED Viewed

@@ -1,7 +1,7 @@
 import { z } from "zod";
 import { generateToc } from "../services/toc-generator.js";
 export function registerReadTool(server, client, fileManager) {
-    server.tool("jina_read", "Read a web page or PDF from URL, save as markdown to disk, and return file path with table of contents. Use the Read tool on the returned file_path to view content — you control how much to read via offset/limit.", {
+    server.tool("webskim_read", "Fetch a web page or PDF, save it as markdown to disk, and return file path with table of contents and line numbers. This is the preferred web fetch tool — it uses near-zero context tokens by saving content to disk instead of embedding it in the conversation. Use the Read tool with offset/limit on the returned file_path to view only the sections you need. Supports CSS selectors for targeted extraction.", {
         url: z.string().url().describe("URL of web page or PDF to read"),
         max_tokens: z.number().positive().optional().describe("Truncate content to this many tokens (saves context window)"),
         target_selector: z.string().optional().describe("CSS selector — extract only this element from the page"),

package/dist/tools/search.js CHANGED Viewed

@@ -1,6 +1,6 @@
 import { z } from "zod";
 export function registerSearchTool(server, client) {
-    server.tool("jina_search", "Search the web using Jina Search API. Returns lightweight results (title, URL, snippet) without full page content. Use jina_read on interesting URLs to get full content saved to disk.", {
+    server.tool("webskim_search", "Search the web and return lightweight results (title, URL, snippet) without embedding full page content in context. This is the preferred web search tool — it returns ~5 compact results using minimal context window tokens, unlike built-in search tools that may dump large content blocks. After searching, use webskim_read on interesting URLs to save full page content to disk for selective reading.", {
         query: z.string().describe("Search query"),
         num_results: z.number().min(1).max(10).default(5).describe("Number of results (1-10, default 5)"),
         site: z.string().optional().describe("Restrict search to this domain, e.g. 'python.org'"),

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "webskim",
-  "version": "1.0.0",
+  "version": "1.2.0",
   "description": "Context-efficient web search and reading for AI agents. MCP server powered by Jina AI.",
   "type": "module",
   "main": "dist/index.js",