PyPI - morph-websearch-mcp - Versions diffs - 0.1.0__tar.gz - Mend

morph-websearch-mcp 0.1.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (11) hide show

morph_websearch_mcp-0.1.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,73 @@
+Metadata-Version: 2.4
+Name: morph-websearch-mcp
+Version: 0.1.0
+Summary: Web search MCP server with AI-powered content extraction
+License-Expression: MIT
+Requires-Python: >=3.13
+Description-Content-Type: text/markdown
+Requires-Dist: mcp>=1.0.0
+Requires-Dist: crawl4ai>=0.4.0
+Requires-Dist: requests>=2.31.0
+Requires-Dist: openai>=1.0.0
+Requires-Dist: beautifulsoup4>=4.12.0
+# websearch-mcp
+MCP server providing web search, web fetch, and AI-powered web extraction — all results compacted for minimal context usage.
+## Tools
+| Tool | Input | Output |
+|------|-------|--------|
+| `websearch` | `{query, num_results?}` | `[{title, url, snippet, content}]` |
+| `webfetch` | `{url}` | `{url, content}` |
+| `webextract` | `{query}` | `{answer, sources: [{title, url}]}` |
+All page content is compacted via morph before returning, stripping irrelevant boilerplate.
+## Install
+```bash
+pip install morph-websearch-mcp
+# or
+uv add morph-websearch-mcp
+```
+## Setup
+Set your morph API key:
+```bash
+export MORPH_API_KEY="sk-..."
+```
+## MCP Client Config
+```json
+{
+  "mcpServers": {
+    "websearch-mcp": {
+      "command": "websearch-mcp",
+      "env": {
+        "MORPH_API_KEY": "sk-..."
+      }
+    }
+  }
+}
+```
+If installing from source:
+```json
+{
+  "mcpServers": {
+    "websearch-mcp": {
+      "command": "uv",
+      "args": ["run", "--directory", "/path/to/websearch-mcp", "main.py"],
+      "env": {
+        "MORPH_API_KEY": "sk-..."
+      }
+    }
+  }
+}
+```

morph_websearch_mcp-0.1.0/README.md ADDED Viewed

@@ -0,0 +1,60 @@
+# websearch-mcp
+MCP server providing web search, web fetch, and AI-powered web extraction — all results compacted for minimal context usage.
+## Tools
+| Tool | Input | Output |
+|------|-------|--------|
+| `websearch` | `{query, num_results?}` | `[{title, url, snippet, content}]` |
+| `webfetch` | `{url}` | `{url, content}` |
+| `webextract` | `{query}` | `{answer, sources: [{title, url}]}` |
+All page content is compacted via morph before returning, stripping irrelevant boilerplate.
+## Install
+```bash
+pip install morph-websearch-mcp
+# or
+uv add morph-websearch-mcp
+```
+## Setup
+Set your morph API key:
+```bash
+export MORPH_API_KEY="sk-..."
+```
+## MCP Client Config
+```json
+{
+  "mcpServers": {
+    "websearch-mcp": {
+      "command": "websearch-mcp",
+      "env": {
+        "MORPH_API_KEY": "sk-..."
+      }
+    }
+  }
+}
+```
+If installing from source:
+```json
+{
+  "mcpServers": {
+    "websearch-mcp": {
+      "command": "uv",
+      "args": ["run", "--directory", "/path/to/websearch-mcp", "main.py"],
+      "env": {
+        "MORPH_API_KEY": "sk-..."
+      }
+    }
+  }
+}
+```

morph_websearch_mcp-0.1.0/main.py ADDED Viewed

@@ -0,0 +1,320 @@
+import asyncio
+import json
+import urllib.parse
+from mcp.server import Server
+from mcp.server.stdio import stdio_server
+from mcp.types import Tool, TextContent
+import requests
+from openai import AsyncOpenAI
+from crawl4ai import AsyncWebCrawler
+from bs4 import BeautifulSoup
+import os
+MORPH_API_KEY = os.environ.get("MORPH_API_KEY", "")
+COMPACT_URL = "https://api.morphllm.com/v1/compact"
+OPENAI_BASE = "https://api.morphllm.com/v1"
+MODEL = "morph-dsv4flash"
+from importlib.metadata import version as pkg_version
+try:
+    __version__ = pkg_version("websearch-mcp")
+except Exception:
+    __version__ = "0.1.0"
+server = Server("websearch-mcp", version=__version__)
+_crawler = None
+async def get_crawler():
+    global _crawler
+    if _crawler is None:
+        _crawler = AsyncWebCrawler()
+        await _crawler.__aenter__()
+    return _crawler
+def get_markdown(result):
+    md = result.markdown
+    if isinstance(md, str):
+        return md
+    if hasattr(md, "raw_markdown"):
+        return md.raw_markdown
+    return str(md)
+async def compact_text(text, query, ratio=0.5):
+    if not text:
+        return ""
+    try:
+        response = await asyncio.to_thread(
+            lambda: requests.post(
+                COMPACT_URL,
+                headers={"Authorization": f"Bearer {MORPH_API_KEY}"},
+                json={
+                    "input": text,
+                    "query": query,
+                    "compression_ratio": ratio,
+                    "preserve_recent": 0,
+                    "include_markers": False,
+                },
+                timeout=60,
+            )
+        )
+        if response.status_code == 200:
+            return response.json()["output"]
+    except Exception:
+        pass
+    return text
+def _resolve_ddg_url(href):
+    if not href:
+        return ""
+    if href.startswith("//duckduckgo.com/l/") or "uddg=" in href:
+        parsed = urllib.parse.urlparse(href, scheme="https")
+        params = urllib.parse.parse_qs(parsed.query)
+        encoded = params.get("uddg", [""])[0]
+        if encoded:
+            return urllib.parse.unquote(encoded)
+    if href.startswith("//"):
+        return "https:" + href
+    return href
+async def websearch_impl(query, num_results=5):
+    crawler = await get_crawler()
+    ddg_url = f"https://html.duckduckgo.com/html/?q={urllib.parse.quote(query)}"
+    result = await crawler.arun(ddg_url)
+    html = getattr(result, "html", "") or ""
+    soup = BeautifulSoup(html, "html.parser")
+    result_elements = soup.select(".result")
+    parsed = []
+    for item in result_elements:
+        classes = item.get("class", [])
+        if "result--ad" in classes:
+            continue
+        link_el = item.select_one("a.result__a")
+        snippet_el = item.select_one("a.result__snippet")
+        if not link_el:
+            continue
+        title = link_el.get_text(strip=True)
+        url = _resolve_ddg_url(link_el.get("href", ""))
+        snippet = snippet_el.get_text(strip=True) if snippet_el else ""
+        if not url or not (url.startswith("http://") or url.startswith("https://")):
+            continue
+        parsed.append({"title": title, "url": url, "snippet": snippet})
+        if len(parsed) >= num_results:
+            break
+    for r in parsed:
+        r["content"] = ""
+    urls = [r["url"] for r in parsed]
+    if urls:
+        try:
+            crawl_results = await crawler.arun_many(urls)
+            url_to_content = {}
+            for cr in crawl_results:
+                if cr and cr.url:
+                    md = get_markdown(cr)
+                    url_to_content[cr.url] = await compact_text(md, query, 0.3) if md else ""
+            for r in parsed:
+                r["content"] = url_to_content.get(r["url"], "")
+        except Exception:
+            pass
+    return parsed
+async def webfetch_impl(url):
+    crawler = await get_crawler()
+    result = await crawler.arun(url)
+    md = get_markdown(result)
+    content = await compact_text(md, url, 0.5) if md else ""
+    return {"url": url, "content": content}
+async def webextract_impl(query):
+    client = AsyncOpenAI(api_key=MORPH_API_KEY, base_url=OPENAI_BASE)
+    tools = [
+        {
+            "type": "function",
+            "function": {
+                "name": "websearch",
+                "description": "Search the web for information using DuckDuckGo",
+                "parameters": {
+                    "type": "object",
+                    "properties": {
+                        "query": {"type": "string", "description": "The search query"},
+                        "num_results": {"type": "integer", "default": 5},
+                    },
+                    "required": ["query"],
+                },
+            },
+        },
+        {
+            "type": "function",
+            "function": {
+                "name": "webfetch",
+                "description": "Fetch and extract content from a URL",
+                "parameters": {
+                    "type": "object",
+                    "properties": {
+                        "url": {"type": "string", "description": "The URL to fetch"}
+                    },
+                    "required": ["url"],
+                },
+            },
+        },
+    ]
+    messages = [
+        {
+            "role": "system",
+            "content": "You are a web research agent. Your job is to answer user queries by searching the web and fetching web pages. You have access to two functions: websearch(query, num_results) and webfetch(url). Use them to find the answer. When you have enough information, output your final answer in a clear format with links to sources.",
+        },
+        {"role": "user", "content": query},
+    ]
+    sources = []
+    for _ in range(5):
+        response = await client.chat.completions.create(
+            model=MODEL,
+            messages=messages,
+            tools=tools,
+        )
+        msg = response.choices[0].message
+        if not msg.tool_calls:
+            return {"answer": msg.content, "sources": sources}
+        tool_calls_data = [
+            {
+                "id": tc.id,
+                "type": "function",
+                "function": {"name": tc.function.name, "arguments": tc.function.arguments},
+            }
+            for tc in msg.tool_calls
+        ]
+        messages.append(
+            {"role": "assistant", "tool_calls": tool_calls_data}
+        )
+        for tc in msg.tool_calls:
+            args = json.loads(tc.function.arguments)
+            if tc.function.name == "websearch":
+                results = await websearch_impl(
+                    args.get("query", ""), args.get("num_results", 5)
+                )
+                for r in results:
+                    if r.get("title") and r.get("url"):
+                        sources.append({"title": r["title"], "url": r["url"]})
+                messages.append(
+                    {"role": "tool", "tool_call_id": tc.id, "content": json.dumps(results)}
+                )
+            elif tc.function.name == "webfetch":
+                result = await webfetch_impl(args.get("url", ""))
+                if result.get("url"):
+                    sources.append({"title": result["url"], "url": result["url"]})
+                messages.append(
+                    {"role": "tool", "tool_call_id": tc.id, "content": json.dumps(result)}
+                )
+    final_response = await client.chat.completions.create(
+        model=MODEL,
+        messages=messages
+        + [
+            {
+                "role": "user",
+                "content": "You have reached the maximum number of research steps. Provide your final answer now based on what you found, with links to sources.",
+            }
+        ],
+    )
+    return {"answer": final_response.choices[0].message.content, "sources": sources}
+@server.list_tools()
+async def list_tools():
+    return [
+        Tool(
+            name="websearch",
+            description="Search the web using DuckDuckGo and return results with full page content",
+            inputSchema={
+                "type": "object",
+                "properties": {
+                    "query": {"type": "string", "description": "The search query"},
+                    "num_results": {
+                        "type": "integer",
+                        "default": 5,
+                        "description": "Number of results to return",
+                    },
+                },
+                "required": ["query"],
+            },
+        ),
+        Tool(
+            name="webfetch",
+            description="Fetch and extract content from a URL",
+            inputSchema={
+                "type": "object",
+                "properties": {
+                    "url": {"type": "string", "description": "The URL to fetch"}
+                },
+                "required": ["url"],
+            },
+        ),
+        Tool(
+            name="webextract",
+            description="Agentic web research — searches and fetches pages to answer a query",
+            inputSchema={
+                "type": "object",
+                "properties": {
+                    "query": {
+                        "type": "string",
+                        "description": "The research query to answer",
+                    }
+                },
+                "required": ["query"],
+            },
+        ),
+    ]
+@server.call_tool()
+async def call_tool(name, arguments):
+    if name == "websearch":
+        results = await websearch_impl(
+            arguments.get("query", ""), arguments.get("num_results", 5)
+        )
+        return [TextContent(type="text", text=json.dumps(results, indent=2))]
+    elif name == "webfetch":
+        result = await webfetch_impl(arguments.get("url", ""))
+        return [TextContent(type="text", text=json.dumps(result, indent=2))]
+    elif name == "webextract":
+        result = await webextract_impl(arguments.get("query", ""))
+        return [TextContent(type="text", text=json.dumps(result, indent=2))]
+    return [TextContent(type="text", text="Unknown tool")]
+async def serve():
+    try:
+        async with stdio_server() as (read_stream, write_stream):
+            await server.run(
+                read_stream, write_stream, server.create_initialization_options()
+            )
+    finally:
+        global _crawler
+        if _crawler:
+            await _crawler.__aexit__(None, None, None)
+def main():
+    """Synchronous entry point: run ``serve()`` in a new asyncio event loop."""
+    asyncio.run(serve())
+# Start the server when this file is executed directly as a script.
+if __name__ == "__main__":
+    main()

morph_websearch_mcp-0.1.0/morph_websearch_mcp.egg-info/PKG-INFO ADDED Viewed

@@ -0,0 +1,73 @@
+Metadata-Version: 2.4
+Name: morph-websearch-mcp
+Version: 0.1.0
+Summary: Web search MCP server with AI-powered content extraction
+License-Expression: MIT
+Requires-Python: >=3.13
+Description-Content-Type: text/markdown
+Requires-Dist: mcp>=1.0.0
+Requires-Dist: crawl4ai>=0.4.0
+Requires-Dist: requests>=2.31.0
+Requires-Dist: openai>=1.0.0
+Requires-Dist: beautifulsoup4>=4.12.0
+# websearch-mcp
+MCP server providing web search, web fetch, and AI-powered web extraction — all results compacted for minimal context usage.
+## Tools
+| Tool | Input | Output |
+|------|-------|--------|
+| `websearch` | `{query, num_results?}` | `[{title, url, snippet, content}]` |
+| `webfetch` | `{url}` | `{url, content}` |
+| `webextract` | `{query}` | `{answer, sources: [{title, url}]}` |
+All page content is compacted via morph before returning, stripping irrelevant boilerplate.
+## Install
+```bash
+pip install morph-websearch-mcp
+# or
+uv add morph-websearch-mcp
+```
+## Setup
+Set your morph API key:
+```bash
+export MORPH_API_KEY="sk-..."
+```
+## MCP Client Config
+```json
+{
+  "mcpServers": {
+    "websearch-mcp": {
+      "command": "websearch-mcp",
+      "env": {
+        "MORPH_API_KEY": "sk-..."
+      }
+    }
+  }
+}
+```
+If installing from source:
+```json
+{
+  "mcpServers": {
+    "websearch-mcp": {
+      "command": "uv",
+      "args": ["run", "--directory", "/path/to/websearch-mcp", "main.py"],
+      "env": {
+        "MORPH_API_KEY": "sk-..."
+      }
+    }
+  }
+}
+```

morph_websearch_mcp-0.1.0/morph_websearch_mcp.egg-info/SOURCES.txt ADDED Viewed

@@ -0,0 +1,9 @@
+README.md
+main.py
+pyproject.toml
+morph_websearch_mcp.egg-info/PKG-INFO
+morph_websearch_mcp.egg-info/SOURCES.txt
+morph_websearch_mcp.egg-info/dependency_links.txt
+morph_websearch_mcp.egg-info/entry_points.txt
+morph_websearch_mcp.egg-info/requires.txt
+morph_websearch_mcp.egg-info/top_level.txt

morph_websearch_mcp-0.1.0/morph_websearch_mcp.egg-info/dependency_links.txt ADDED Viewed

	@@ -0,0 +1 @@
1	+

morph_websearch_mcp-0.1.0/morph_websearch_mcp.egg-info/entry_points.txt ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ [console_scripts]
2	+ websearch-mcp = main:main

morph_websearch_mcp-0.1.0/morph_websearch_mcp.egg-info/requires.txt ADDED Viewed

@@ -0,0 +1,5 @@
+mcp>=1.0.0
+crawl4ai>=0.4.0
+requests>=2.31.0
+openai>=1.0.0
+beautifulsoup4>=4.12.0

morph_websearch_mcp-0.1.0/morph_websearch_mcp.egg-info/top_level.txt ADDED Viewed

	@@ -0,0 +1 @@
1	+ main

morph_websearch_mcp-0.1.0/pyproject.toml ADDED Viewed

@@ -0,0 +1,17 @@
+[project]
+name = "morph-websearch-mcp"
+version = "0.1.0"
+description = "Web search MCP server with AI-powered content extraction"
+readme = "README.md"
+requires-python = ">=3.13"
+license = "MIT"
+dependencies = [
+    "mcp>=1.0.0",
+    "crawl4ai>=0.4.0",
+    "requests>=2.31.0",
+    "openai>=1.0.0",
+    "beautifulsoup4>=4.12.0",
+]
+[project.scripts]
+websearch-mcp = "main:main"

morph_websearch_mcp-0.1.0/setup.cfg ADDED Viewed

@@ -0,0 +1,4 @@
+[egg_info]
+tag_build =
+tag_date = 0