PyPI - academia-mcp - Versions diffs - 1.11.3__tar.gz → 1.11.5__tar.gz - Mend

academia-mcp 1.11.3 (tar.gz) → 1.11.5 (tar.gz)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (54) hide show

{academia_mcp-1.11.3 → academia_mcp-1.11.5}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: academia-mcp
-Version: 1.11.3
+Version: 1.11.5
 Summary: MCP server that provides different tools to search for scientific publications
 Author-email: Ilya Gusev <phoenixilya@gmail.com>
 Project-URL: Homepage, https://github.com/IlyaGusev/academia_mcp
@@ -12,16 +12,14 @@ Description-Content-Type: text/markdown
 License-File: LICENSE
 Requires-Dist: mcp>=1.10.1
 Requires-Dist: xmltodict>=0.14.0
-Requires-Dist: types-xmltodict>=0.14.0
 Requires-Dist: requests>=2.32.0
-Requires-Dist: types-requests>=2.32.0
 Requires-Dist: pypdf>=5.1.0
 Requires-Dist: beautifulsoup4>=4.12.0
-Requires-Dist: types-beautifulsoup4>=4.12.0
 Requires-Dist: markdownify==0.14.1
+Requires-Dist: types-xmltodict>=0.14.0
+Requires-Dist: types-requests>=2.32.0
+Requires-Dist: types-beautifulsoup4>=4.12.0
 Requires-Dist: acl-anthology==0.5.2
-Requires-Dist: markdown==3.7.0
-Requires-Dist: types-markdown==3.7.0.20250322
 Requires-Dist: huggingface-hub>=0.32.4
 Requires-Dist: fire>=0.7.0
 Requires-Dist: openai>=1.97.1
@@ -31,6 +29,8 @@ Requires-Dist: pymupdf>=1.26.4
 Requires-Dist: pillow>=11.3.0
 Requires-Dist: pydantic-settings>=2.6.0
 Requires-Dist: youtube-transcript-api>=1.2.2
+Requires-Dist: paddlepaddle>=3.2.0
+Requires-Dist: paddleocr>=3.2.0
 Dynamic: license-file
 # Academia MCP
@@ -70,12 +70,16 @@ make install
 ### Quickstart
 - Run over HTTP (default transport):
 ```bash
+python -m academia_mcp --transport streamable-http
+# OR
 uv run -m academia_mcp --transport streamable-http
 ```
 - Run over stdio (for local MCP clients like Claude Desktop):
 ```bash
 python -m academia_mcp --transport stdio
+# OR
+uv run -m academia_mcp --transport stdio
 ```
 Notes:
@@ -122,7 +126,7 @@ Availability notes:
 - Set one or more of `EXA_API_KEY`, `BRAVE_API_KEY`, `TAVILY_API_KEY` to enable `web_search` and provider tools.
 ### Environment variables
-Set as needed depending on which tools you use:
+Set as needed, depending on which tools you use:
 - `OPENROUTER_API_KEY`: required for LLM-related tools.
 - `BASE_URL`: override OpenRouter base URL.
@@ -152,7 +156,7 @@ docker run --rm -p 5056:5056 \
   academia_mcp
 ```
-Or use existing image: `phoenix120/academia_mcp`
+Or use existing image: [`phoenix120/academia_mcp`](https://hub.docker.com/repository/docker/phoenix120/academia_mcp)
 ### Examples
 - [Comprehensive report screencast (YouTube)](https://www.youtube.com/watch?v=4bweqQcN6w8)

{academia_mcp-1.11.3 → academia_mcp-1.11.5}/README.md RENAMED Viewed

@@ -35,12 +35,16 @@ make install
 ### Quickstart
 - Run over HTTP (default transport):
 ```bash
+python -m academia_mcp --transport streamable-http
+# OR
 uv run -m academia_mcp --transport streamable-http
 ```
 - Run over stdio (for local MCP clients like Claude Desktop):
 ```bash
 python -m academia_mcp --transport stdio
+# OR
+uv run -m academia_mcp --transport stdio
 ```
 Notes:
@@ -87,7 +91,7 @@ Availability notes:
 - Set one or more of `EXA_API_KEY`, `BRAVE_API_KEY`, `TAVILY_API_KEY` to enable `web_search` and provider tools.
 ### Environment variables
-Set as needed depending on which tools you use:
+Set as needed, depending on which tools you use:
 - `OPENROUTER_API_KEY`: required for LLM-related tools.
 - `BASE_URL`: override OpenRouter base URL.
@@ -117,7 +121,7 @@ docker run --rm -p 5056:5056 \
   academia_mcp
 ```
-Or use existing image: `phoenix120/academia_mcp`
+Or use existing image: [`phoenix120/academia_mcp`](https://hub.docker.com/repository/docker/phoenix120/academia_mcp)
 ### Examples
 - [Comprehensive report screencast (YouTube)](https://www.youtube.com/watch?v=4bweqQcN6w8)

{academia_mcp-1.11.3 → academia_mcp-1.11.5}/academia_mcp/server.py RENAMED Viewed

@@ -17,6 +17,7 @@ from academia_mcp.tools.s2 import (
     s2_get_references,
     s2_corpus_id_from_arxiv_id,
     s2_get_info,
+    s2_search,
 )
 from academia_mcp.tools.hf_datasets_search import hf_datasets_search
 from academia_mcp.tools.anthology_search import anthology_search
@@ -40,7 +41,7 @@ from academia_mcp.tools.bitflip import (
     score_research_proposals,
 )
 from academia_mcp.tools.review import review_pdf_paper, download_pdf_paper
-from academia_mcp.tools.show_image import show_image, describe_image
+from academia_mcp.tools.image_processing import show_image, describe_image
 from academia_mcp.tools.speech_to_text import speech_to_text
 from academia_mcp.tools.yt_transcript import yt_transcript
@@ -86,6 +87,7 @@ def create_server(
     server.add_tool(s2_get_citations, structured_output=True)
     server.add_tool(s2_get_references, structured_output=True)
     server.add_tool(s2_get_info, structured_output=True)
+    server.add_tool(s2_search, structured_output=True)
     server.add_tool(s2_corpus_id_from_arxiv_id)
     server.add_tool(hf_datasets_search)
     server.add_tool(anthology_search)

{academia_mcp-1.11.3 → academia_mcp-1.11.5}/academia_mcp/tools/__init__.py RENAMED Viewed

@@ -2,7 +2,13 @@ from .arxiv_search import arxiv_search
 from .anthology_search import anthology_search
 from .arxiv_download import arxiv_download
 from .hf_datasets_search import hf_datasets_search
-from .s2 import s2_get_references, s2_get_citations, s2_corpus_id_from_arxiv_id, s2_get_info
+from .s2 import (
+    s2_get_references,
+    s2_get_citations,
+    s2_corpus_id_from_arxiv_id,
+    s2_get_info,
+    s2_search,
+)
 from .document_qa import document_qa
 from .latex import (
     compile_latex,
@@ -14,7 +20,7 @@ from .web_search import web_search, tavily_web_search, exa_web_search, brave_web
 from .visit_webpage import visit_webpage
 from .bitflip import extract_bitflip_info, generate_research_proposals, score_research_proposals
 from .review import review_pdf_paper, download_pdf_paper, review_pdf_paper_by_url
-from .show_image import show_image, describe_image
+from .image_processing import show_image, describe_image
 from .speech_to_text import speech_to_text
 from .yt_transcript import yt_transcript
@@ -26,6 +32,7 @@ __all__ = [
     "s2_get_citations",
     "s2_corpus_id_from_arxiv_id",
     "s2_get_info",
+    "s2_search",
     "hf_datasets_search",
     "document_qa",
     "compile_latex",

academia_mcp-1.11.3/academia_mcp/tools/show_image.py → academia_mcp-1.11.5/academia_mcp/tools/image_processing.py RENAMED Viewed

@@ -1,16 +1,28 @@
+import asyncio
 import base64
-from pathlib import Path
+import contextlib
+import json
+import logging
+import os
+import threading
 from io import BytesIO
-from typing import Dict, Optional
+from pathlib import Path
 from textwrap import dedent
+from typing import Dict, List, Optional, Any
 import httpx
+from paddleocr import PaddleOCR  # type: ignore
 from PIL import Image
+from pydantic import BaseModel
 from academia_mcp.files import get_workspace_dir
+from academia_mcp.llm import ChatMessage, llm_acall
 from academia_mcp.settings import settings
-from academia_mcp.llm import llm_acall, ChatMessage
+paddlex_logger = logging.getLogger("paddlex")
+paddleocr_logger = logging.getLogger("paddleocr")
+paddlex_logger.setLevel(logging.ERROR)
+paddleocr_logger.setLevel(logging.ERROR)
 DESCRIBE_PROMPTS = {
     "general": "Provide a general description of this image. Focus on the main subjects, colors, and overall scene.",
@@ -37,16 +49,64 @@ DESCRIBE_PROMPTS = {
         - If layout is multi-column or tabular, reconstruct lines top-to-bottom, left-to-right; use line breaks between blocks.
         - For any uncertain or low-confidence characters, mark with a '?' and include a note.
         - After the raw extraction, provide a clean, normalized version (fixing obvious OCR artifacts) as a separate section.
-        Return two sections:
+        Return three sections:
+        [GENERAL IMAGE DESCRIPTION]
+        ...
         [RAW TRANSCRIPTION]
         ...
-        [NORMALIZED]
+        [NORMALIZED TRANSCRIPTION]
         ...
         """
     ),
 }
+class OCRBox(BaseModel):  # type: ignore
+    # One OCR result item. _run_ocr builds these from the zipped
+    # rec_polys / rec_texts / rec_scores lists of a PaddleOCR prediction.
+    # poly: entry taken from rec_polys; presumably the region outline as [x, y] points - TODO confirm against PaddleOCR output.
+    poly: List[List[float]]
+    # text: entry taken from rec_texts (the recognized string).
+    text: str
+    # score: entry taken from rec_scores; presumably the recognition confidence - TODO confirm.
+    score: float
+class OCRSingleton:
+    """
+    Holds a single class-level PaddleOCR engine that is constructed on first use.
+    """
+    # instance: the shared engine, or None until get() has constructed it.
+    instance: Optional[PaddleOCR] = None
+    # lock: serializes construction of the shared engine.
+    lock: threading.Lock = threading.Lock()
+    @classmethod
+    def get(cls) -> PaddleOCR:
+        """
+        Return the shared PaddleOCR engine, constructing it on the first call.
+        """
+        # Fast path: once the engine exists, return it without taking the lock.
+        if cls.instance is not None:
+            return cls.instance
+        with cls.lock:
+            # Re-check under the lock: another caller may have built the engine
+            # between the unlocked check above and acquiring the lock.
+            if cls.instance is None:
+                # Python-level stderr is redirected to os.devnull while the engine is constructed.
+                with open(os.devnull, "w") as devnull:
+                    with contextlib.redirect_stderr(devnull):
+                        cls.instance = PaddleOCR(
+                            use_doc_orientation_classify=False,
+                            use_doc_unwarping=False,
+                            use_textline_orientation=False,
+                        )
+        return cls.instance
+async def _run_ocr(path: str) -> Dict[str, Any]:
+    """
+    Run OCR on the image at `path` in a worker thread.
+    Returns {"boxes": [...]} with one dumped OCRBox per recognized item,
+    or {"error": message} if obtaining the prediction raises.
+    """
+    def _recognize(image_path: str) -> Dict[str, Any]:
+        try:
+            engine = OCRSingleton.get()
+            # Python-level stderr is redirected to os.devnull for the duration of the prediction.
+            with open(os.devnull, "w") as sink, contextlib.redirect_stderr(sink):
+                prediction = engine.predict(input=image_path)[0]
+            texts = prediction["rec_texts"]
+            scores = prediction["rec_scores"]
+            polygons = prediction["rec_polys"]
+        except Exception as exc:
+            return {"error": str(exc)}
+        boxes = [
+            OCRBox(poly=polygon, text=text, score=score).model_dump()
+            for polygon, text, score in zip(polygons, texts, scores)
+        ]
+        return {"boxes": boxes}
+    return await asyncio.to_thread(_recognize, path)
 def show_image(path: str) -> Dict[str, str]:
     """
     Reads an image from the specified URL or from the current work directory.
@@ -91,7 +151,7 @@ async def describe_image(
             - "general": General description of the image
             - "detailed": Detailed analysis of the image
             - "chess": Analysis of a chess position
-            - "text": Extract and describe text or numbers from the image
+            - "text": Extract and describe text or numbers with an OCR pipeline.
             - "custom": Custom description based on user prompt
     """
     image_base64 = show_image(path)["image_base64"]
@@ -116,4 +176,12 @@ async def describe_image(
         messages=[ChatMessage(role="user", content=content)],
         **llm_kwargs,
     )
+    if description_type == "text":
+        ocr_response = await _run_ocr(path)
+        response = json.dumps(
+            {
+                "vlm_response": response,
+                "ocr_response": ocr_response if ocr_response else [],
+            }
+        )
     return response

{academia_mcp-1.11.3 → academia_mcp-1.11.5}/academia_mcp/tools/s2.py RENAMED Viewed

@@ -8,10 +8,12 @@ from pydantic import BaseModel, Field
 from academia_mcp.utils import get_with_retries
-PAPER_URL_TEMPLATE = "https://api.semanticscholar.org/graph/v1/paper/{paper_id}?fields={fields}"
-CITATIONS_URL_TEMPLATE = "https://api.semanticscholar.org/graph/v1/paper/{paper_id}/citations?fields={fields}&offset={offset}&limit={limit}"
-REFERENCES_URL_TEMPLATE = "https://api.semanticscholar.org/graph/v1/paper/{paper_id}/references?fields={fields}&offset={offset}&limit={limit}"
-FIELDS = "title,authors,externalIds,venue,citationCount,publicationDate"
+BASE_URL = "https://api.semanticscholar.org/graph/v1"
+PAPER_URL_TEMPLATE = "{base_url}/paper/{paper_id}"
+CITATIONS_URL_TEMPLATE = "{base_url}/paper/{paper_id}/citations"
+REFERENCES_URL_TEMPLATE = "{base_url}/paper/{paper_id}/references"
+SEARCH_URL_TEMPLATE = "{base_url}/paper/search"
+FIELDS = "paperId,title,authors,externalIds,venue,citationCount,publicationDate"
 class S2PaperInfo(BaseModel):  # type: ignore
@@ -38,7 +40,10 @@ def _format_authors(authors: List[Dict[str, Any]]) -> List[str]:
 def _clean_entry(entry: Dict[str, Any]) -> S2PaperInfo:
-    entry = entry["citingPaper"] if "citingPaper" in entry else entry["citedPaper"]
+    if "citingPaper" in entry:
+        entry = entry["citingPaper"]
+    elif "citedPaper" in entry:
+        entry = entry["citedPaper"]
     external_ids = entry.get("externalIds")
     if not external_ids:
         external_ids = dict()
@@ -88,17 +93,17 @@ def s2_get_citations(
         arxiv_id = arxiv_id.split("v")[0]
     paper_id = f"arxiv:{arxiv_id}"
-    url = CITATIONS_URL_TEMPLATE.format(
-        paper_id=paper_id, fields=FIELDS, offset=offset, limit=limit
-    )
-    response = get_with_retries(url)
+    url = CITATIONS_URL_TEMPLATE.format(base_url=BASE_URL, paper_id=paper_id)
+    payload = {"fields": FIELDS, "offset": offset, "limit": limit}
+    response = get_with_retries(url, params=payload)
     result = response.json()
     entries = result["data"]
     total_count = len(result["data"]) + result["offset"]
     if "next" in result:
-        paper_url = PAPER_URL_TEMPLATE.format(paper_id=paper_id, fields=FIELDS)
-        paper_response = get_with_retries(paper_url)
+        paper_url = PAPER_URL_TEMPLATE.format(base_url=BASE_URL, paper_id=paper_id)
+        payload = {"fields": FIELDS}
+        paper_response = get_with_retries(paper_url, params=payload)
         paper_result = paper_response.json()
         total_count = paper_result["citationCount"]
@@ -123,10 +128,9 @@ def s2_get_references(
         arxiv_id = arxiv_id.split("v")[0]
     paper_id = f"arxiv:{arxiv_id}"
-    url = REFERENCES_URL_TEMPLATE.format(
-        paper_id=paper_id, fields=FIELDS, offset=offset, limit=limit
-    )
-    response = get_with_retries(url)
+    url = REFERENCES_URL_TEMPLATE.format(base_url=BASE_URL, paper_id=paper_id)
+    payload = {"fields": FIELDS, "offset": offset, "limit": limit}
+    response = get_with_retries(url, params=payload)
     result = response.json()
     entries = result["data"]
     total_count = len(result["data"]) + result["offset"]
@@ -143,8 +147,9 @@ def s2_corpus_id_from_arxiv_id(arxiv_id: str) -> int:
     assert isinstance(arxiv_id, str), "Error: Your arxiv_id must be a string"
     if "v" in arxiv_id:
         arxiv_id = arxiv_id.split("v")[0]
-    paper_url = PAPER_URL_TEMPLATE.format(paper_id=f"arxiv:{arxiv_id}", fields="externalIds")
-    response = get_with_retries(paper_url)
+    paper_url = PAPER_URL_TEMPLATE.format(base_url=BASE_URL, paper_id=f"arxiv:{arxiv_id}")
+    payload = {"fields": "externalIds"}
+    response = get_with_retries(paper_url, params=payload)
     result = response.json()
     return int(result["externalIds"]["CorpusId"])
@@ -159,8 +164,10 @@ def s2_get_info(arxiv_id: str) -> S2PaperInfo:
     assert isinstance(arxiv_id, str), "Error: Your arxiv_id must be a string"
     if "v" in arxiv_id:
         arxiv_id = arxiv_id.split("v")[0]
-    paper_url = PAPER_URL_TEMPLATE.format(paper_id=f"arxiv:{arxiv_id}", fields=FIELDS)
-    response = get_with_retries(paper_url)
+    paper_id = f"arxiv:{arxiv_id}"
+    payload = {"fields": FIELDS}
+    paper_url = PAPER_URL_TEMPLATE.format(base_url=BASE_URL, paper_id=paper_id)
+    response = get_with_retries(paper_url, params=payload)
     json_data = response.json()
     return S2PaperInfo(
         arxiv_id=json_data.get("externalIds", {}).get("ArXiv"),
@@ -171,3 +178,45 @@ def s2_get_info(arxiv_id: str) -> S2PaperInfo:
         citation_count=int(json_data.get("citationCount", 0)),
         publication_date=str(json_data.get("publicationDate", "")),
     )
+def s2_search(
+    query: str,
+    offset: int = 0,
+    limit: int = 5,
+    min_citation_count: int = 0,
+    publication_date: Optional[str] = None,
+) -> S2SearchResponse:
+    """
+    Search the S2 corpus for a given query.
+    Args:
+        query: The query to search for.
+        offset: The offset to scroll through results. 10 items will be skipped if offset=10. 0 by default.
+        limit: The maximum number of items to return. 5 by default.
+        min_citation_count: The minimum citation count to return. 0 by default.
+        publication_date: Restricts results to the given range of publication dates or years (inclusive).
+            Accepts the format <startDate>:<endDate> with each date in YYYY-MM-DD format. None by default.
+    Returns:
+        An S2SearchResponse. When the API response has no "data" key, an empty response
+        (total_count=0, returned_count=0, results=[]) is returned instead.
+    """
+    # A falsy offset is reported back to the caller as 0.
+    reported_offset = offset if offset else 0
+    url = SEARCH_URL_TEMPLATE.format(base_url=BASE_URL)
+    payload: Dict[str, Any] = {
+        "query": query,
+        "offset": offset,
+        "limit": limit,
+        "minCitationCount": min_citation_count,
+        "fields": FIELDS,
+    }
+    # The date filter is only sent when the caller supplied one.
+    if publication_date:
+        payload["publicationDateOrYear"] = publication_date
+    # This call overrides the get_with_retries defaults for backoff factor and retry count.
+    response = get_with_retries(url, params=payload, backoff_factor=10.0, num_retries=5)
+    result = response.json()
+    if "data" not in result:
+        return S2SearchResponse(
+            total_count=0,
+            returned_count=0,
+            offset=reported_offset,
+            results=[],
+        )
+    entries = result["data"]
+    total_count = result["total"]
+    return _format_entries(entries, reported_offset, total_count)

{academia_mcp-1.11.3 → academia_mcp-1.11.5}/academia_mcp/utils.py RENAMED Viewed

@@ -42,7 +42,7 @@ def post_with_retries(
 def get_with_retries(
     url: str,
     api_key: Optional[str] = None,
-    timeout: int = 30,
+    timeout: int = 60,
     num_retries: int = 3,
     backoff_factor: float = 3.0,
     params: Optional[Dict[str, Any]] = None,

{academia_mcp-1.11.3 → academia_mcp-1.11.5}/academia_mcp.egg-info/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: academia-mcp
-Version: 1.11.3
+Version: 1.11.5
 Summary: MCP server that provides different tools to search for scientific publications
 Author-email: Ilya Gusev <phoenixilya@gmail.com>
 Project-URL: Homepage, https://github.com/IlyaGusev/academia_mcp
@@ -12,16 +12,14 @@ Description-Content-Type: text/markdown
 License-File: LICENSE
 Requires-Dist: mcp>=1.10.1
 Requires-Dist: xmltodict>=0.14.0
-Requires-Dist: types-xmltodict>=0.14.0
 Requires-Dist: requests>=2.32.0
-Requires-Dist: types-requests>=2.32.0
 Requires-Dist: pypdf>=5.1.0
 Requires-Dist: beautifulsoup4>=4.12.0
-Requires-Dist: types-beautifulsoup4>=4.12.0
 Requires-Dist: markdownify==0.14.1
+Requires-Dist: types-xmltodict>=0.14.0
+Requires-Dist: types-requests>=2.32.0
+Requires-Dist: types-beautifulsoup4>=4.12.0
 Requires-Dist: acl-anthology==0.5.2
-Requires-Dist: markdown==3.7.0
-Requires-Dist: types-markdown==3.7.0.20250322
 Requires-Dist: huggingface-hub>=0.32.4
 Requires-Dist: fire>=0.7.0
 Requires-Dist: openai>=1.97.1
@@ -31,6 +29,8 @@ Requires-Dist: pymupdf>=1.26.4
 Requires-Dist: pillow>=11.3.0
 Requires-Dist: pydantic-settings>=2.6.0
 Requires-Dist: youtube-transcript-api>=1.2.2
+Requires-Dist: paddlepaddle>=3.2.0
+Requires-Dist: paddleocr>=3.2.0
 Dynamic: license-file
 # Academia MCP
@@ -70,12 +70,16 @@ make install
 ### Quickstart
 - Run over HTTP (default transport):
 ```bash
+python -m academia_mcp --transport streamable-http
+# OR
 uv run -m academia_mcp --transport streamable-http
 ```
 - Run over stdio (for local MCP clients like Claude Desktop):
 ```bash
 python -m academia_mcp --transport stdio
+# OR
+uv run -m academia_mcp --transport stdio
 ```
 Notes:
@@ -122,7 +126,7 @@ Availability notes:
 - Set one or more of `EXA_API_KEY`, `BRAVE_API_KEY`, `TAVILY_API_KEY` to enable `web_search` and provider tools.
 ### Environment variables
-Set as needed depending on which tools you use:
+Set as needed, depending on which tools you use:
 - `OPENROUTER_API_KEY`: required for LLM-related tools.
 - `BASE_URL`: override OpenRouter base URL.
@@ -152,7 +156,7 @@ docker run --rm -p 5056:5056 \
   academia_mcp
 ```
-Or use existing image: `phoenix120/academia_mcp`
+Or use existing image: [`phoenix120/academia_mcp`](https://hub.docker.com/repository/docker/phoenix120/academia_mcp)
 ### Examples
 - [Comprehensive report screencast (YouTube)](https://www.youtube.com/watch?v=4bweqQcN6w8)

{academia_mcp-1.11.3 → academia_mcp-1.11.5}/academia_mcp.egg-info/SOURCES.txt RENAMED Viewed

@@ -25,11 +25,11 @@ academia_mcp/tools/arxiv_search.py
 academia_mcp/tools/bitflip.py
 academia_mcp/tools/document_qa.py
 academia_mcp/tools/hf_datasets_search.py
+academia_mcp/tools/image_processing.py
 academia_mcp/tools/latex.py
 academia_mcp/tools/py.typed
 academia_mcp/tools/review.py
 academia_mcp/tools/s2.py
-academia_mcp/tools/show_image.py
 academia_mcp/tools/speech_to_text.py
 academia_mcp/tools/visit_webpage.py
 academia_mcp/tools/web_search.py
@@ -41,11 +41,11 @@ tests/test_bitflip.py
 tests/test_document_qa.py
 tests/test_extract_json.py
 tests/test_hf_dataset_search.py
+tests/test_image_processing.py
 tests/test_latex.py
 tests/test_review.py
 tests/test_s2.py
 tests/test_server.py
-tests/test_show_image.py
 tests/test_speech_to_text.py
 tests/test_visit_webpage.py
 tests/test_web_search.py

{academia_mcp-1.11.3 → academia_mcp-1.11.5}/academia_mcp.egg-info/requires.txt RENAMED Viewed

@@ -1,15 +1,13 @@
 mcp>=1.10.1
 xmltodict>=0.14.0
-types-xmltodict>=0.14.0
 requests>=2.32.0
-types-requests>=2.32.0
 pypdf>=5.1.0
 beautifulsoup4>=4.12.0
-types-beautifulsoup4>=4.12.0
 markdownify==0.14.1
+types-xmltodict>=0.14.0
+types-requests>=2.32.0
+types-beautifulsoup4>=4.12.0
 acl-anthology==0.5.2
-markdown==3.7.0
-types-markdown==3.7.0.20250322
 huggingface-hub>=0.32.4
 fire>=0.7.0
 openai>=1.97.1
@@ -19,3 +17,5 @@ pymupdf>=1.26.4
 pillow>=11.3.0
 pydantic-settings>=2.6.0
 youtube-transcript-api>=1.2.2
+paddlepaddle>=3.2.0
+paddleocr>=3.2.0

{academia_mcp-1.11.3 → academia_mcp-1.11.5}/pyproject.toml RENAMED Viewed

@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
 [project]
 name = "academia-mcp"
-version = "1.11.3"
+version = "1.11.5"
 description = "MCP server that provides different tools to search for scientific publications"
 readme = "README.md"
 authors = [
@@ -19,16 +19,14 @@ classifiers = [
 dependencies = [
     "mcp>=1.10.1",
     "xmltodict>=0.14.0",
-    "types-xmltodict>=0.14.0",
     "requests>=2.32.0",
-    "types-requests>=2.32.0",
     "pypdf>=5.1.0",
     "beautifulsoup4>=4.12.0",
-    "types-beautifulsoup4>=4.12.0",
     "markdownify==0.14.1",
+    "types-xmltodict>=0.14.0",
+    "types-requests>=2.32.0",
+    "types-beautifulsoup4>=4.12.0",
     "acl-anthology==0.5.2",
-    "markdown==3.7.0",
-    "types-markdown==3.7.0.20250322",
     "huggingface-hub>=0.32.4",
     "fire>=0.7.0",
     "openai>=1.97.1",
@@ -38,6 +36,8 @@ dependencies = [
     "pillow>=11.3.0",
     "pydantic-settings>=2.6.0",
     "youtube-transcript-api>=1.2.2",
+    "paddlepaddle>=3.2.0",
+    "paddleocr>=3.2.0",
 ]
 [dependency-groups]

{academia_mcp-1.11.3 → academia_mcp-1.11.5}/tests/test_bitflip.py RENAMED Viewed

@@ -35,18 +35,3 @@ async def test_bitflip_score_research_proposals_base() -> None:
     assert scores.proposals[1].strengths is not None
     assert scores.proposals[0].weaknesses is not None
     assert scores.proposals[1].weaknesses is not None
-async def test_bitflip_score_research_proposals_str() -> None:
-    arxiv_id = "2503.07826"
-    bit = (await extract_bitflip_info(arxiv_id)).bit
-    proposals = await generate_research_proposals(bit=bit, num_proposals=2)
-    scores = await score_research_proposals(proposals)
-    assert scores.proposals
-    assert len(scores.proposals) == 2
-    assert scores.proposals[0].spark is not None
-    assert scores.proposals[1].spark is not None
-    assert scores.proposals[0].strengths is not None
-    assert scores.proposals[1].strengths is not None
-    assert scores.proposals[0].weaknesses is not None
-    assert scores.proposals[1].weaknesses is not None

academia_mcp-1.11.3/tests/test_show_image.py → academia_mcp-1.11.5/tests/test_image_processing.py RENAMED Viewed

@@ -29,3 +29,9 @@ async def test_describe_image_base(test_image_url: str) -> None:
     result = await describe_image(test_image_url)
     assert result is not None
     assert "Interrogator" in result
+async def test_describe_image_text(test_image_url: str) -> None:
+    # With description_type="text" the returned string should contain the OCR entry for the word in the test image.
+    description = await describe_image(test_image_url, description_type="text")
+    assert description is not None
+    assert '"text": "Interrogator"' in description

{academia_mcp-1.11.3 → academia_mcp-1.11.5}/tests/test_s2.py RENAMED Viewed

@@ -3,6 +3,7 @@ from academia_mcp.tools import (
     s2_get_references,
     s2_corpus_id_from_arxiv_id,
     s2_get_info,
+    s2_search,
 )
@@ -40,3 +41,31 @@ def test_s2_get_info() -> None:
     assert info.citation_count is not None
     assert info.publication_date is not None
     assert info.external_ids["CorpusId"] == 272593138
+def test_s2_search_base() -> None:
+    # Default arguments: offset 0 and five returned results.
+    response = s2_search("transformers")
+    assert response.total_count >= 1
+    assert "transformers" in str(response.results).lower()
+    assert response.offset == 0
+    assert response.returned_count == 5
+def test_s2_search_offset() -> None:
+    # A non-zero offset is echoed back and a full page of five is still returned.
+    response = s2_search("transformers", offset=10)
+    assert response.total_count >= 1
+    assert "transformers" in str(response.results).lower()
+    assert response.offset == 10
+    assert response.returned_count == 5
+def test_s2_search_min_citation_count() -> None:
+    # A very high citation threshold should leave only a handful of matches.
+    response = s2_search("transformers", min_citation_count=100000)
+    assert 2 <= response.total_count <= 10
+def test_s2_search_publication_date() -> None:
+    # Combining the citation threshold with a 2017 date range should leave exactly one match.
+    response = s2_search(
+        "transformers",
+        min_citation_count=100000,
+        publication_date="2017-01-01:2017-12-31",
+    )
+    assert response.total_count == 1

{academia_mcp-1.11.3 → academia_mcp-1.11.5}/tests/test_visit_webpage.py RENAMED Viewed

@@ -7,7 +7,6 @@ def test_visit_webpage_basic() -> None:
     assert content.id == "https://example.com/"
     assert content.provider == "basic"
     assert "Example Domain" in content.text
-    assert "illustrative" in content.text
 def test_visit_webpage_exa() -> None:
@@ -16,7 +15,6 @@ def test_visit_webpage_exa() -> None:
     assert content.id == "https://example.com/"
     assert content.provider == "exa"
     assert "Example Domain" in content.text
-    assert "illustrative" in content.text
 def test_visit_webpage_pdf() -> None: