PyPI - academia-mcp - Versions diffs - 1.1.4__tar.gz → 1.2.0__tar.gz - Mend

academia-mcp 1.1.4.tar.gz → 1.2.0.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (43) hide show

{academia_mcp-1.1.4 → academia_mcp-1.2.0}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: academia-mcp
-Version: 1.1.4
+Version: 1.2.0
 Summary: MCP server that provides different tools to search for scientific publications
 Author-email: Ilya Gusev <phoenixilya@gmail.com>
 Project-URL: Homepage, https://github.com/IlyaGusev/academia_mcp
@@ -31,6 +31,7 @@ Requires-Dist: pytest>=8.4.1
 Requires-Dist: openai>=1.97.1
 Requires-Dist: jinja2>=3.1.6
 Requires-Dist: datasets>=4.0.0
+Requires-Dist: pytest-asyncio>=1.1.0
 Dynamic: license-file
 # Academia MCP

academia_mcp-1.2.0/academia_mcp/llm.py ADDED Viewed

@@ -0,0 +1,38 @@
+import os
+from typing import List, Dict, Any
+from pydantic import BaseModel
+from openai import AsyncOpenAI
+from openai.types.chat.chat_completion_message import ChatCompletionMessage
+class ChatMessage(BaseModel):  # type: ignore
+    role: str
+    content: str | List[Dict[str, Any]]
+ChatMessages = List[ChatMessage]
+async def llm_acall(model_name: str, prompt: str) -> str:
+    key = os.getenv("OPENROUTER_API_KEY", "")
+    assert key, "Please set OPENROUTER_API_KEY in the environment variables"
+    base_url = os.getenv("BASE_URL", "https://openrouter.ai/api/v1")
+    messages: ChatMessages = [
+        ChatMessage(role="user", content=prompt),
+    ]
+    client = AsyncOpenAI(base_url=base_url, api_key=key)
+    response: ChatCompletionMessage = (
+        (
+            await client.chat.completions.create(
+                model=model_name,
+                messages=messages,
+                temperature=0.0,
+            )
+        )
+        .choices[0]
+        .message
+    )
+    assert response.content, "Response content is None"
+    return response.content

{academia_mcp-1.1.4 → academia_mcp-1.2.0}/academia_mcp/server.py RENAMED Viewed

@@ -15,7 +15,12 @@ from .tools.document_qa import document_qa
 from .tools.md_to_pdf import md_to_pdf
 from .tools.web_search import web_search, tavily_web_search, exa_web_search, brave_web_search
 from .tools.visit_webpage import visit_webpage
-from .tools.bitflip import propose_improvement_idea, extract_bitflip_info
+from .tools.bitflip import (
+    extract_bitflip_info,
+    generate_research_proposal,
+    score_research_proposals,
+)
 load_dotenv()
@@ -53,6 +58,9 @@ def run(
     server.add_tool(anthology_search)
     server.add_tool(md_to_pdf)
     server.add_tool(visit_webpage)
+    server.add_tool(extract_bitflip_info)
+    server.add_tool(generate_research_proposal)
+    server.add_tool(score_research_proposals)
     if os.getenv("TAVILY_API_KEY"):
         server.add_tool(tavily_web_search)
@@ -64,8 +72,6 @@ def run(
         server.add_tool(web_search)
     if os.getenv("OPENROUTER_API_KEY"):
         server.add_tool(document_qa)
-        server.add_tool(propose_improvement_idea)
-        server.add_tool(extract_bitflip_info)
     if port is None:
         port = find_free_port()

{academia_mcp-1.1.4 → academia_mcp-1.2.0}/academia_mcp/tools/__init__.py RENAMED Viewed

@@ -7,7 +7,7 @@ from .document_qa import document_qa
 from .md_to_pdf import md_to_pdf
 from .web_search import web_search, tavily_web_search, exa_web_search, brave_web_search
 from .visit_webpage import visit_webpage
-from .bitflip import propose_improvement_idea, extract_bitflip_info
+from .bitflip import extract_bitflip_info, generate_research_proposal, score_research_proposals
 __all__ = [
@@ -24,6 +24,7 @@ __all__ = [
     "exa_web_search",
     "brave_web_search",
     "visit_webpage",
-    "propose_improvement_idea",
     "extract_bitflip_info",
+    "generate_research_proposal",
+    "score_research_proposals",
 ]

academia_mcp-1.2.0/academia_mcp/tools/bitflip.py ADDED Viewed

@@ -0,0 +1,282 @@
+# https://arxiv.org/abs/2504.12976
+# https://web.stanford.edu/class/cs197c/slides/02-literature-search.pdf
+import json
+import os
+import random
+from typing import List, Optional, Any
+from pydantic import BaseModel
+from datasets import load_dataset  # type: ignore
+from academia_mcp.tools.arxiv_download import arxiv_download
+from academia_mcp.utils import extract_json, encode_prompt
+from academia_mcp.llm import llm_acall
+class ProposalDataset:
+    dataset: Optional[List[Any]] = None
+    @classmethod
+    def get_dataset(cls) -> List[Any]:
+        if cls.dataset is None:
+            cls.dataset = list(load_dataset("UniverseTBD/hypogen-dr1")["train"])
+        return cls.dataset
+EXTRACT_PROMPT = """
+You are a highly advanced research assistant.
+You specialize in reading scientific papers for hypothesis generation and identifying innovative ideas.
+## Example (BERT in NLP)
+Before you begin, let 's revisit the Bit-Flip concept with an example (BERT in NLP):
+- Bit: Traditional NLP models (RNNs, LSTMs) process text sequentially,
+limiting their ability to understand long-range dependencies and fully capture bidirectional context.
+- Flip: Instead, consider entire sentences at once, allowing context from both directions. This helps capture nuanced relationships among words.
+- Spark: Bidirectional context for NLP.
+## Framework
+A Bit-Flip inverts a commonly held assumption,
+questioning existing constraints or reapplying techniques to new domains/scales.
+The "Bit" is the prevailing belief, and the "Flip" is the counterargument.
+## Guidance for analysis
+1. Bit (Technical Insight):
+- Provide at least two sentences clearly stating the status quo or conventional approach.
+- Highlight the limitation or problem it creates.
+- Include enough detail so it is self-contained and does not rely on additional context from elsewhere.
+2. Flip (Innovation):
+- Provide at least two sentences describing the novel approach or perspective.
+- Explain the method or technique that enables this change.
+- Include enough detail so the Flip is understandable on its own.
+3. Spark (Core Summary):
+- A concise 4-6 word phrase capturing the core idea.
+Now, consider this research abstract:
+{{abstract}}
+Your task:
+Identify the Bit, Flip, and Spark from the abstract in a detailed manner:
+- Bit: at least two sentences, with sufficient detail about the conventional approach and its limitation.
+- Flip: at least two sentences, describing the new approach or perspective with enough detail to understand the main technique.
+- Spark: a concise 4-6 word summary of the core idea.
+Follow these rules:
+- Do not cite the paper itself or its authors.
+- Instead of saying "We/I introduced an idea", just say "An idea was introduced ...".
+Return only the JSON object in this exact format (no extra text):
+{
+    "bit": "Technical limitation or conventional approach, in at least two sentences",
+    "flip": "Innovative approach or solution, in at least two sentences",
+    "spark": "4-6 word summary"
+}
+"""
+IMPROVEMENT_PROMPT = """
+You are a highly advanced research assistant.
+You specialize in hypothesis generation and identifying innovative ideas.
+You are given a Bit, which is a technical limitation or conventional approach of some paper.
+Your task is to propose an improvement idea for the Bit called Flip and summarize it in a Spark.
+Do not propose any human annotations or human-in-the-loop, the idea should be automatically verifiable.
+Try to be as specific as possible.
+{% for example in examples %}
+## Example {{loop.index}}
+- Bit: {{example["bit"]}}
+- Chain of reasoning: {{example["chain_of_reasoning"]}}
+- Flip: {{example["flip"]}}
+- Spark: {{example["spark"]}}
+{% endfor %}
+Now, please propose a chain of reasoning that leads to an improvement idea for this Bit:
+{{bit}}
+{% if additional_context %}Additional context:
+{{additional_context}}{% endif %}
+Finalize your idea by providing the idea details:
+- Abstract: An abstract that summarizes the proposal in conference format (approximately 250 words).
+- Experiments: A list of experiments that would be conducted to validate the proposal. Ensure these are simple and feasible. Be specific in exactly how you would test the hypothesis, and detail precise algorithmic changes. Include the evaluation metrics you would use.
+- Risks and limitations: A list of potential risks and limitations of the proposal.
+Return only the JSON object in this exact format (no extra text):
+{
+    "chain_of_reasoning": "Chain of reasoning that leads to an improvement idea for this Bit. At least 5 sentences.",
+    "flip": "Innovative approach or solution, in at least two sentences",
+    "spark": "4-6 word summary",
+    "abstract": "An abstract that summarizes the proposal in conference format (approximately 250 words).",
+    "experiments": ["...", "..."],
+    "risks_and_limitations": "A list of potential risks and limitations of the proposal."
+}
+"""
+SCORE_PROMPT = """
+You are a highly advanced research assistant.
+You are given a list of research proposals.
+Your task is to score the proposals.
+Proposals:
+{% for proposal in proposals %}
+- Proposal ID: {{proposal["proposal_id"]}}
+- Spark: {{proposal["spark"]}}
+- Abstract: {{proposal["abstract"]}}
+- Experiments: {{proposal["experiments"]}}
+- Risks and limitations: {{proposal["risks_and_limitations"]}}
+{% endfor %}
+Here are the criteria:
+- "Strengths": A list of strengths of the proposal.
+- "Weaknesses": A list of weaknesses of the proposal.
+- "Novelty": Is the proposal novel? A rating from 1 to 4 (low, medium, high, very high).
+- "Clarity": Is the proposal clear? A rating from 1 to 4 (low, medium, high, very high).
+- "Significance": Is the proposal significant? A rating from 1 to 4 (low, medium, high, very high).
+- "Feasibility": Is the proposal feasible and easy to implement? A rating from 1 to 4 (low, medium, high, very high).
+- "Soundness": Is the proposal sound? A rating from 1 to 4 (poor, fair, good, excellent).
+- "Overall": A rating from 1 to 10 (very strong reject to award quality).
+Return only scores for all proposals in this exact format (no extra text):
+[
+    {
+        "proposal_id": 0,
+        "spark": "...",
+        "strengths": ["...", "..."],
+        "weaknesses": ["...", "..."],
+        "novelty": 2,
+        "clarity": 2,
+        "significance": 2,
+        "feasibility": 2,
+        "soundness": 2,
+        "overall": 5
+    },
+    ...
+]
+"""
+class BitFlipInfo(BaseModel):  # type: ignore
+    bit: str
+    flip: str
+    spark: str
+class Proposal(BaseModel):  # type: ignore
+    proposal_id: Optional[int] = None
+    flip: str
+    spark: str
+    abstract: str
+    experiments: List[str]
+    risks_and_limitations: List[str]
+class ProposalScores(BaseModel):  # type: ignore
+    proposal_id: int
+    spark: str
+    strengths: List[str]
+    weaknesses: List[str]
+    novelty: int
+    clarity: int
+    significance: int
+    feasibility: int
+    soundness: int
+    overall: int
+async def extract_bitflip_info(arxiv_id: str) -> str:
+    """
+    Extracts the Bit-Flip information from the arXiv paper.
+    A Bit-Flip is a technique that inverts a commonly held assumption,
+    questioning existing constraints or reapplying techniques to new domains/scales.
+    The "Bit" is the prevailing belief, and the "Flip" is the counterargument.
+    Returns a JSON object in this format:
+    {
+        "bit": "Technical limitation or conventional approach, in at least two sentences",
+        "flip": "Innovative approach or solution, in at least two sentences",
+        "spark": "4-6 word summary of the core idea"
+    }
+    Use `json.loads` to deserialize the result if you want to get specific fields.
+    Args:
+        arxiv_id: The arXiv ID of the paper to extract the Bit-Flip information from.
+    """
+    model_name = os.getenv("BITFLIP_MODEL_NAME", "deepseek/deepseek-chat-v3-0324")
+    paper = arxiv_download(arxiv_id)
+    abstract = json.loads(paper)["abstract"]
+    prompt = encode_prompt(EXTRACT_PROMPT, abstract=abstract)
+    content = await llm_acall(model_name=model_name, prompt=prompt)
+    result = extract_json(content)
+    bitflip_info: BitFlipInfo = BitFlipInfo.model_validate(result)
+    return str(bitflip_info.model_dump_json())
+async def generate_research_proposal(bit: str, additional_context: str = "") -> str:
+    """
+    Proposes an improvement idea for the Bit.
+    Args:
+        bit: The Bit to propose an improvement idea for. The bit is a technical limitation or conventional approach of some paper.
+        additional_context: Additional context to use when proposing the improvement idea.
+    Returns a JSON string with a research proposal in this format:
+    {
+        "proposal_id": ...,
+        "flip": "Innovative approach or solution, in at least two sentences",
+        "spark": "4-6 word summary",
+        "abstract": "An abstract that summarizes the proposal in conference format (approximately 250 words).",
+        "experiments": ["...", "..."],
+        "risks_and_limitations": "A list of potential risks and limitations of the proposal."
+    }
+    Use `json.loads` to deserialize the result if you want to get specific fields.
+    """
+    model_name = os.getenv("BITFLIP_MODEL_NAME", "deepseek/deepseek-chat-v3-0324")
+    examples = ProposalDataset.get_dataset()[:]
+    examples = random.choices(examples, k=4)
+    prompt = encode_prompt(
+        IMPROVEMENT_PROMPT, bit=bit, examples=examples, additional_context=additional_context
+    )
+    content = await llm_acall(model_name=model_name, prompt=prompt)
+    result = extract_json(content)
+    proposal: Proposal = Proposal.model_validate(result)
+    proposal.proposal_id = random.randint(0, 1000000)
+    return str(proposal.model_dump_json())
+async def score_research_proposals(proposals: List[str]) -> str:
+    """
+    Scores a list of research proposals.
+    Use proposals obtained with the `generate_research_proposal` tool.
+    Returns a JSON string with a list of scores in this format:
+    [
+        {
+            "proposal_id": 0,
+            "spark": "...",
+            "strengths": ["...", "..."],
+            "weaknesses": ["...", "..."],
+            "novelty": 2,
+            "clarity": 2,
+            "significance": 2,
+            "feasibility": 2,
+            "soundness": 2,
+            "overall": 5
+        },
+        ...
+    ]
+    Use `json.loads` to deserialize the result if you want to get specific fields.
+    Args:
+        proposals: A list of JSON strings with research proposals.
+    """
+    model_name = os.getenv("BITFLIP_MODEL_NAME", "deepseek/deepseek-chat-v3-0324")
+    proposals = [Proposal.model_validate_json(proposal) for proposal in proposals]
+    prompt = encode_prompt(SCORE_PROMPT, proposals=proposals)
+    content = await llm_acall(model_name=model_name, prompt=prompt)
+    scores = extract_json(content)
+    final_scores = [ProposalScores.model_validate(score) for score in scores]
+    return json.dumps([s.model_dump() for s in final_scores], ensure_ascii=False)

{academia_mcp-1.1.4 → academia_mcp-1.2.0}/academia_mcp/tools/document_qa.py RENAMED Viewed

@@ -1,18 +1,15 @@
 import os
-from typing import List, Any, Dict, cast
+from typing import List, Any, Dict
 from dotenv import load_dotenv
 from pydantic import BaseModel
-from openai import OpenAI
-from openai.types.chat import ChatCompletionMessageParam, ChatCompletionMessage
+from academia_mcp.llm import llm_acall
 load_dotenv()
-SYSTEM_PROMPT = (
-    "You are a helpful assistant that answers questions about documents accurately and concisely."
-)
-PROMPT = """Please answer the following questions based solely on the provided document.
+PROMPT = """You are a helpful assistant that answers questions about documents accurately and concisely.
+Please answer the following questions based solely on the provided document.
 If there is no answer in the document, output "There is no answer in the provided document".
 First cite ALL relevant document fragments, then provide a final answer.
 Answer all given questions one by one.
@@ -40,7 +37,7 @@ class ChatMessage(BaseModel):  # type: ignore
 ChatMessages = List[ChatMessage]
-def document_qa(
+async def document_qa(
     document: str,
     question: str,
 ) -> str:
@@ -64,33 +61,7 @@ def document_qa(
     assert question and question.strip(), "Please provide non-empty 'question'"
     assert document and document.strip(), "Please provide non-empty 'document'"
-    base_url = os.getenv("BASE_URL", "https://openrouter.ai/api/v1")
-    key = os.getenv("OPENROUTER_API_KEY", "")
-    assert key, "Please set OPENROUTER_API_KEY in the environment variables"
     model_name = os.getenv("DOCUMENT_QA_MODEL_NAME", "deepseek/deepseek-chat-v3-0324")
-    messages: ChatMessages = [
-        ChatMessage(role="system", content=SYSTEM_PROMPT),
-        ChatMessage(
-            role="user",
-            content=PROMPT.format(question=question, document=document),
-        ),
-    ]
-    sdk_messages = [
-        cast(ChatCompletionMessageParam, m.model_dump(exclude_none=True)) for m in messages
-    ]
-    client = OpenAI(base_url=base_url, api_key=key)
-    response: ChatCompletionMessage = (
-        client.chat.completions.create(
-            model=model_name,
-            messages=sdk_messages,
-            temperature=0.0,
-        )
-        .choices[0]
-        .message
-    )
-    if response.content is None:
-        raise Exception("Response content is None")
-    return response.content.strip()
+    prompt = PROMPT.format(question=question, document=document)
+    content = await llm_acall(model_name=model_name, prompt=prompt)
+    return content.strip()

{academia_mcp-1.1.4 → academia_mcp-1.2.0}/academia_mcp.egg-info/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: academia-mcp
-Version: 1.1.4
+Version: 1.2.0
 Summary: MCP server that provides different tools to search for scientific publications
 Author-email: Ilya Gusev <phoenixilya@gmail.com>
 Project-URL: Homepage, https://github.com/IlyaGusev/academia_mcp
@@ -31,6 +31,7 @@ Requires-Dist: pytest>=8.4.1
 Requires-Dist: openai>=1.97.1
 Requires-Dist: jinja2>=3.1.6
 Requires-Dist: datasets>=4.0.0
+Requires-Dist: pytest-asyncio>=1.1.0
 Dynamic: license-file
 # Academia MCP

{academia_mcp-1.1.4 → academia_mcp-1.2.0}/academia_mcp.egg-info/SOURCES.txt RENAMED Viewed

@@ -4,6 +4,7 @@ pyproject.toml
 academia_mcp/__init__.py
 academia_mcp/__main__.py
 academia_mcp/files.py
+academia_mcp/llm.py
 academia_mcp/py.typed
 academia_mcp/server.py
 academia_mcp/utils.py

{academia_mcp-1.1.4 → academia_mcp-1.2.0}/academia_mcp.egg-info/requires.txt RENAMED Viewed

@@ -19,3 +19,4 @@ pytest>=8.4.1
 openai>=1.97.1
 jinja2>=3.1.6
 datasets>=4.0.0
+pytest-asyncio>=1.1.0

{academia_mcp-1.1.4 → academia_mcp-1.2.0}/pyproject.toml RENAMED Viewed

@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
 [project]
 name = "academia-mcp"
-version = "1.1.4"
+version = "1.2.0"
 description = "MCP server that provides different tools to search for scientific publications"
 readme = "README.md"
 authors = [
@@ -38,6 +38,7 @@ dependencies = [
     "openai>=1.97.1",
     "jinja2>=3.1.6",
     "datasets>=4.0.0",
+    "pytest-asyncio>=1.1.0",
 ]
 [project.urls]
@@ -63,3 +64,6 @@ include = ["academia_mcp*"]
 module = "pydantic.*"
 follow_imports = "skip"
+[tool.pytest.ini_options]
+asyncio_mode = "auto"
+asyncio_default_test_loop_scope = "function"

academia_mcp-1.2.0/tests/test_bitflip.py ADDED Viewed

@@ -0,0 +1,38 @@
+import json
+from academia_mcp.tools.bitflip import (
+    extract_bitflip_info,
+    generate_research_proposal,
+    score_research_proposals,
+)
+async def test_bitflip_extract_info() -> None:
+    arxiv_id = "2409.06820"
+    result = json.loads(await extract_bitflip_info(arxiv_id))
+    assert result is not None
+    assert result["bit"]
+async def test_bitflip_generate_research_proposal() -> None:
+    arxiv_id = "2503.07826"
+    bit = json.loads(await extract_bitflip_info(arxiv_id))["bit"]
+    result = json.loads(await generate_research_proposal(bit=bit))
+    assert result is not None
+    assert result["flip"]
+async def test_bitflip_score_research_proposals() -> None:
+    arxiv_id = "2503.07826"
+    bit = json.loads(await extract_bitflip_info(arxiv_id))["bit"]
+    proposal1 = await generate_research_proposal(bit=bit)
+    proposal2 = await generate_research_proposal(bit=bit)
+    scores = json.loads(await score_research_proposals([proposal1, proposal2]))
+    assert scores
+    assert len(scores) == 2
+    assert scores[0]["spark"] is not None
+    assert scores[1]["spark"] is not None
+    assert scores[0]["strengths"] is not None
+    assert scores[1]["strengths"] is not None
+    assert scores[0]["weaknesses"] is not None
+    assert scores[1]["weaknesses"] is not None

{academia_mcp-1.1.4 → academia_mcp-1.2.0}/tests/test_document_qa.py RENAMED Viewed

@@ -17,16 +17,16 @@ English constituency parsing both with large and limited training data.
 """
-def test_document_qa_base() -> None:
-    answer = document_qa(
+async def test_document_qa_base() -> None:
+    answer = await document_qa(
         question="What is BLEU on the WMT 2014 English-to-German translation task?",
         document=DOCUMENT1,
     )
     assert "28.4" in answer
-def test_document_qa_real_question() -> None:
+async def test_document_qa_real_question() -> None:
     questions = "What is the best model for the Russian language according to the role-play benchmark and its final score?"
     document = arxiv_download("2409.06820")
-    answer = document_qa(question=questions, document=document)
+    answer = await document_qa(question=questions, document=document)
     assert "4.62" in answer or "4.68" in answer

{academia_mcp-1.1.4 → academia_mcp-1.2.0}/tests/test_web_search.py RENAMED Viewed

@@ -6,7 +6,6 @@ from academia_mcp.tools import web_search
 def test_web_search_base() -> None:
     result = web_search("autoregressive models path-star graphs", limit=20)
     assert "The Mystery of the Pathological" in result
-    assert "The Pitfalls of Next-Token Prediction" in result
     results = json.loads(result)
     assert results
     assert "score" not in str(results)

academia_mcp-1.1.4/academia_mcp/tools/bitflip.py DELETED Viewed

@@ -1,193 +0,0 @@
-# https://arxiv.org/abs/2504.12976
-# https://web.stanford.edu/class/cs197c/slides/02-literature-search.pdf
-import json
-import os
-import random
-from typing import List, Dict, Any
-from openai import OpenAI
-from pydantic import BaseModel
-from openai.types.chat import ChatCompletionMessage
-from datasets import load_dataset  # type: ignore
-from academia_mcp.tools.arxiv_download import arxiv_download
-from academia_mcp.utils import extract_json, encode_prompt
-EXTRACT_PROMPT = """
-You are a highly advanced research assistant.
-You specialize in reading scientific papers for hypothesis generation and identifying innovative ideas.
-## Example (BERT in NLP)
-Before you begin, let 's revisit the Bit-Flip concept with an example (BERT in NLP):
-- Bit: Traditional NLP models (RNNs, LSTMs) process text sequentially,
-limiting their ability to understand long-range dependencies and fully capture bidirectional context.
-- Flip: Instead, consider entire sentences at once, allowing context from both directions. This helps capture nuanced relationships among words.
-- Spark: Bidirectional context for NLP.
-## Framework
-A Bit-Flip inverts a commonly held assumption,
-questioning existing constraints or reapplying techniques to new domains/scales.
-The "Bit" is the prevailing belief, and the "Flip" is the counterargument.
-## Guidance for analysis
-1. Bit (Technical Insight):
-- Provide at least two sentences clearly stating the status quo or conventional approach.
-- Highlight the limitation or problem it creates.
-- Include enough detail so it is self-contained and does not rely on additional context from elsewhere.
-2. Flip (Innovation):
-- Provide at least two sentences describing the novel approach or perspective.
-- Explain the method or technique that enables this change.
-- Include enough detail so the Flip is understandable on its own.
-3. Spark (Core Summary):
-- A concise 4-6 word phrase capturing the core idea.
-Now, consider this research abstract:
-{{abstract}}
-Your task:
-Identify the Bit, Flip, and Spark from the abstract in a detailed manner:
-- Bit: at least two sentences, with sufficient detail about the conventional approach and its limitation.
-- Flip: at least two sentences, describing the new approach or perspective with enough detail to understand the main technique.
-- Spark: a concise 4-6 word summary of the core idea.
-Follow these rules:
-- Do not cite the paper itself or its authors.
-- Instead of saying "We/I introduced an idea", just say "An idea was introduced ...".
-Return only the JSON object in this exact format (no extra text):
-{
-    "bit": "Technical limitation or conventional approach, in at least two sentences",
-    "flip": "Innovative approach or solution, in at least two sentences",
-    "spark": "4-6 word summary"
-}
-"""
-IMPROVEMENT_PROMPT = """
-You are a highly advanced research assistant.
-You specialize in hypothesis generation and identifying innovative ideas.
-You are given a Bit, which is a technical limitation or conventional approach of some paper.
-Your task is to propose an improvement idea for the Bit called Flip and summarize it in a Spark.
-Do not propose any human annotations or human-in-the-loop, the idea should be automatically verifiable.
-Try to be as specific as possible.
-{% for example in examples %}
-## Example {{loop.index}}
-- Bit: {{example["bit"]}}
-- Chain of reasoning: {{example["chain_of_reasoning"]}}
-- Flip: {{example["flip"]}}
-- Spark: {{example["spark"]}}
-{% endfor %}
-Now, please propose a chain of reasoning that leads to an improvement idea for this Bit:
-{{bit}}
-Return only the JSON object in this exact format (no extra text):
-{
-    "chain_of_reasoning": "Chain of reasoning that leads to an improvement idea for this Bit. At least 5 sentences.",
-    "flip": "Innovative approach or solution, in at least two sentences",
-    "spark": "4-6 word summary"
-}
-"""
-class ChatMessage(BaseModel):  # type: ignore
-    role: str
-    content: str | List[Dict[str, Any]]
-ChatMessages = List[ChatMessage]
-def extract_bitflip_info(arxiv_id: str) -> str:
-    """
-    Extracts the Bit-Flip information from the arXiv paper.
-    A Bit-Flip is a technique that inverts a commonly held assumption,
-    questioning existing constraints or reapplying techniques to new domains/scales.
-    The "Bit" is the prevailing belief, and the "Flip" is the counterargument.
-    Returns a JSON object in this format:
-    {
-        "bit": "Technical limitation or conventional approach, in at least two sentences",
-        "flip": "Innovative approach or solution, in at least two sentences",
-        "spark": "4-6 word summary of the core idea"
-    }
-    Use `json.loads` to deserialize the result if you want to get specific fields.
-    Args:
-        arxiv_id: The arXiv ID of the paper to extract the Bit-Flip information from.
-    """
-    base_url = os.getenv("BASE_URL", "https://openrouter.ai/api/v1")
-    key = os.getenv("OPENROUTER_API_KEY", "")
-    assert key, "Please set OPENROUTER_API_KEY in the environment variables"
-    model_name = os.getenv("BITFLIP_MODEL_NAME", "deepseek/deepseek-chat-v3-0324")
-    paper = arxiv_download(arxiv_id)
-    abstract = json.loads(paper)["abstract"]
-    prompt = encode_prompt(EXTRACT_PROMPT, abstract=abstract)
-    messages: ChatMessages = [
-        ChatMessage(role="user", content=prompt),
-    ]
-    client = OpenAI(base_url=base_url, api_key=key)
-    response: ChatCompletionMessage = (
-        client.chat.completions.create(
-            model=model_name,
-            messages=messages,
-            temperature=0.0,
-        )
-        .choices[0]
-        .message
-    )
-    assert response.content, "Response content is None"
-    result = extract_json(response.content)
-    return json.dumps(result, ensure_ascii=False)
-def propose_improvement_idea(arxiv_id: str) -> str:
-    """
-    Proposes an improvement idea for the arXiv paper.
-    Returns a JSON object in this format:
-    {
-        "chain_of_reasoning": "Chain of reasoning that leads to an improvement idea.",
-        "flip": "Innovative approach or solution",
-        "spark": "4-6 word summary"
-    }
-    Use `json.loads` to deserialize the result if you want to get specific fields.
-    Args:
-        arxiv_id: The arXiv ID of the paper to propose an improvement idea for.
-    """
-    base_url = os.getenv("BASE_URL", "https://openrouter.ai/api/v1")
-    key = os.getenv("OPENROUTER_API_KEY", "")
-    assert key, "Please set OPENROUTER_API_KEY in the environment variables"
-    model_name = os.getenv("BITFLIP_MODEL_NAME", "deepseek/deepseek-chat-v3-0324")
-    bitflip_info = json.loads(extract_bitflip_info(arxiv_id))
-    bit = bitflip_info["bit"]
-    examples = list(load_dataset("UniverseTBD/hypogen-dr1")["train"])
-    random.shuffle(examples)
-    examples = examples[:4]
-    prompt = encode_prompt(IMPROVEMENT_PROMPT, bit=bit, examples=examples)
-    messages: ChatMessages = [
-        ChatMessage(role="user", content=prompt),
-    ]
-    client = OpenAI(base_url=base_url, api_key=key)
-    response: ChatCompletionMessage = (
-        client.chat.completions.create(
-            model=model_name,
-            messages=messages,
-            temperature=0.0,
-        )
-        .choices[0]
-        .message
-    )
-    assert response.content, "Response content is None"
-    result = extract_json(response.content)
-    return json.dumps(result, ensure_ascii=False)

academia_mcp-1.1.4/tests/test_bitflip.py DELETED Viewed

@@ -1,19 +0,0 @@
-from academia_mcp.tools.bitflip import extract_bitflip_info, propose_improvement_idea
-def test_bitflip_extract_info() -> None:
-    arxiv_id = "2409.06820"
-    result = extract_bitflip_info(arxiv_id)
-    assert result is not None
-    assert "bit" in result
-    assert "flip" in result
-    assert "spark" in result
-def test_bitflip_propose_improvement_idea() -> None:
-    arxiv_id = "2503.07826"
-    result = propose_improvement_idea(arxiv_id)
-    assert result is not None
-    assert "chain_of_reasoning" in result
-    assert "flip" in result
-    assert "spark" in result