PyPI - aiagents4pharma - Versions diffs - 1.30.0__py3-none-any.whl → 1.30.1__py3-none-any.whl - Mend

aiagents4pharma 1.30.0__py3-none-any.whl → 1.30.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (34) hide show

aiagents4pharma/talk2scholars/agents/main_agent.py CHANGED Viewed

@@ -1,11 +1,14 @@
 #!/usr/bin/env python3
 """
-Main agent for the talk2scholars app using ReAct pattern.
+Main agent module for initializing and running the Talk2Scholars application.
-This module implements a hierarchical agent system where a supervisor agent
-routes queries to specialized sub-agents. It follows the LangGraph patterns
-for multi-agent systems and implements proper state management.
+This module sets up the hierarchical agent system using LangGraph and integrates
+various sub-agents for handling different tasks such as semantic scholar, zotero,
+PDF processing, and paper downloading.
+Functions:
+- get_app: Initializes and returns the LangGraph-based hierarchical agent system.
 """
 import logging
@@ -16,6 +19,8 @@ from langchain_core.language_models.chat_models import BaseChatModel
 from langgraph.checkpoint.memory import MemorySaver
 from ..agents.s2_agent import get_app as get_app_s2
 from ..agents.zotero_agent import get_app as get_app_zotero
+from ..agents.pdf_agent import get_app as get_app_pdf
+from ..agents.paper_download_agent import get_app as get_app_paper_download
 from ..state.state_talk2scholars import Talk2Scholars
 # Initialize logger
@@ -43,12 +48,13 @@ def get_app(uniq_id, llm_model: BaseChatModel):
         >>> app = get_app("thread_123")
         >>> result = app.invoke(initial_state)
     """
-    if llm_model.model_name == "gpt-4o-mini":
-        llm_model = ChatOpenAI(
-            model="gpt-4o-mini",
-            temperature=0,
-            model_kwargs={"parallel_tool_calls": False},
-        )
+    if hasattr(llm_model, "model_name"):
+        if llm_model.model_name == "gpt-4o-mini":
+            llm_model = ChatOpenAI(
+                model="gpt-4o-mini",
+                temperature=0,
+                model_kwargs={"parallel_tool_calls": False},
+            )
     # Load hydra configuration
     logger.log(logging.INFO, "Launching Talk2Scholars with thread_id %s", uniq_id)
     with hydra.initialize(version_base=None, config_path="../configs/"):
@@ -62,6 +68,8 @@ def get_app(uniq_id, llm_model: BaseChatModel):
         [
             get_app_s2(uniq_id, llm_model),  # semantic scholar
             get_app_zotero(uniq_id, llm_model),  # zotero
+            get_app_pdf(uniq_id, llm_model),  # pdf
+            get_app_paper_download(uniq_id, llm_model),  # paper download
         ],
         model=llm_model,
         state_schema=Talk2Scholars,

aiagents4pharma/talk2scholars/agents/paper_download_agent.py CHANGED Viewed

@@ -20,6 +20,7 @@ from ..tools.s2.query_results import query_results
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
 def get_app(uniq_id, llm_model: BaseChatModel):
     """
     Initializes and returns the LangGraph application for the Talk2Scholars paper download agent.
@@ -39,14 +40,12 @@ def get_app(uniq_id, llm_model: BaseChatModel):
     with hydra.initialize(version_base=None, config_path="../configs"):
         cfg = hydra.compose(
             config_name="config",
-            overrides=["agents/talk2scholars/paper_download_agent=default"]
+            overrides=["agents/talk2scholars/paper_download_agent=default"],
         )
         cfg = cfg.agents.talk2scholars.paper_download_agent
     # Define tools properly
-    tools = ToolNode(
-    [download_arxiv_paper, query_results]
-    )
+    tools = ToolNode([download_arxiv_paper, query_results])
     # Define the model
     logger.info("Using OpenAI model %s", llm_model)
@@ -54,7 +53,7 @@ def get_app(uniq_id, llm_model: BaseChatModel):
         llm_model,
         tools=tools,
         state_schema=Talk2Scholars,
-        prompt=cfg.prompt,
+        prompt=cfg.paper_download_agent,
         checkpointer=MemorySaver(),
     )
@@ -79,7 +78,7 @@ def get_app(uniq_id, llm_model: BaseChatModel):
     checkpointer = MemorySaver()
     # Compile the graph
-    app = workflow.compile(checkpointer=checkpointer)
+    app = workflow.compile(checkpointer=checkpointer, name="agent_paper_download")
     # Logging the information and returning the app
     logger.info("Compiled the graph")

aiagents4pharma/talk2scholars/agents/pdf_agent.py CHANGED Viewed

@@ -26,10 +26,7 @@ logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
-def get_app(
-    uniq_id,
-    llm_model: BaseChatModel
-):
+def get_app(uniq_id, llm_model: BaseChatModel):
     """
     Initializes and returns the LangGraph application for the PDF agent.
@@ -40,7 +37,7 @@ def get_app(
     Args:
         uniq_id (str): A unique identifier for the current conversation session or thread.
-        llm_model (BaseChatModel, optional): The language model instance to be used.
+        llm_model (BaseChatModel, optional): The language model instance to be used.
             Defaults to ChatOpenAI(model="gpt-4o-mini", temperature=0).
     Returns:
@@ -71,10 +68,7 @@ def get_app(
             Any: The response generated by the language model after processing the state.
         """
         logger.info("Creating Agent_PDF node with thread_id %s", uniq_id)
-        response = model.invoke(
-            state,
-            {"configurable": {"thread_id": uniq_id}}
-        )
+        response = model.invoke(state, {"configurable": {"thread_id": uniq_id}})
         return response
     # Define the tool node that includes the PDF QnA tool.
@@ -100,7 +94,7 @@ def get_app(
     checkpointer = MemorySaver()
     # Compile the graph into a runnable app.
-    app = workflow.compile(checkpointer=checkpointer)
+    app = workflow.compile(checkpointer=checkpointer, name="agent_pdf")
     logger.info("Compiled the PDF agent graph.")
     return app

aiagents4pharma/talk2scholars/configs/agents/talk2scholars/main_agent/default.yaml CHANGED Viewed

@@ -1,13 +1,22 @@
 _target_: agents.main_agent.get_app
 temperature: 0
 system_prompt: >
-  You are the Talk2Scholars agent coordinating academic paper discovery and analysis.
+  You are Talk2Scholars agent coordinating academic paper discovery
+  and analysis with help of the following agents:
+   1. Agent S2: This agent can be used to search and recommend papers
+      from Semantic Scholar. Use this agent when the user asks for
+      general paper/article searches and recommendations, or to retrieve information
+      from the last displayed results table or query abstract of last
+      displayed results.
+   2. Agent Zotero: This agent can be used to retrieve, display, and query
+      papers/articles from the Zotero library. Use this agent only when the user
+      explicitly asks for papers from Zotero. This tool can also be used to
+      save papers in the zotero library.
+   3. Agent PaperFetch: This agent can be used to download papers/articles
+      from ArXiv.
+   4. Agent PDFQuery: This agent can be used to query contents of an
+      uploaded or downloaded PDF/paper/article.
-  You have access to the following agents:
-  1. S2_agent: This agent can be used to search and recommend papers
-     from Semantic Scholar. Use this agent when the user asks for
-     general paper searches and recommendations.
-  2. Zotero_agent: This agent can be used to retrieve, display, and query
-     papers from the Zotero library. Use this agent only when the user
-     explicitly asks for papers from Zotero. This tool can also be used to
-     save papers in under collections in the zotero library
+   Your final response should be a one sentence summary of the information
+   retrieved from the agents above. Do not repeat the information already
+   displayed to the user in the response of the agents.

aiagents4pharma/talk2scholars/configs/agents/talk2scholars/s2_agent/default.yaml CHANGED Viewed

@@ -15,5 +15,5 @@ s2_agent: >
   1. When user requests papers, use search/recommendation tools to find papers
   2. Use `display_results` tool to display the response from the search/recommendation tools
   3. Use `query_results` tool to query over the selected paper only when the user asks to
-  4. When the user wants recommendations, you can get the "paper_id" using `query_results` tool in the "last_displayed_results" key, then
-     pass the "paper_id" to `search`, `single_paper_rec` or `multi_paper_rec` tools depending on the user's query. Do not use "arxiv_id"
+  4. When the user wants recommendations, you can get the "semantic_scholar_paper_id" using `query_results` tool in the "last_displayed_results" key, then
+     pass the "semantic_scholar_paper_id" to `search`, `single_paper_rec` or `multi_paper_rec` tools depending on the user's query. Do not use "arxiv_id"

aiagents4pharma/talk2scholars/configs/app/frontend/default.yaml CHANGED Viewed

@@ -8,6 +8,7 @@ page:
 llms:
   available_models:
     - "OpenAI/gpt-4o-mini"
+    - "NVIDIA/llama-3.3-70b-instruct"
 # # Chat UI configuration
 # chat:
 #   assistant_avatar: "🤖"

aiagents4pharma/talk2scholars/configs/tools/multi_paper_recommendation/default.yaml CHANGED Viewed

@@ -6,10 +6,15 @@ api_fields:
   - "title"
   - "abstract"
   - "year"
-  - "authors"
+  - "authors.name"
+  - "authors.authorId"
   - "citationCount"
   - "url"
   - "externalIds"
+  - "venue"
+  - "publicationVenue" # Full object, instead of specific subfields
+  - "journal" # Full object, instead of specific subfields
+  - "publicationDate"
 # Commented fields that could be added later if needed
 # Default headers and params

aiagents4pharma/talk2scholars/configs/tools/search/default.yaml CHANGED Viewed

@@ -6,10 +6,16 @@ api_fields:
   - "title"
   - "abstract"
   - "year"
-  - "authors"
+  - "authors.name"
+  - "authors.authorId"
   - "citationCount"
   - "url"
   - "externalIds"
+  - "venue"
+  - "publicationVenue" # Full object, instead of specific subfields
+  - "journal" # Full object, instead of specific subfields
+  - "publicationDate"
 # Commented fields that could be added later if needed
 #  - "publicationTypes"
 #  - "openAccessPdf"

aiagents4pharma/talk2scholars/configs/tools/single_paper_recommendation/default.yaml CHANGED Viewed

@@ -6,10 +6,15 @@ api_fields:
   - "title"
   - "abstract"
   - "year"
-  - "authors"
+  - "authors.name"
+  - "authors.authorId"
   - "citationCount"
   - "url"
   - "externalIds"
+  - "venue"
+  - "publicationVenue" # Full object, instead of specific subfields
+  - "journal" # Full object, instead of specific subfields
+  - "publicationDate"
 # Commented fields that could be added later if needed
 #  - "publicationTypes"
 #  - "openAccessPdf"

aiagents4pharma/talk2scholars/configs/tools/zotero_read/default.yaml CHANGED Viewed

@@ -53,4 +53,4 @@ zotero:
       "Web Page",
     ]
-  filter_excluded_types: ["attachment", "note", "annotation"]
+  # filter_excluded_types: ["attachment", "note", "annotation"]

aiagents4pharma/talk2scholars/state/state_talk2scholars.py CHANGED Viewed

@@ -9,6 +9,7 @@ across agent interactions.
 import logging
 from typing import Annotated, Any, Dict
 from langchain_core.language_models import BaseChatModel
+from langchain_core.embeddings import Embeddings
 from langgraph.prebuilt.chat_agent_executor import AgentState
 # Configure logging
@@ -54,6 +55,8 @@ class Talk2Scholars(AgentState):
         multi_papers (Dict[str, Any]): Stores multiple recommended papers from various sources.
         zotero_read (Dict[str, Any]): Stores the papers retrieved from Zotero.
         llm_model (BaseChatModel): The language model instance used for generating responses.
+        text_embedding_model (Embeddings): The text embedding model used for
+        similarity calculations.
     """
     # Agent state fields
@@ -63,4 +66,4 @@ class Talk2Scholars(AgentState):
     pdf_data: Annotated[Dict[str, Any], replace_dict]
     zotero_read: Annotated[Dict[str, Any], replace_dict]
     llm_model: BaseChatModel
-    pdf_data: Annotated[Dict[str, Any], replace_dict]
+    text_embedding_model: Embeddings

aiagents4pharma/talk2scholars/tests/test_llm_main_integration.py CHANGED Viewed

@@ -1,58 +1,89 @@
 """
 Integration tests for talk2scholars system with OpenAI.
+This test triggers all sub-agents by sending a conversation that covers:
+- Searching Semantic Scholar (S2 agent)
+- Retrieving Zotero results (Zotero agent)
+- Querying PDF content (PDF agent)
+- Downloading paper details from arXiv (Paper Download agent)
 """
-import os
-import pytest
-import hydra
-from langchain_openai import ChatOpenAI
-from langchain_core.messages import HumanMessage, AIMessage
-from ..agents.main_agent import get_app
-from ..state.state_talk2scholars import Talk2Scholars
+# This will be covered in the next pr.
-# pylint: disable=redefined-outer-name
-@pytest.mark.skipif(
-    not os.getenv("OPENAI_API_KEY"), reason="Requires OpenAI API key to run"
-)
-def test_main_agent_real_llm():
-    """
-    Test that the main agent invokes S2 agent correctly
-    and updates the state with real LLM execution.
-    """
-    # Load Hydra Configuration EXACTLY like in main_agent.py
-    with hydra.initialize(version_base=None, config_path="../configs"):
-        cfg = hydra.compose(
-            config_name="config", overrides=["agents/talk2scholars/main_agent=default"]
-        )
-    hydra_cfg = cfg.agents.talk2scholars.main_agent
-    assert hydra_cfg is not None, "Hydra config failed to load"
-    # Use the real OpenAI API (ensure env variable is set)
-    llm = ChatOpenAI(model="gpt-4o-mini", temperature=hydra_cfg.temperature)
-    # Initialize main agent workflow (WITH real Hydra config)
-    thread_id = "test_thread"
-    app = get_app(thread_id, llm)
-    # Provide an actual user query
-    initial_state = Talk2Scholars(
-        messages=[HumanMessage(content="Find AI papers on transformers")]
-    )
-    # Invoke the agent (triggers supervisor → s2_agent)
-    result = app.invoke(
-        initial_state,
-        {"configurable": {"config_id": thread_id, "thread_id": thread_id}},
-    )
-    # Assert that the supervisor routed correctly
-    assert "messages" in result, "Expected messages in response"
-    # Fix: Accept AIMessage as a valid response type
-    assert isinstance(
-        result["messages"][-1], (HumanMessage, AIMessage, str)
-    ), "Last message should be a valid response"
+#
+# import os
+# import pytest
+# import hydra
+# from langchain_openai import ChatOpenAI
+# from langchain_core.messages import HumanMessage, AIMessage
+# from ..agents.main_agent import get_app
+# from ..state.state_talk2scholars import Talk2Scholars
+#
+# # pylint: disable=redefined-outer-name,too-few-public-methods
+#
+#
+# @pytest.mark.skipif(
+#     not os.getenv("OPENAI_API_KEY"), reason="Requires OpenAI API key to run"
+# )
+# def test_main_agent_real_llm():
+#     """
+#     Integration test for the Talk2Scholars system using a real OpenAI LLM.
+#     This test verifies that the supervisor correctly routes to all sub-agents by
+#     providing a conversation with queries intended to trigger each agent.
+#     """
+#     # Load Hydra configuration EXACTLY like in main_agent.py
+#     with hydra.initialize(version_base=None, config_path="../configs"):
+#         cfg = hydra.compose(
+#             config_name="config", overrides=["agents/talk2scholars/main_agent=default"]
+#         )
+#     hydra_cfg = cfg.agents.talk2scholars.main_agent
+#     assert hydra_cfg is not None, "Hydra config failed to load"
+#
+#     # Use the real OpenAI API (ensure OPENAI_API_KEY is set in environment)
+#     llm = ChatOpenAI(model="gpt-4o-mini", temperature=hydra_cfg.temperature)
+#
+#     # Initialize the main agent workflow (with real Hydra config)
+#     thread_id = "test_thread"
+#     app = get_app(thread_id, llm)
+#
+#     # Provide a multi-turn conversation intended to trigger all sub-agents:
+#     # - S2 agent: "Search Semantic Scholar for AI papers on transformers."
+#     # - Zotero agent: "Retrieve Zotero results for these papers."
+#     # - PDF agent: "Analyze the attached PDF and summarize its key findings."
+#     # - Paper Download agent: "Download the paper details from arXiv."
+#     initial_state = Talk2Scholars(
+#         messages=[
+#             HumanMessage(
+#                 content="Search Semantic Scholar for AI papers on transformers."
+#             ),
+#             HumanMessage(content="Also, retrieve Zotero results for these papers."),
+#             HumanMessage(
+#                 content="I have attached a PDF; analyze it and tell me the key findings."
+#             ),
+#             HumanMessage(content="Finally, download the paper from arXiv."),
+#         ]
+#     )
+#
+#     # Invoke the agent (which routes to the appropriate sub-agents)
+#     result = app.invoke(
+#         initial_state,
+#         {"configurable": {"config_id": thread_id, "thread_id": thread_id}},
+#     )
+#
+#     # Assert that the result contains messages and that the final message is valid.
+#     assert "messages" in result, "Expected 'messages' in the response"
+#     last_message = result["messages"][-1]
+#     assert isinstance(
+#         last_message, (HumanMessage, AIMessage, str)
+#     ), "Last message should be a valid response type"
+#
+#     # Concatenate message texts (if available) to perform keyword checks.
+#     output_text = " ".join(
+#         msg.content if hasattr(msg, "content") else str(msg)
+#         for msg in result["messages"]
+#     ).lower()
+#
+#     # Check for keywords that suggest each sub-agent was invoked.
+#     for keyword in ["semantic scholar", "zotero", "pdf", "arxiv"]:
+#         assert (
+#             keyword in output_text
+#         ), f"Expected keyword '{keyword}' in the output response"

aiagents4pharma/talk2scholars/tests/test_main_agent.py CHANGED Viewed

@@ -65,6 +65,13 @@ def dummy_get_app_zotero(uniq_id, llm_model):
     return DummyWorkflow(supervisor_args={"agent": "zotero", "uniq_id": uniq_id})
+def dummy_get_app_pdf(uniq_id, llm_model):
+    """Return a DummyWorkflow for the PDF agent."""
+    dummy_get_app_pdf.called_uniq_id = uniq_id
+    dummy_get_app_pdf.called_llm_model = llm_model
+    return DummyWorkflow(supervisor_args={"agent": "pdf", "uniq_id": uniq_id})
 def dummy_create_supervisor(apps, model, state_schema, **kwargs):
     """Return a DummyWorkflow for the supervisor."""
     dummy_create_supervisor.called_kwargs = kwargs
@@ -136,6 +143,15 @@ def patch_hydra(monkeypatch):
     )
+def dummy_get_app_paper_download(uniq_id, llm_model):
+    """Return a DummyWorkflow for the paper download agent."""
+    dummy_get_app_paper_download.called_uniq_id = uniq_id
+    dummy_get_app_paper_download.called_llm_model = llm_model
+    return DummyWorkflow(
+        supervisor_args={"agent": "paper_download", "uniq_id": uniq_id}
+    )
 @pytest.fixture(autouse=True)
 def patch_sub_agents_and_supervisor(monkeypatch):
     """Patch the sub-agents and supervisor creation functions."""
@@ -146,6 +162,14 @@ def patch_sub_agents_and_supervisor(monkeypatch):
         "aiagents4pharma.talk2scholars.agents.main_agent.get_app_zotero",
         dummy_get_app_zotero,
     )
+    monkeypatch.setattr(
+        "aiagents4pharma.talk2scholars.agents.main_agent.get_app_pdf",
+        dummy_get_app_pdf,
+    )
+    monkeypatch.setattr(
+        "aiagents4pharma.talk2scholars.agents.main_agent.get_app_paper_download",
+        dummy_get_app_paper_download,
+    )
     monkeypatch.setattr(
         "aiagents4pharma.talk2scholars.agents.main_agent.create_supervisor",
         dummy_create_supervisor,

aiagents4pharma/talk2scholars/tests/test_question_and_answer_tool.py CHANGED Viewed

@@ -3,7 +3,6 @@ Unit tests for question_and_answer tool functionality.
 """
 from langchain.docstore.document import Document
 from ..tools.pdf import question_and_answer
 from ..tools.pdf.question_and_answer import (
     extract_text_from_pdf_data,
@@ -11,6 +10,8 @@ from ..tools.pdf.question_and_answer import (
     generate_answer,
 )
+# pylint: disable=redefined-outer-name,too-few-public-methods
 def test_extract_text_from_pdf_data():
     """
@@ -46,14 +47,14 @@ DUMMY_PDF_BYTES = (
 )
-def fake_generate_answer(question, pdf_bytes, _llm_model):
+def fake_generate_answer2(question, pdf_url, _text_embedding_model):
     """
-    Fake generate_answer function to bypass external dependencies.
+    Fake generate_answer2 function to bypass external dependencies.
     """
     return {
         "answer": "Mock answer",
         "question": question,
-        "pdf_bytes_length": len(pdf_bytes),
+        "pdf_url": pdf_url,
     }
@@ -61,30 +62,31 @@ def test_question_and_answer_tool_success(monkeypatch):
     """
     Test that question_and_answer_tool returns the expected result on success.
     """
-    monkeypatch.setattr(
-        question_and_answer, "generate_answer", fake_generate_answer
-    )
-    # Create a valid state with pdf_data containing both pdf_object and pdf_url,
-    # and include a dummy llm_model.
+    # Patch generate_answer2 because the tool calls that.
+    monkeypatch.setattr(question_and_answer, "generate_answer2", fake_generate_answer2)
+    dummy_text_embedding_model = object()  # Provide a dummy text embedding model.
+    # Create a valid state with pdf_data and include dummy llm_model and text_embedding_model.
     state = {
         "pdf_data": {"pdf_object": DUMMY_PDF_BYTES, "pdf_url": "http://dummy.url"},
         "llm_model": object(),  # Provide a dummy LLM model instance.
+        "text_embedding_model": dummy_text_embedding_model,
     }
     question = "What is in the PDF?"
-    # Call the underlying function directly via .func to bypass the StructuredTool wrapper.
     result = question_and_answer_tool.func(
         question=question, tool_call_id="test_call_id", state=state
     )
     assert result["answer"] == "Mock answer"
     assert result["question"] == question
-    assert result["pdf_bytes_length"] == len(DUMMY_PDF_BYTES)
+    assert result["pdf_url"] == "http://dummy.url"
 def test_question_and_answer_tool_no_pdf_data():
     """
     Test that an error is returned if the state lacks the 'pdf_data' key.
     """
-    state = {}  # pdf_data key is missing.
+    state = {
+        "text_embedding_model": object(),  # Added to avoid KeyError.
+    }
     question = "Any question?"
     result = question_and_answer_tool.func(
         question=question, tool_call_id="test_call_id", state=state
@@ -97,7 +99,11 @@ def test_question_and_answer_tool_no_pdf_object():
     """
     Test that an error is returned if the pdf_object is missing within pdf_data.
     """
-    state = {"pdf_data": {"pdf_object": None}}
+    state = {
+        "pdf_data": {"pdf_object": None},
+        "text_embedding_model": object(),  # Added to avoid KeyError.
+        "llm_model": object(),  # Dummy LLM model.
+    }
     question = "Any question?"
     result = question_and_answer_tool.func(
         question=question, tool_call_id="test_call_id", state=state
@@ -114,8 +120,9 @@ def test_question_and_answer_tool_no_llm_model():
     Test that an error is returned if the LLM model is missing in the state.
     """
     state = {
-        "pdf_data": {"pdf_object": DUMMY_PDF_BYTES, "pdf_url": "http://dummy.url"}
-        # Note: llm_model is intentionally omitted.
+        "pdf_data": {"pdf_object": DUMMY_PDF_BYTES, "pdf_url": "http://dummy.url"},
+        "text_embedding_model": object(),  # Added to avoid KeyError.
+        # llm_model is intentionally omitted.
     }
     question = "What is in the PDF?"
     result = question_and_answer_tool.func(
@@ -124,6 +131,57 @@ def test_question_and_answer_tool_no_llm_model():
     assert result == {"error": "No LLM model found in state."}
+def test_generate_answer2_actual(monkeypatch):
+    """
+    Test the actual behavior of generate_answer2 using fake dependencies
+    to exercise its internal logic.
+    """
+    # Create a fake PyPDFLoader that does not perform a network call.
+    class FakePyPDFLoader:
+        """class to fake PyPDFLoader"""
+        def __init__(self, file_path, headers=None):
+            """Initialize the fake PyPDFLoader."""
+            self.file_path = file_path
+            self.headers = headers
+        def lazy_load(self):
+            """Return a list with one fake Document."""
+            # Return a list with one fake Document.
+            return [Document(page_content="Answer for Test question?")]
+    monkeypatch.setattr(question_and_answer, "PyPDFLoader", FakePyPDFLoader)
+    # Create a fake vector store that returns a controlled result for similarity_search.
+    class FakeVectorStore:
+        """Fake vector store for similarity search."""
+        def similarity_search(self, query):
+            """Return a list with one Document containing our expected answer."""
+            # Return a list with one Document containing our expected answer.
+            return [Document(page_content=f"Answer for {query}")]
+    monkeypatch.setattr(
+        question_and_answer.InMemoryVectorStore,
+        "from_documents",
+        lambda docs, emb: FakeVectorStore(),
+    )
+    # Provide a dummy text embedding model.
+    dummy_text_embedding_model = object()
+    question = "Test question?"
+    pdf_url = "http://dummy.pdf"
+    # Call generate_answer2 without triggering an actual network call.
+    result = question_and_answer.generate_answer2(
+        question, pdf_url, dummy_text_embedding_model
+    )
+    # The function should join the page content from the similarity search.
+    expected = "Answer for Test question?"
+    assert result == expected
 def test_generate_answer(monkeypatch):
     """
     Test generate_answer function with controlled monkeypatched dependencies.
@@ -141,12 +199,15 @@ def test_generate_answer(monkeypatch):
         """
         Fake Annoy.from_documents function that returns a fake vector store.
         """
         # pylint: disable=too-few-public-methods, unused-argument
         class FakeVectorStore:
             """Fake vector store for similarity search."""
             def similarity_search(self, _question, k):
                 """Return a list with a single dummy Document."""
                 return [Document(page_content="dummy content")]
         return FakeVectorStore()
     monkeypatch.setattr(
@@ -157,9 +218,11 @@ def test_generate_answer(monkeypatch):
         """
         Fake load_qa_chain function that returns a fake QA chain.
         """
         # pylint: disable=too-few-public-methods, unused-argument
         class FakeChain:
             """Fake QA chain for testing generate_answer."""
             def invoke(self, **kwargs):
                 """
                 Fake invoke method that returns a mock answer.
@@ -169,6 +232,7 @@ def test_generate_answer(monkeypatch):
                     "answer": "real mock answer",
                     "question": input_data.get("question"),
                 }
         return FakeChain()
     monkeypatch.setattr(question_and_answer, "load_qa_chain", fake_load_qa_chain)

aiagents4pharma 1.30.0__py3-none-any.whl → 1.30.1__py3-none-any.whl

aiagents4pharma 1.30.0__py3-none-any.whl → 1.30.1__py3-none-any.whl