PyPI - langroid - Versions diffs - 0.1.249__tar.gz → 0.1.251__tar.gz - Mend

langroid 0.1.249__tar.gz → 0.1.251__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (130) hide show

{langroid-0.1.249 → langroid-0.1.251}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: langroid
-Version: 0.1.249
+Version: 0.1.251
 Summary: Harness LLMs with Multi-Agent Programming
 License: MIT
 Author: Prasad Chalasani
@@ -237,6 +237,8 @@ teacher_task.run()
 <summary> <b>Click to expand</b></summary>
 - **May 2024:**
+  - [Much-Improved Citation](https://github.com/langroid/langroid/issues/477)
+    generation and display when using `DocChatAgent`.
   - `gpt-4o` is now the default LLM throughout; Update tests and examples to work
     with this LLM; use tokenizer corresponding to the LLM.
   - `gemini 1.5 pro` support via `litellm`

{langroid-0.1.249 → langroid-0.1.251}/README.md RENAMED Viewed

@@ -123,6 +123,8 @@ teacher_task.run()
 <summary> <b>Click to expand</b></summary>
 - **May 2024:**
+  - [Much-Improved Citation](https://github.com/langroid/langroid/issues/477)
+    generation and display when using `DocChatAgent`.
   - `gpt-4o` is now the default LLM throughout; Update tests and examples to work
     with this LLM; use tokenizer corresponding to the LLM.
   - `gemini 1.5 pro` support via `litellm`

{langroid-0.1.249 → langroid-0.1.251}/langroid/__init__.py RENAMED Viewed

@@ -41,7 +41,7 @@ from .agent.chat_agent import (
     ChatAgentConfig,
 )
-from .agent.task import Task
+from .agent.task import Task, TaskConfig
 try:
     from .agent.callbacks.chainlit import (
@@ -64,8 +64,11 @@ from .mytypes import (
     Entity,
 )
+from .exceptions import InfiniteLoopException
 __all__ = [
     "mytypes",
+    "exceptions",
     "utils",
     "parsing",
     "prompts",
@@ -82,6 +85,7 @@ __all__ = [
     "ChatDocument",
     "ChatDocMetaData",
     "Task",
+    "TaskConfig",
     "DocMetaData",
     "Document",
     "Entity",
@@ -89,6 +93,7 @@ __all__ = [
     "run_batch_tasks",
     "llm_response_batch",
     "agent_response_batch",
+    "InfiniteLoopException",
 ]
 if chainlit_available:
     __all__.extend(

{langroid-0.1.249 → langroid-0.1.251}/langroid/agent/base.py RENAMED Viewed

@@ -87,6 +87,7 @@ class Agent(ABC):
         self.llm_tools_map: Dict[str, Type[ToolMessage]] = {}
         self.llm_tools_handled: Set[str] = set()
         self.llm_tools_usable: Set[str] = set()
+        self.interactive: bool | None = None
         self.total_llm_token_cost = 0.0
         self.total_llm_token_usage = 0
         self.token_stats_str = ""
@@ -223,8 +224,8 @@ class Agent(ABC):
         ):
             setattr(self, tool, lambda obj: obj.response(self))
-        if hasattr(message_class, "handle_message_fallback") and inspect.isfunction(
-            message_class.handle_message_fallback
+        if hasattr(message_class, "handle_message_fallback") and (
+            inspect.isfunction(message_class.handle_message_fallback)
         ):
             setattr(
                 self,
@@ -279,9 +280,9 @@ class Agent(ABC):
         ]
         return "\n\n".join(sample_convo)
-    def agent_response_template(self) -> ChatDocument:
+    def create_agent_response(self, content: str | None = None) -> ChatDocument:
         """Template for agent_response."""
-        return self._response_template(Entity.AGENT)
+        return self._response_template(Entity.AGENT, content)
     async def agent_response_async(
         self,
@@ -342,19 +343,19 @@ class Agent(ABC):
             ),
         )
-    def _response_template(self, e: Entity) -> ChatDocument:
+    def _response_template(self, e: Entity, content: str | None = None) -> ChatDocument:
         """Template for response from entity `e`."""
         return ChatDocument(
-            content="",
+            content=content or "",
             tool_messages=[],
             metadata=ChatDocMetaData(
                 source=e, sender=e, sender_name=self.config.name, tool_ids=[]
             ),
         )
-    def user_response_template(self) -> ChatDocument:
+    def create_user_response(self, content: str | None = None) -> ChatDocument:
         """Template for user_response."""
-        return self._response_template(Entity.USER)
+        return self._response_template(Entity.USER, content)
     async def user_response_async(
         self,
@@ -377,11 +378,21 @@ class Agent(ABC):
             (str) User response, packaged as a ChatDocument
         """
-        if self.default_human_response is not None:
+        # When msg explicitly addressed to user, this means an actual human response
+        # is being sought.
+        need_human_response = (
+            isinstance(msg, ChatDocument) and msg.metadata.recipient == Entity.USER
+        )
+        interactive = (
+            self.interactive if self.interactive is not None else settings.interactive
+        )
+        if self.default_human_response is not None and not need_human_response:
             # useful for automated testing
             user_msg = self.default_human_response
-        elif not settings.interactive:
-            user_msg = ""
+        elif not interactive and not need_human_response:
+            return None
         else:
             if self.callbacks.get_user_response is not None:
                 # ask user with empty prompt: no need for prompt
@@ -440,9 +451,9 @@ class Agent(ABC):
         return True
-    def llm_response_template(self) -> ChatDocument:
+    def create_llm_response(self, content: str | None = None) -> ChatDocument:
         """Template for llm_response."""
-        return self._response_template(Entity.LLM)
+        return self._response_template(Entity.LLM, content)
     @no_type_check
     async def llm_response_async(
@@ -736,6 +747,24 @@ class Agent(ABC):
     def _get_one_tool_message(self, json_str: str) -> Optional[ToolMessage]:
         json_data = json.loads(json_str)
+        # check if the json_data contains a "properties" field
+        # which further contains the actual tool-call
+        # (some weak LLMs do this). E.g. gpt-4o sometimes generates this:
+        # TOOL: {
+        #     "type": "object",
+        #     "properties": {
+        #         "request": "square",
+        #         "number": 9
+        #     },
+        #     "required": [
+        #         "number",
+        #         "request"
+        #     ]
+        # }
+        properties = json_data.get("properties")
+        if properties is not None:
+            json_data = properties
         request = json_data.get("request")
         if (
             request is None

{langroid-0.1.249 → langroid-0.1.251}/langroid/agent/chat_agent.py RENAMED Viewed

@@ -273,10 +273,11 @@ class ChatAgent(Agent):
                 example = "" if self.config.use_tools else (msg_cls.usage_example())
                 if example != "":
                     example = "EXAMPLE: " + example
+                class_instructions = msg_cls.instructions()
                 guidance = (
                     ""
-                    if msg_cls.instructions() == ""
-                    else ("GUIDANCE: " + msg_cls.instructions())
+                    if class_instructions == ""
+                    else ("GUIDANCE: " + class_instructions)
                 )
                 if guidance == "" and example == "":
                     continue
@@ -783,23 +784,20 @@ class ChatAgent(Agent):
         if self.llm is None:
             return
         if not citation_only and (not self.llm.get_stream() or is_cached):
-            # We expect response to be LLMResponse in this context
-            if not isinstance(response, LLMResponse):
-                raise ValueError(
-                    "Expected response to be LLMResponse, but got "
-                    f"{type(response)} instead."
-                )
             # We would have already displayed the msg "live" ONLY if
             # streaming was enabled, AND we did not find a cached response.
             # If we are here, it means the response has not yet been displayed.
             cached = f"[red]{self.indent}(cached)[/red]" if is_cached else ""
             if not settings.quiet:
+                chat_doc = (
+                    response
+                    if isinstance(response, ChatDocument)
+                    else ChatDocument.from_LLMResponse(response, displayed=True)
+                )
                 print(cached + "[green]" + escape(str(response)))
                 self.callbacks.show_llm_response(
                     content=str(response),
-                    is_tool=self.has_tool_message_attempt(
-                        ChatDocument.from_LLMResponse(response, displayed=True),
-                    ),
+                    is_tool=self.has_tool_message_attempt(chat_doc),
                     cached=is_cached,
                 )
         if isinstance(response, LLMResponse):

{langroid-0.1.249 → langroid-0.1.251}/langroid/agent/special/doc_chat_agent.py RENAMED Viewed

@@ -14,7 +14,6 @@ pip install "langroid[hf-embeddings]"
 """
 import logging
-import re
 from functools import cache
 from typing import Any, Dict, List, Optional, Set, Tuple, no_type_check
@@ -31,6 +30,7 @@ from langroid.agent.special.relevance_extractor_agent import (
     RelevanceExtractorAgentConfig,
 )
 from langroid.agent.task import Task
+from langroid.agent.tools.retrieval_tool import RetrievalTool
 from langroid.embedding_models.models import OpenAIEmbeddingsConfig
 from langroid.language_models.base import StreamingIfAllowed
 from langroid.language_models.openai_gpt import OpenAIChatModel, OpenAIGPTConfig
@@ -82,21 +82,47 @@ except ImportError:
     pass
-def extract_citations(text: str) -> List[int]:
-    # Find all patterns that match [[<numbers>]]
-    matches = re.findall(r"\[\[([\d,]+)\]\]", text)
+def extract_markdown_references(md_string: str) -> list[int]:
+    """
+    Extracts markdown references (e.g., [^1], [^2]) from a string and returns
+    them as a sorted list of integers.
+    Args:
+        md_string (str): The markdown string containing references.
+    Returns:
+        list[int]: A sorted list of unique integers from the markdown references.
+    """
+    import re
+    # Regex to find all occurrences of [^<number>]
+    matches = re.findall(r"\[\^(\d+)\]", md_string)
+    # Convert matches to integers, remove duplicates with set, and sort
+    return sorted(set(int(match) for match in matches))
-    # Initialize a set to hold distinct citation numbers
-    citations: Set[int] = set()
-    # Process each match
-    for match in matches:
-        # Split numbers by comma and convert to integers
-        numbers = match.split(",")
-        citations.update(int(number) for number in numbers)
+def format_footnote_text(content: str, width: int = 80) -> str:
+    """
+    Formats the content part of a footnote (i.e. not the first line that
+    appears right after the reference [^4])
+    It wraps the text so that no line is longer than the specified width and indents
+    lines as necessary for markdown footnotes.
+    Args:
+        content (str): The text of the footnote to be formatted.
+        width (int): Maximum width of the text lines.
-    # Return a sorted list of unique citations
-    return sorted(citations)
+    Returns:
+        str: Properly formatted markdown footnote text.
+    """
+    import textwrap
+    # Wrap the text to the specified width
+    wrapped_lines = textwrap.wrap(content, width)
+    if len(wrapped_lines) == 0:
+        return ""
+    indent = "    "  # Indentation for markdown footnotes
+    return indent + ("\n" + indent).join(wrapped_lines)
 class DocChatAgentConfig(ChatAgentConfig):
@@ -438,6 +464,13 @@ class DocChatAgent(ChatAgent):
         self.setup_documents(docs, filter=self.config.filter)
         return len(docs)
+    def retrieval_tool(self, msg: RetrievalTool) -> str:
+        """Handle the RetrievalTool message"""
+        self.config.retrieve_only = True
+        self.config.parsing.n_similar_docs = msg.num_results
+        content_doc = self.answer_from_docs(msg.query)
+        return content_doc.content
     @staticmethod
     def document_compatible_dataframe(
         df: pd.DataFrame,
@@ -808,14 +841,15 @@ class DocChatAgent(ChatAgent):
         final_answer = answer_doc.content.strip()
         show_if_debug(final_answer, "SUMMARIZE_RESPONSE= ")
-        citations = extract_citations(final_answer)
+        citations = extract_markdown_references(final_answer)
         citations_str = ""
         if len(citations) > 0:
             # append [i] source, content for each citation
             citations_str = "\n".join(
                 [
-                    f"[{c}] {passages[c-1].metadata.source}\n{passages[c-1].content}"
+                    f"[^{c}] {passages[c-1].metadata.source}"
+                    f"\n{format_footnote_text(passages[c-1].content)}"
                     for c in citations
                 ]
             )

{langroid-0.1.249 → langroid-0.1.251}/langroid/agent/special/lance_rag/critic_agent.py RENAMED Viewed

@@ -70,13 +70,19 @@ class QueryPlanCriticConfig(LanceQueryPlanAgentConfig):
       plan execution FAILED, and your feedback should say INVALID along
       with the ERROR message, `suggested_fix` that aims to help the assistant
       fix the problem (or simply equals "address the the error shown in feedback")
+    - Ask yourself, is the ANSWER in the expected form, e.g.
+        if the question is asking for the name of an ENTITY with max SIZE,
+        then the answer should be the ENTITY name, NOT the SIZE!!
     - If the ANSWER is in the expected form, then the QUERY PLAN is likely VALID,
       and your feedback should say VALID, with empty `suggested_fix`.
+      ===> HOWEVER!!! Watch out for a spurious correct-looking answer, for EXAMPLE:
+      the query was to find the ENTITY with a maximum SIZE,
+      but the dataframe calculation is find the SIZE, NOT the ENTITY!!
     - If the ANSWER is {NO_ANSWER} or of the wrong form,
       then try to DIAGNOSE the problem IN THE FOLLOWING ORDER:
       - DATAFRAME CALCULATION -- is it doing the right thing?
         Is it finding the Index of a row instead of the value in a column?
-        Or another example: mmaybe it is finding the maximum population
+        Or another example: maybe it is finding the maximum population
            rather than the CITY with the maximum population?
         If you notice a problem with the DATAFRAME CALCULATION, then
         ONLY SUBMIT FEEDBACK ON THE DATAFRAME CALCULATION, and DO NOT

{langroid-0.1.249 → langroid-0.1.251}/langroid/agent/special/lance_rag/query_planner_agent.py RENAMED Viewed

@@ -195,7 +195,7 @@ class LanceQueryPlanAgent(ChatAgent):
                 plan=self.curr_query_plan,
                 answer=self.result,
             )
-            response_tmpl = self.agent_response_template()
+            response_tmpl = self.create_agent_response()
             # ... add the QueryPlanAnswerTool to the response
             # (Notice how the Agent is directly sending a tool, not the LLM)
             response_tmpl.tool_messages = [query_plan_answer_tool]

langroid 0.1.249__tar.gz → 0.1.251__tar.gz

langroid 0.1.249__tar.gz → 0.1.251__tar.gz