PyPI - langroid - Versions diffs - 0.1.229__py3-none-any.whl → 0.1.231__py3-none-any.whl - Mend

langroid 0.1.229__py3-none-any.whl → 0.1.231__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9)

langroid/agent/batch.py CHANGED Viewed

@@ -31,6 +31,7 @@ def run_batch_task_gen(
     turns: int = -1,
     message: Optional[str] = None,
     handle_exceptions: bool = False,
+    max_cost: float = 0.0,
 ) -> list[U]:
     """
     Generate and run copies of a task async/concurrently one per item in `items` list.
@@ -50,6 +51,7 @@ def run_batch_task_gen(
         turns (int): number of turns to run, -1 for infinite
         message (Optional[str]): optionally overrides the console status messages
         handle_exceptions: bool: Whether to replace exceptions with outputs of None
+        max_cost: float: maximum cost to run the task (default 0.0 for unlimited)
     Returns:
         list[Any]: list of final results
@@ -62,7 +64,7 @@ def run_batch_task_gen(
             task_i.agent.llm.set_stream(False)
         task_i.agent.config.show_stats = False
-        result = await task_i.run_async(input, turns=turns)
+        result = await task_i.run_async(input, turns=turns, max_cost=max_cost)
         return result
     async def _do_all(
@@ -120,6 +122,7 @@ def run_batch_tasks(
     sequential: bool = True,
     batch_size: Optional[int] = None,
     turns: int = -1,
+    max_cost: float = 0.0,
 ) -> List[U]:
     """
     Run copies of `task` async/concurrently one per item in `items` list.
@@ -137,6 +140,7 @@ def run_batch_tasks(
         batch_size (Optional[int]): The number of tasks to run at a time,
             if None, unbatched
         turns (int): number of turns to run, -1 for infinite
+        max_cost: float: maximum cost to run the task (default 0.0 for unlimited)
     Returns:
         list[Any]: list of final results
@@ -151,6 +155,7 @@ def run_batch_tasks(
         batch_size,
         turns,
         message,
+        max_cost=max_cost,
     )

langroid/agent/task.py CHANGED Viewed

@@ -170,7 +170,7 @@ class Task:
                 agent.set_system_message(system_message)
             if user_message:
                 agent.set_user_message(user_message)
+        self.max_cost: float = 0
         self.logger: None | RichFileLogger = None
         self.tsv_logger: None | logging.Logger = None
         self.color_log: bool = False if settings.notebook else True
@@ -375,11 +375,13 @@ class Task:
         msg: Optional[str | ChatDocument] = None,
         turns: int = -1,
         caller: None | Task = None,
+        max_cost: float = 0,
     ) -> Optional[ChatDocument]:
         """Synchronous version of `run_async()`.
         See `run_async()` for details."""
         self.task_progress = False
         self.n_stalled_steps = 0
+        self.max_cost = max_cost
         assert (
             msg is None or isinstance(msg, str) or isinstance(msg, ChatDocument)
         ), f"msg arg in Task.run() must be None, str, or ChatDocument, not {type(msg)}"
@@ -418,6 +420,7 @@ class Task:
         msg: Optional[str | ChatDocument] = None,
         turns: int = -1,
         caller: None | Task = None,
+        max_cost: float = 0,
     ) -> Optional[ChatDocument]:
         """
         Loop over `step()` until task is considered done or `turns` is reached.
@@ -434,6 +437,7 @@ class Task:
             turns (int): number of turns to run the task for;
                 default is -1, which means run until task is done.
             caller (Task|None): the calling task, if any
+            max_cost (float): maximum cost allowed for the task (default 0 -> no limit)
         Returns:
             Optional[ChatDocument]: valid result of the task.
@@ -444,6 +448,8 @@ class Task:
         # message can be considered to be from the USER
         # (from the POV of this agent's LLM).
         self.task_progress = False
+        self.n_stalled_steps = 0
+        self.max_cost = max_cost
         if (
             isinstance(msg, ChatDocument)
             and msg.metadata.recipient != ""
@@ -819,6 +825,7 @@ class Task:
                 self.pending_message,
                 turns=actual_turns,
                 caller=self,
+                max_cost=self.max_cost,
             )
             result_str = str(ChatDocument.to_LLMMessage(result))
             maybe_tool = len(extract_top_level_json(result_str)) > 0
@@ -1051,6 +1058,16 @@ class Task:
             )
             return True
+        if self.max_cost > 0 and self.agent.llm is not None:
+            try:
+                if self.agent.llm.tot_tokens_cost()[1] > self.max_cost:
+                    logger.warning(
+                        f"Task {self.name} exceeded max cost {self.max_cost}; exiting."
+                    )
+                    return True
+            except Exception:
+                pass
         return (
             # no valid response from any entity/agent in current turn
             result is None

langroid/language_models/base.py CHANGED Viewed

@@ -449,6 +449,18 @@ class LanguageModel(ABC):
             s += f"{model}: {counter}\n"
         return s
+    @classmethod
+    def tot_tokens_cost(cls) -> Tuple[int, float]:
+        """
+        Return total tokens used and total cost across all models.
+        """
+        total_tokens = 0
+        total_cost = 0.0
+        for counter in cls.usage_cost_dict.values():
+            total_tokens += counter.total_tokens
+            total_cost += counter.cost
+        return total_tokens, total_cost
     def followup_to_standalone(
         self, chat_history: List[Tuple[str, str]], question: str
     ) -> str:

langroid/language_models/openai_gpt.py CHANGED Viewed

@@ -49,7 +49,7 @@ from langroid.language_models.utils import (
     retry_with_exponential_backoff,
 )
 from langroid.utils.configuration import settings
-from langroid.utils.constants import NO_ANSWER, Colors
+from langroid.utils.constants import Colors
 from langroid.utils.system import friendly_error
 logging.getLogger("openai").setLevel(logging.ERROR)
@@ -847,9 +847,9 @@ class OpenAIGPT(LanguageModel):
         try:
             return self._generate(prompt, max_tokens)
         except Exception as e:
-            # capture exceptions not handled by retry, so we don't crash
+            # log and re-raise exception
             logging.error(friendly_error(e, "Error in OpenAIGPT.generate: "))
-            return LLMResponse(message=NO_ANSWER, cached=False)
+            raise e
     def _generate(self, prompt: str, max_tokens: int) -> LLMResponse:
         if self.config.use_chat_for_completion:
@@ -917,9 +917,9 @@ class OpenAIGPT(LanguageModel):
         try:
             return await self._agenerate(prompt, max_tokens)
         except Exception as e:
-            # capture exceptions not handled by retry, so we don't crash
+            # log and re-raise exception
             logging.error(friendly_error(e, "Error in OpenAIGPT.agenerate: "))
-            return LLMResponse(message=NO_ANSWER, cached=False)
+            raise e
     async def _agenerate(self, prompt: str, max_tokens: int) -> LLMResponse:
         # note we typically will not have self.config.stream = True
@@ -1019,9 +1019,9 @@ class OpenAIGPT(LanguageModel):
         try:
             return self._chat(messages, max_tokens, functions, function_call)
         except Exception as e:
-            # capture exceptions not handled by retry, so we don't crash
+            # log and re-raise exception
             logging.error(friendly_error(e, "Error in OpenAIGPT.chat: "))
-            return LLMResponse(message=NO_ANSWER, cached=False)
+            raise e
     async def achat(
         self,
@@ -1072,9 +1072,9 @@ class OpenAIGPT(LanguageModel):
             result = await self._achat(messages, max_tokens, functions, function_call)
             return result
         except Exception as e:
-            # capture exceptions not handled by retry, so we don't crash
+            # log and re-raise exception
             logging.error(friendly_error(e, "Error in OpenAIGPT.achat: "))
-            return LLMResponse(message=NO_ANSWER, cached=False)
+            raise e
     @retry_with_exponential_backoff
     def _chat_completions_with_backoff(self, **kwargs):  # type: ignore

langroid/language_models/utils.py CHANGED Viewed

@@ -62,6 +62,7 @@ def retry_with_exponential_backoff(
                 if num_retries > max_retries:
                     raise Exception(
                         f"Maximum number of retries ({max_retries}) exceeded."
+                        f" Last error: {e}."
                     )
                 # Increment the delay

{langroid-0.1.229.dist-info → langroid-0.1.231.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: langroid
-Version: 0.1.229
+Version: 0.1.231
 Summary: Harness LLMs with Multi-Agent Programming
 License: MIT
 Author: Prasad Chalasani

{langroid-0.1.229.dist-info → langroid-0.1.231.dist-info}/RECORD RENAMED Viewed

@@ -1,7 +1,7 @@
 langroid/__init__.py,sha256=qgY-OqzYSWOc6EytQJN9sH2PwDp1UIzP9lXhrYH6aLU,1645
 langroid/agent/__init__.py,sha256=_D8dxnfdr92ch1CIrUkKjrB5HVvsQdn62b1Fb2kBxV8,785
 langroid/agent/base.py,sha256=jyGFmojrFuOy81lUkNsJlR6mLIOY6kOD20P9dhEcEuw,35059
-langroid/agent/batch.py,sha256=T9dgSPThrmIWxQxqDlGwhHa7yw3XIKE_U30bLMRDpNQ,9481
+langroid/agent/batch.py,sha256=H64Vy0P5-Y1KNftNW7NhM1zLC5d8bFG_AcXC9nji23s,9745
 langroid/agent/callbacks/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 langroid/agent/callbacks/chainlit.py,sha256=aYuJ8M4VDHr5oymoXL2bpThM7p6P9L45fgJf3MLdkWo,20997
 langroid/agent/chat_agent.py,sha256=X5uVMm9qdw3j-FRf4hbN8k8ByaSdtQCTuU8olKE0sbs,38750
@@ -32,7 +32,7 @@ langroid/agent/special/sql/utils/populate_metadata.py,sha256=x2OMKfmIBnJESBG3qKt
 langroid/agent/special/sql/utils/system_message.py,sha256=qKLHkvQWRQodTtPLPxr1GSLUYUFASZU8x-ybV67cB68,1885
 langroid/agent/special/sql/utils/tools.py,sha256=6uB2424SLtmapui9ggcEr0ZTiB6_dL1-JRGgN8RK9Js,1332
 langroid/agent/special/table_chat_agent.py,sha256=-Qtqr2FP8VcyYcA-Pzqa9ucSl1-nXudbNsv_qakSSco,9041
-langroid/agent/task.py,sha256=sFncTES0L_O2IpbnHRrNzad0HhtsbHoQ7j3Cjc9eTt0,49711
+langroid/agent/task.py,sha256=YlWCNWG7vX_HoMvhqoQzoEghNGJK8Yskx4pbnnWDpcc,50408
 langroid/agent/tool_message.py,sha256=2kPsQUwi3ZzINTUNj10huKnZLjLp5SXmefacTHx8QDc,8304
 langroid/agent/tools/__init__.py,sha256=q-maq3k2BXhPAU99G0H6-j_ozoRvx15I1RFpPVicQIU,304
 langroid/agent/tools/duckduckgo_search_tool.py,sha256=mLGhlgs6pwbYZIwrOs9shfh1dMBVT4DtkR29pYL3cCQ,1900
@@ -59,15 +59,15 @@ langroid/embedding_models/protoc/embeddings_pb2_grpc.py,sha256=9dYQqkW3JPyBpSEje
 langroid/embedding_models/remote_embeds.py,sha256=6_kjXByVbqhY9cGwl9R83ZcYC2km-nGieNNAo1McHaY,5151
 langroid/language_models/__init__.py,sha256=5L9ndEEC8iLJHjDJmYFTnv6-2-3xsxWUMHcugR8IeDs,821
 langroid/language_models/azure_openai.py,sha256=ncRCbKooqLVOY-PWQUIo9C3yTuKEFbAwyngXT_M4P7k,5989
-langroid/language_models/base.py,sha256=Yy_6TP9Qj5CmNtDVQfbcyfytCsvGyow0e1OeqhWGY0A,20638
+langroid/language_models/base.py,sha256=B6dX43ZR65mIvjD95W4RcfpT-WpmiuEcstR3eMrr56Y,21029
 langroid/language_models/config.py,sha256=5UF3DzO1a-Dfsc3vghE0XGq7g9t_xDsRCsuRiU4dgBg,366
 langroid/language_models/openai_assistants.py,sha256=9K-DEAL2aSWHeXj2hwCo2RAlK9_1oCPtqX2u1wISCj8,36
-langroid/language_models/openai_gpt.py,sha256=3W0gi7_Ja0c0vuT8SDv8ioOWXyUKs7zJORx8BV-QT2g,49672
+langroid/language_models/openai_gpt.py,sha256=hR0ibmumIq1TnOGdb80SW0EN6YZn6DZazd5waFHKqGk,49357
 langroid/language_models/prompt_formatter/__init__.py,sha256=9JXFF22QNMmbQV1q4nrIeQVTtA3Tx8tEZABLtLBdFyc,352
 langroid/language_models/prompt_formatter/base.py,sha256=eDS1sgRNZVnoajwV_ZIha6cba5Dt8xjgzdRbPITwx3Q,1221
 langroid/language_models/prompt_formatter/hf_formatter.py,sha256=TFL6ppmeQWnzr6CKQzRZFYY810zE1mr8DZnhw6i85ok,5217
 langroid/language_models/prompt_formatter/llama2_formatter.py,sha256=YdcO88qyBeuMENVIVvVqSYuEpvYSTndUe_jd6hVTko4,2899
-langroid/language_models/utils.py,sha256=u-VZImPsEKFc10yI-AfRhKkU9_RVCVqyQbwzR2Xc_WE,4758
+langroid/language_models/utils.py,sha256=j8xEEm__-2b9eql1oTiWQk5dHW59UwmrRKs5kMHaGGo,4803
 langroid/mytypes.py,sha256=opL488mtHKob1uJeK_h1-kNjU5GZwkgCfXhBQCsONWU,2614
 langroid/parsing/__init__.py,sha256=2O5HOW8nDE3v-JInc5z2wIbFGejf4h5ZTdPqxsFtaWE,870
 langroid/parsing/agent_chats.py,sha256=sbZRV9ujdM5QXvvuHVjIi2ysYSYlap-uqfMMUKulrW0,1068
@@ -120,7 +120,7 @@ langroid/vector_store/meilisearch.py,sha256=d2huA9P-NoYRuAQ9ZeXJmMKr7ry8u90RUSR2
 langroid/vector_store/momento.py,sha256=9cui31TTrILid2KIzUpBkN2Ey3g_CZWOQVdaFsA4Ors,10045
 langroid/vector_store/qdrant_cloud.py,sha256=3im4Mip0QXLkR6wiqVsjV1QvhSElfxdFSuDKddBDQ-4,188
 langroid/vector_store/qdrantdb.py,sha256=foKRxRv0BBony6S4Vt0Vav9Rn9HMxZvcIh1cE7nosFE,13524
-langroid-0.1.229.dist-info/LICENSE,sha256=EgVbvA6VSYgUlvC3RvPKehSg7MFaxWDsFuzLOsPPfJg,1065
-langroid-0.1.229.dist-info/METADATA,sha256=2FXDkWjDrhYNvrCDCdshNanmBCAzW8N1t_4UUR9iNVI,47863
-langroid-0.1.229.dist-info/WHEEL,sha256=FMvqSimYX_P7y0a7UY-_Mc83r5zkBZsCYPm7Lr0Bsq4,88
-langroid-0.1.229.dist-info/RECORD,,
+langroid-0.1.231.dist-info/LICENSE,sha256=EgVbvA6VSYgUlvC3RvPKehSg7MFaxWDsFuzLOsPPfJg,1065
+langroid-0.1.231.dist-info/METADATA,sha256=uomAdAunAEaqZaWqjmDyaOsL_WN_J4AYH06YNnFNREQ,47863
+langroid-0.1.231.dist-info/WHEEL,sha256=FMvqSimYX_P7y0a7UY-_Mc83r5zkBZsCYPm7Lr0Bsq4,88
+langroid-0.1.231.dist-info/RECORD,,

{langroid-0.1.229.dist-info → langroid-0.1.231.dist-info}/LICENSE RENAMED Viewed

File without changes

{langroid-0.1.229.dist-info → langroid-0.1.231.dist-info}/WHEEL RENAMED Viewed

File without changes

langroid 0.1.229__py3-none-any.whl → 0.1.231__py3-none-any.whl

langroid 0.1.229__py3-none-any.whl → 0.1.231__py3-none-any.whl